diff --git "a/sf_log.txt" "b/sf_log.txt" new file mode 100644--- /dev/null +++ "b/sf_log.txt" @@ -0,0 +1,26690 @@ +[2023-10-08 15:41:17,629][19739] Saving configuration to ./train_atari/atari_atlantis_APPO/config.json... +[2023-10-08 15:41:17,895][19739] Rollout worker 0 uses device cpu +[2023-10-08 15:41:17,896][19739] Rollout worker 1 uses device cpu +[2023-10-08 15:41:17,896][19739] Rollout worker 2 uses device cpu +[2023-10-08 15:41:17,897][19739] Rollout worker 3 uses device cpu +[2023-10-08 15:41:17,897][19739] Rollout worker 4 uses device cpu +[2023-10-08 15:41:17,898][19739] Rollout worker 5 uses device cpu +[2023-10-08 15:41:17,898][19739] Rollout worker 6 uses device cpu +[2023-10-08 15:41:17,899][19739] Rollout worker 7 uses device cpu +[2023-10-08 15:41:17,899][19739] Rollout worker 8 uses device cpu +[2023-10-08 15:41:17,899][19739] Rollout worker 9 uses device cpu +[2023-10-08 15:41:17,900][19739] Rollout worker 10 uses device cpu +[2023-10-08 15:41:17,900][19739] Rollout worker 11 uses device cpu +[2023-10-08 15:41:17,901][19739] Rollout worker 12 uses device cpu +[2023-10-08 15:41:17,901][19739] Rollout worker 13 uses device cpu +[2023-10-08 15:41:17,901][19739] Rollout worker 14 uses device cpu +[2023-10-08 15:41:17,902][19739] Rollout worker 15 uses device cpu +[2023-10-08 15:41:18,190][19739] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 15:41:18,191][19739] InferenceWorker_p0-w0: min num requests: 2 +[2023-10-08 15:41:18,194][19739] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-10-08 15:41:18,194][19739] InferenceWorker_p1-w0: min num requests: 2 +[2023-10-08 15:41:18,241][19739] Starting all processes... +[2023-10-08 15:41:18,241][19739] Starting process learner_proc0 +[2023-10-08 15:41:19,910][19739] Starting process learner_proc1 +[2023-10-08 15:41:19,913][20740] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 15:41:19,913][20740] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-10-08 15:41:19,931][20740] Num visible devices: 1 +[2023-10-08 15:41:19,947][20740] Setting fixed seed 1234 +[2023-10-08 15:41:19,948][20740] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 15:41:19,948][20740] Initializing actor-critic model on device cuda:0 +[2023-10-08 15:41:19,948][20740] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 15:41:19,949][20740] RunningMeanStd input shape: (1,) +[2023-10-08 15:41:19,960][20740] ConvEncoder: input_channels=4 +[2023-10-08 15:41:20,137][20740] Conv encoder output size: 512 +[2023-10-08 15:41:20,139][20740] Created Actor Critic model with architecture: +[2023-10-08 15:41:20,139][20740] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): MultiInputEncoder( + (encoders): ModuleDict( + (obs): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ReLU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ReLU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ReLU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ReLU) + ) + ) + ) + ) + ) + (core): ModelCoreIdentity() + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=4, bias=True) + ) +) +[2023-10-08 15:41:20,696][20740] Using optimizer +[2023-10-08 15:41:20,697][20740] No checkpoints found +[2023-10-08 15:41:20,697][20740] Did not load from checkpoint, starting from scratch! +[2023-10-08 15:41:20,697][20740] Initialized policy 0 weights for model version 0 +[2023-10-08 15:41:20,699][20740] LearnerWorker_p0 finished initialization! +[2023-10-08 15:41:20,699][20740] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 15:41:21,674][19739] Starting all processes... +[2023-10-08 15:41:21,677][20836] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-10-08 15:41:21,678][20836] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-10-08 15:41:21,682][19739] Starting process inference_proc0-0 +[2023-10-08 15:41:21,682][19739] Starting process inference_proc1-0 +[2023-10-08 15:41:21,683][19739] Starting process rollout_proc0 +[2023-10-08 15:41:21,683][19739] Starting process rollout_proc1 +[2023-10-08 15:41:21,683][19739] Starting process rollout_proc2 +[2023-10-08 15:41:21,696][20836] Num visible devices: 1 +[2023-10-08 15:41:21,683][19739] Starting process rollout_proc3 +[2023-10-08 15:41:21,684][19739] Starting process rollout_proc4 +[2023-10-08 15:41:21,686][19739] Starting process rollout_proc5 +[2023-10-08 15:41:21,720][20836] Setting fixed seed 1234 +[2023-10-08 15:41:21,688][19739] Starting process rollout_proc6 +[2023-10-08 15:41:21,722][20836] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-10-08 15:41:21,722][20836] Initializing actor-critic model on device cuda:0 +[2023-10-08 15:41:21,722][20836] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 15:41:21,723][20836] RunningMeanStd input shape: (1,) +[2023-10-08 15:41:21,689][19739] Starting process rollout_proc7 +[2023-10-08 15:41:21,692][19739] Starting process rollout_proc8 +[2023-10-08 15:41:21,694][19739] Starting process rollout_proc9 +[2023-10-08 15:41:21,694][19739] Starting process rollout_proc10 +[2023-10-08 15:41:21,698][19739] Starting process rollout_proc11 +[2023-10-08 15:41:21,735][20836] ConvEncoder: input_channels=4 +[2023-10-08 15:41:21,698][19739] Starting process rollout_proc12 +[2023-10-08 15:41:21,700][19739] Starting process rollout_proc13 +[2023-10-08 15:41:22,217][20836] Conv encoder output size: 512 +[2023-10-08 15:41:22,220][20836] Created Actor Critic model with architecture: +[2023-10-08 15:41:22,220][20836] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): MultiInputEncoder( + (encoders): ModuleDict( + (obs): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ReLU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ReLU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ReLU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ReLU) + ) + ) + ) + ) + ) + (core): ModelCoreIdentity() + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=4, bias=True) + ) +) +[2023-10-08 15:41:22,828][20836] Using optimizer +[2023-10-08 15:41:22,829][20836] No checkpoints found +[2023-10-08 15:41:22,829][20836] Did not load from checkpoint, starting from scratch! +[2023-10-08 15:41:22,830][20836] Initialized policy 1 weights for model version 0 +[2023-10-08 15:41:22,831][20836] LearnerWorker_p1 finished initialization! +[2023-10-08 15:41:22,831][20836] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-10-08 15:41:23,874][19739] Starting process rollout_proc14 +[2023-10-08 15:41:23,879][21195] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 15:41:23,880][21195] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-10-08 15:41:23,898][21195] Num visible devices: 1 +[2023-10-08 15:41:23,898][19739] Starting process rollout_proc15 +[2023-10-08 15:41:23,905][21234] Worker 0 uses CPU cores [0, 1] +[2023-10-08 15:41:23,919][21232] Worker 2 uses CPU cores [4, 5] +[2023-10-08 15:41:24,007][21239] Worker 9 uses CPU cores [18, 19] +[2023-10-08 15:41:24,104][21229] Worker 1 uses CPU cores [2, 3] +[2023-10-08 15:41:24,146][21238] Worker 8 uses CPU cores [16, 17] +[2023-10-08 15:41:24,215][21194] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-10-08 15:41:24,216][21194] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-10-08 15:41:24,235][21230] Worker 3 uses CPU cores [6, 7] +[2023-10-08 15:41:24,238][21194] Num visible devices: 1 +[2023-10-08 15:41:24,243][21240] Worker 11 uses CPU cores [22, 23] +[2023-10-08 15:41:24,246][21237] Worker 6 uses CPU cores [12, 13] +[2023-10-08 15:41:24,354][21236] Worker 5 uses CPU cores [10, 11] +[2023-10-08 15:41:24,392][21242] Worker 12 uses CPU cores [24, 25] +[2023-10-08 15:41:24,402][21233] Worker 7 uses CPU cores [14, 15] +[2023-10-08 15:41:24,441][21235] Worker 4 uses CPU cores [8, 9] +[2023-10-08 15:41:24,477][21243] Worker 13 uses CPU cores [26, 27] +[2023-10-08 15:41:24,492][21241] Worker 10 uses CPU cores [20, 21] +[2023-10-08 15:41:24,610][21195] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 15:41:24,610][21195] RunningMeanStd input shape: (1,) +[2023-10-08 15:41:24,622][21195] ConvEncoder: input_channels=4 +[2023-10-08 15:41:24,727][21195] Conv encoder output size: 512 +[2023-10-08 15:41:24,841][21194] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 15:41:24,842][21194] RunningMeanStd input shape: (1,) +[2023-10-08 15:41:24,852][21194] ConvEncoder: input_channels=4 +[2023-10-08 15:41:24,949][21194] Conv encoder output size: 512 +[2023-10-08 15:41:25,812][21924] Worker 15 uses CPU cores [30, 31] +[2023-10-08 15:41:25,851][19739] Inference worker 0-0 is ready! +[2023-10-08 15:41:25,852][19739] Inference worker 1-0 is ready! +[2023-10-08 15:41:25,852][19739] All inference workers are ready! Signal rollout workers to start! +[2023-10-08 15:41:25,853][21233] EnvRunner 7-0 uses policy 1 +[2023-10-08 15:41:25,853][21237] EnvRunner 6-0 uses policy 0 +[2023-10-08 15:41:25,853][21230] EnvRunner 3-0 uses policy 1 +[2023-10-08 15:41:25,853][19739] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-10-08 15:41:25,853][21236] EnvRunner 5-0 uses policy 1 +[2023-10-08 15:41:25,853][21238] EnvRunner 8-0 uses policy 0 +[2023-10-08 15:41:25,853][21234] EnvRunner 0-0 uses policy 0 +[2023-10-08 15:41:25,853][21235] EnvRunner 4-0 uses policy 0 +[2023-10-08 15:41:25,853][21241] EnvRunner 10-0 uses policy 0 +[2023-10-08 15:41:25,853][21229] EnvRunner 1-0 uses policy 1 +[2023-10-08 15:41:25,854][21239] EnvRunner 9-0 uses policy 1 +[2023-10-08 15:41:25,854][21232] EnvRunner 2-0 uses policy 0 +[2023-10-08 15:41:25,854][21242] EnvRunner 12-0 uses policy 0 +[2023-10-08 15:41:25,854][21243] EnvRunner 13-0 uses policy 1 +[2023-10-08 15:41:25,853][21240] EnvRunner 11-0 uses policy 1 +[2023-10-08 15:41:25,854][21886] Worker 14 uses CPU cores [28, 29] +[2023-10-08 15:41:25,996][21924] EnvRunner 15-0 uses policy 1 +[2023-10-08 15:41:26,040][21886] EnvRunner 14-0 uses policy 0 +[2023-10-08 15:41:28,178][19739] Heartbeat connected on Batcher_0 +[2023-10-08 15:41:28,181][19739] Heartbeat connected on LearnerWorker_p0 +[2023-10-08 15:41:28,184][19739] Heartbeat connected on Batcher_1 +[2023-10-08 15:41:28,186][19739] Heartbeat connected on LearnerWorker_p1 +[2023-10-08 15:41:28,192][19739] Heartbeat connected on InferenceWorker_p0-w0 +[2023-10-08 15:41:28,199][19739] Heartbeat connected on InferenceWorker_p1-w0 +[2023-10-08 15:41:28,201][19739] Heartbeat connected on RolloutWorker_w1 +[2023-10-08 15:41:28,201][19739] Heartbeat connected on RolloutWorker_w0 +[2023-10-08 15:41:28,204][19739] Heartbeat connected on RolloutWorker_w2 +[2023-10-08 15:41:28,209][19739] Heartbeat connected on RolloutWorker_w3 +[2023-10-08 15:41:28,209][19739] Heartbeat connected on RolloutWorker_w4 +[2023-10-08 15:41:28,212][19739] Heartbeat connected on RolloutWorker_w5 +[2023-10-08 15:41:28,218][19739] Heartbeat connected on RolloutWorker_w7 +[2023-10-08 15:41:28,220][19739] Heartbeat connected on RolloutWorker_w8 +[2023-10-08 15:41:28,220][19739] Heartbeat connected on RolloutWorker_w6 +[2023-10-08 15:41:28,223][19739] Heartbeat connected on RolloutWorker_w9 +[2023-10-08 15:41:28,226][19739] Heartbeat connected on RolloutWorker_w10 +[2023-10-08 15:41:28,228][19739] Heartbeat connected on RolloutWorker_w11 +[2023-10-08 15:41:28,231][19739] Heartbeat connected on RolloutWorker_w12 +[2023-10-08 15:41:28,238][19739] Heartbeat connected on RolloutWorker_w14 +[2023-10-08 15:41:28,239][19739] Heartbeat connected on RolloutWorker_w13 +[2023-10-08 15:41:28,240][19739] Heartbeat connected on RolloutWorker_w15 +[2023-10-08 15:41:28,803][19739] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 324.8, 1: 477.4. Samples: 2366. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-10-08 15:41:28,803][19739] Avg episode reward: [(0, '2.000'), (1, '2.000')] +[2023-10-08 15:41:33,803][19739] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 1477.9, 1: 940.5. Samples: 19224. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-10-08 15:41:33,803][19739] Avg episode reward: [(0, '4.756'), (1, '4.600')] +[2023-10-08 15:41:35,578][21194] Updated weights for policy 1, policy_version 10 (0.0010) +[2023-10-08 15:41:35,627][21195] Updated weights for policy 0, policy_version 10 (0.0008) +[2023-10-08 15:41:35,939][21194] Updated weights for policy 1, policy_version 20 (0.0008) +[2023-10-08 15:41:35,992][21195] Updated weights for policy 0, policy_version 20 (0.0008) +[2023-10-08 15:41:36,306][21194] Updated weights for policy 1, policy_version 30 (0.0007) +[2023-10-08 15:41:36,371][21195] Updated weights for policy 0, policy_version 30 (0.0007) +[2023-10-08 15:41:38,803][19739] Fps is (10 sec: 6553.6, 60 sec: 5060.9, 300 sec: 5060.9). Total num frames: 65536. Throughput: 0: 1186.0, 1: 1220.4. Samples: 31162. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:41:38,803][19739] Avg episode reward: [(0, '4.322'), (1, '3.796')] +[2023-10-08 15:41:38,846][21195] Updated weights for policy 0, policy_version 40 (0.0008) +[2023-10-08 15:41:39,025][21194] Updated weights for policy 1, policy_version 40 (0.0009) +[2023-10-08 15:41:39,221][21195] Updated weights for policy 0, policy_version 50 (0.0010) +[2023-10-08 15:41:39,402][21194] Updated weights for policy 1, policy_version 50 (0.0009) +[2023-10-08 15:41:39,586][21195] Updated weights for policy 0, policy_version 60 (0.0007) +[2023-10-08 15:41:39,761][21194] Updated weights for policy 1, policy_version 60 (0.0010) +[2023-10-08 15:41:43,047][21194] Updated weights for policy 1, policy_version 70 (0.0008) +[2023-10-08 15:41:43,084][21195] Updated weights for policy 0, policy_version 70 (0.0007) +[2023-10-08 15:41:43,408][21194] Updated weights for policy 1, policy_version 80 (0.0009) +[2023-10-08 15:41:43,449][21195] Updated weights for policy 0, policy_version 80 (0.0007) +[2023-10-08 15:41:43,777][21194] Updated weights for policy 1, policy_version 90 (0.0007) +[2023-10-08 15:41:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 7302.3, 300 sec: 7302.3). Total num frames: 131072. Throughput: 0: 1454.5, 1: 1450.3. Samples: 52140. Policy #0 lag: (min: 33.0, avg: 33.0, max: 33.0) +[2023-10-08 15:41:43,803][19739] Avg episode reward: [(0, '4.240'), (1, '3.270')] +[2023-10-08 15:41:43,822][21195] Updated weights for policy 0, policy_version 90 (0.0009) +[2023-10-08 15:41:47,542][21194] Updated weights for policy 1, policy_version 100 (0.0008) +[2023-10-08 15:41:47,555][21195] Updated weights for policy 0, policy_version 100 (0.0009) +[2023-10-08 15:41:47,898][21194] Updated weights for policy 1, policy_version 110 (0.0009) +[2023-10-08 15:41:47,921][21195] Updated weights for policy 0, policy_version 110 (0.0008) +[2023-10-08 15:41:48,269][21194] Updated weights for policy 1, policy_version 120 (0.0008) +[2023-10-08 15:41:48,294][21195] Updated weights for policy 0, policy_version 120 (0.0008) +[2023-10-08 15:41:48,802][19739] Fps is (10 sec: 19661.1, 60 sec: 11422.8, 300 sec: 11422.8). Total num frames: 262144. Throughput: 0: 1550.9, 1: 1350.0. Samples: 66574. Policy #0 lag: (min: 22.0, avg: 29.9, max: 54.0) +[2023-10-08 15:41:48,803][19739] Avg episode reward: [(0, '3.960'), (1, '4.050')] +[2023-10-08 15:41:48,804][20740] Saving new best policy, reward=3.960! +[2023-10-08 15:41:48,804][20836] Saving new best policy, reward=4.050! +[2023-10-08 15:41:52,230][21194] Updated weights for policy 1, policy_version 130 (0.0007) +[2023-10-08 15:41:52,248][21195] Updated weights for policy 0, policy_version 130 (0.0008) +[2023-10-08 15:41:52,596][21194] Updated weights for policy 1, policy_version 140 (0.0007) +[2023-10-08 15:41:52,616][21195] Updated weights for policy 0, policy_version 140 (0.0008) +[2023-10-08 15:41:52,959][21194] Updated weights for policy 1, policy_version 150 (0.0007) +[2023-10-08 15:41:52,985][21195] Updated weights for policy 0, policy_version 150 (0.0008) +[2023-10-08 15:41:53,328][21194] Updated weights for policy 1, policy_version 160 (0.0008) +[2023-10-08 15:41:53,358][21195] Updated weights for policy 0, policy_version 160 (0.0007) +[2023-10-08 15:41:53,802][19739] Fps is (10 sec: 19661.0, 60 sec: 11724.1, 300 sec: 11724.1). Total num frames: 327680. Throughput: 0: 1480.8, 1: 1482.7. Samples: 82826. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:41:53,803][19739] Avg episode reward: [(0, '4.690'), (1, '3.980')] +[2023-10-08 15:41:53,804][20740] Saving new best policy, reward=4.690! +[2023-10-08 15:41:57,231][21194] Updated weights for policy 1, policy_version 170 (0.0008) +[2023-10-08 15:41:57,393][21195] Updated weights for policy 0, policy_version 170 (0.0008) +[2023-10-08 15:41:57,595][21194] Updated weights for policy 1, policy_version 180 (0.0007) +[2023-10-08 15:41:57,763][21195] Updated weights for policy 0, policy_version 180 (0.0007) +[2023-10-08 15:41:57,957][21194] Updated weights for policy 1, policy_version 190 (0.0008) +[2023-10-08 15:41:58,134][21195] Updated weights for policy 0, policy_version 190 (0.0009) +[2023-10-08 15:41:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 11934.0, 300 sec: 11934.0). Total num frames: 393216. Throughput: 0: 1551.1, 1: 1546.0. Samples: 102046. Policy #0 lag: (min: 31.0, avg: 41.4, max: 63.0) +[2023-10-08 15:41:58,803][19739] Avg episode reward: [(0, '4.750'), (1, '4.650')] +[2023-10-08 15:41:58,810][20740] Saving new best policy, reward=4.750! +[2023-10-08 15:41:58,810][20836] Saving new best policy, reward=4.650! +[2023-10-08 15:42:01,927][21194] Updated weights for policy 1, policy_version 200 (0.0007) +[2023-10-08 15:42:02,124][21195] Updated weights for policy 0, policy_version 200 (0.0009) +[2023-10-08 15:42:02,296][21194] Updated weights for policy 1, policy_version 210 (0.0009) +[2023-10-08 15:42:02,495][21195] Updated weights for policy 0, policy_version 210 (0.0007) +[2023-10-08 15:42:02,666][21194] Updated weights for policy 1, policy_version 220 (0.0009) +[2023-10-08 15:42:02,863][21195] Updated weights for policy 0, policy_version 220 (0.0008) +[2023-10-08 15:42:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 12088.5, 300 sec: 12088.5). Total num frames: 458752. Throughput: 0: 1614.6, 1: 1498.2. Samples: 118128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:42:03,804][19739] Avg episode reward: [(0, '3.880'), (1, '4.730')] +[2023-10-08 15:42:03,806][20836] Saving new best policy, reward=4.730! +[2023-10-08 15:42:06,693][21195] Updated weights for policy 0, policy_version 230 (0.0008) +[2023-10-08 15:42:06,739][21194] Updated weights for policy 1, policy_version 230 (0.0009) +[2023-10-08 15:42:07,054][21195] Updated weights for policy 0, policy_version 240 (0.0007) +[2023-10-08 15:42:07,108][21194] Updated weights for policy 1, policy_version 240 (0.0010) +[2023-10-08 15:42:07,432][21195] Updated weights for policy 0, policy_version 250 (0.0007) +[2023-10-08 15:42:07,475][21194] Updated weights for policy 1, policy_version 250 (0.0008) +[2023-10-08 15:42:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 12207.1, 300 sec: 12207.1). Total num frames: 524288. Throughput: 0: 1557.8, 1: 1557.8. Samples: 133814. Policy #0 lag: (min: 4.0, avg: 11.9, max: 36.0) +[2023-10-08 15:42:08,803][19739] Avg episode reward: [(0, '3.830'), (1, '4.430')] +[2023-10-08 15:42:11,402][21194] Updated weights for policy 1, policy_version 260 (0.0007) +[2023-10-08 15:42:11,427][21195] Updated weights for policy 0, policy_version 260 (0.0009) +[2023-10-08 15:42:11,761][21194] Updated weights for policy 1, policy_version 270 (0.0009) +[2023-10-08 15:42:11,799][21195] Updated weights for policy 0, policy_version 270 (0.0009) +[2023-10-08 15:42:12,128][21194] Updated weights for policy 1, policy_version 280 (0.0008) +[2023-10-08 15:42:12,168][21195] Updated weights for policy 0, policy_version 280 (0.0007) +[2023-10-08 15:42:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 12301.0, 300 sec: 12301.0). Total num frames: 589824. Throughput: 0: 1678.4, 1: 1673.4. Samples: 153196. Policy #0 lag: (min: 31.0, avg: 37.6, max: 63.0) +[2023-10-08 15:42:13,803][19739] Avg episode reward: [(0, '4.470'), (1, '4.640')] +[2023-10-08 15:42:16,127][21195] Updated weights for policy 0, policy_version 290 (0.0009) +[2023-10-08 15:42:16,186][21194] Updated weights for policy 1, policy_version 290 (0.0008) +[2023-10-08 15:42:16,502][21195] Updated weights for policy 0, policy_version 300 (0.0008) +[2023-10-08 15:42:16,603][21194] Updated weights for policy 1, policy_version 300 (0.0007) +[2023-10-08 15:42:16,858][21195] Updated weights for policy 0, policy_version 310 (0.0008) +[2023-10-08 15:42:16,972][21194] Updated weights for policy 1, policy_version 310 (0.0008) +[2023-10-08 15:42:17,231][21195] Updated weights for policy 0, policy_version 320 (0.0008) +[2023-10-08 15:42:17,333][21194] Updated weights for policy 1, policy_version 320 (0.0007) +[2023-10-08 15:42:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 12377.1, 300 sec: 12377.1). Total num frames: 655360. Throughput: 0: 1673.8, 1: 1671.2. Samples: 169746. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 15:42:18,803][19739] Avg episode reward: [(0, '4.660'), (1, '5.280')] +[2023-10-08 15:42:18,804][20836] Saving new best policy, reward=5.280! +[2023-10-08 15:42:21,165][21195] Updated weights for policy 0, policy_version 330 (0.0008) +[2023-10-08 15:42:21,346][21194] Updated weights for policy 1, policy_version 330 (0.0007) +[2023-10-08 15:42:21,530][21195] Updated weights for policy 0, policy_version 340 (0.0007) +[2023-10-08 15:42:21,710][21194] Updated weights for policy 1, policy_version 340 (0.0008) +[2023-10-08 15:42:21,903][21195] Updated weights for policy 0, policy_version 350 (0.0010) +[2023-10-08 15:42:22,075][21194] Updated weights for policy 1, policy_version 350 (0.0007) +[2023-10-08 15:42:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 12440.1, 300 sec: 12440.1). Total num frames: 720896. Throughput: 0: 1703.4, 1: 1693.5. Samples: 184024. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 15:42:23,804][19739] Avg episode reward: [(0, '4.040'), (1, '5.310')] +[2023-10-08 15:42:23,805][20836] Saving new best policy, reward=5.310! +[2023-10-08 15:42:25,950][21195] Updated weights for policy 0, policy_version 360 (0.0009) +[2023-10-08 15:42:26,050][21194] Updated weights for policy 1, policy_version 360 (0.0007) +[2023-10-08 15:42:26,321][21195] Updated weights for policy 0, policy_version 370 (0.0009) +[2023-10-08 15:42:26,406][21194] Updated weights for policy 1, policy_version 370 (0.0008) +[2023-10-08 15:42:26,692][21195] Updated weights for policy 0, policy_version 380 (0.0007) +[2023-10-08 15:42:26,782][21194] Updated weights for policy 1, policy_version 380 (0.0008) +[2023-10-08 15:42:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 12493.1). Total num frames: 786432. Throughput: 0: 1693.7, 1: 1698.1. Samples: 204772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:42:28,803][19739] Avg episode reward: [(0, '4.530'), (1, '4.870')] +[2023-10-08 15:42:30,589][21195] Updated weights for policy 0, policy_version 390 (0.0008) +[2023-10-08 15:42:30,813][21194] Updated weights for policy 1, policy_version 390 (0.0009) +[2023-10-08 15:42:30,967][21195] Updated weights for policy 0, policy_version 400 (0.0008) +[2023-10-08 15:42:31,181][21194] Updated weights for policy 1, policy_version 400 (0.0009) +[2023-10-08 15:42:31,334][21195] Updated weights for policy 0, policy_version 410 (0.0007) +[2023-10-08 15:42:31,553][21194] Updated weights for policy 1, policy_version 410 (0.0008) +[2023-10-08 15:42:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 12538.3). Total num frames: 851968. Throughput: 0: 1723.6, 1: 1710.4. Samples: 221104. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 15:42:33,803][19739] Avg episode reward: [(0, '4.260'), (1, '4.600')] +[2023-10-08 15:42:35,171][21195] Updated weights for policy 0, policy_version 420 (0.0009) +[2023-10-08 15:42:35,350][21194] Updated weights for policy 1, policy_version 420 (0.0007) +[2023-10-08 15:42:35,538][21195] Updated weights for policy 0, policy_version 430 (0.0008) +[2023-10-08 15:42:35,706][21194] Updated weights for policy 1, policy_version 430 (0.0007) +[2023-10-08 15:42:35,904][21195] Updated weights for policy 0, policy_version 440 (0.0009) +[2023-10-08 15:42:36,065][21194] Updated weights for policy 1, policy_version 440 (0.0008) +[2023-10-08 15:42:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 12577.3). Total num frames: 917504. Throughput: 0: 1703.0, 1: 1700.8. Samples: 235994. Policy #0 lag: (min: 31.0, avg: 37.3, max: 63.0) +[2023-10-08 15:42:38,803][19739] Avg episode reward: [(0, '4.090'), (1, '4.410')] +[2023-10-08 15:42:39,702][21195] Updated weights for policy 0, policy_version 450 (0.0008) +[2023-10-08 15:42:39,938][21194] Updated weights for policy 1, policy_version 450 (0.0008) +[2023-10-08 15:42:40,070][21195] Updated weights for policy 0, policy_version 460 (0.0008) +[2023-10-08 15:42:40,312][21194] Updated weights for policy 1, policy_version 460 (0.0007) +[2023-10-08 15:42:40,438][21195] Updated weights for policy 0, policy_version 470 (0.0008) +[2023-10-08 15:42:40,675][21194] Updated weights for policy 1, policy_version 470 (0.0009) +[2023-10-08 15:42:40,811][21195] Updated weights for policy 0, policy_version 480 (0.0008) +[2023-10-08 15:42:41,048][21194] Updated weights for policy 1, policy_version 480 (0.0011) +[2023-10-08 15:42:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 12611.3). Total num frames: 983040. Throughput: 0: 1729.5, 1: 1728.4. Samples: 257650. Policy #0 lag: (min: 1.0, avg: 1.4, max: 12.0) +[2023-10-08 15:42:43,803][19739] Avg episode reward: [(0, '4.460'), (1, '5.270')] +[2023-10-08 15:42:44,598][21195] Updated weights for policy 0, policy_version 490 (0.0008) +[2023-10-08 15:42:44,967][21195] Updated weights for policy 0, policy_version 500 (0.0009) +[2023-10-08 15:42:45,033][21194] Updated weights for policy 1, policy_version 490 (0.0007) +[2023-10-08 15:42:45,337][21195] Updated weights for policy 0, policy_version 510 (0.0008) +[2023-10-08 15:42:45,393][21194] Updated weights for policy 1, policy_version 500 (0.0007) +[2023-10-08 15:42:45,760][21194] Updated weights for policy 1, policy_version 510 (0.0009) +[2023-10-08 15:42:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 12641.1). Total num frames: 1048576. Throughput: 0: 1741.3, 1: 1702.9. Samples: 273116. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 15:42:48,804][19739] Avg episode reward: [(0, '4.320'), (1, '5.190')] +[2023-10-08 15:42:49,414][21195] Updated weights for policy 0, policy_version 520 (0.0008) +[2023-10-08 15:42:49,782][21195] Updated weights for policy 0, policy_version 530 (0.0008) +[2023-10-08 15:42:49,890][21194] Updated weights for policy 1, policy_version 520 (0.0010) +[2023-10-08 15:42:50,152][21195] Updated weights for policy 0, policy_version 540 (0.0008) +[2023-10-08 15:42:50,258][21194] Updated weights for policy 1, policy_version 530 (0.0008) +[2023-10-08 15:42:50,627][21194] Updated weights for policy 1, policy_version 540 (0.0007) +[2023-10-08 15:42:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 12667.7). Total num frames: 1114112. Throughput: 0: 1721.9, 1: 1709.6. Samples: 288228. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:42:53,803][19739] Avg episode reward: [(0, '5.140'), (1, '5.430')] +[2023-10-08 15:42:53,804][20836] Saving new best policy, reward=5.430! +[2023-10-08 15:42:54,040][21195] Updated weights for policy 0, policy_version 550 (0.0007) +[2023-10-08 15:42:54,413][21195] Updated weights for policy 0, policy_version 560 (0.0009) +[2023-10-08 15:42:54,545][21194] Updated weights for policy 1, policy_version 550 (0.0008) +[2023-10-08 15:42:54,775][21195] Updated weights for policy 0, policy_version 570 (0.0009) +[2023-10-08 15:42:54,910][21194] Updated weights for policy 1, policy_version 560 (0.0007) +[2023-10-08 15:42:54,998][20740] Saving new best policy, reward=5.140! +[2023-10-08 15:42:55,273][21194] Updated weights for policy 1, policy_version 570 (0.0009) +[2023-10-08 15:42:58,604][21195] Updated weights for policy 0, policy_version 580 (0.0008) +[2023-10-08 15:42:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 12691.3). Total num frames: 1179648. Throughput: 0: 1754.1, 1: 1727.6. Samples: 309874. Policy #0 lag: (min: 31.0, avg: 37.3, max: 63.0) +[2023-10-08 15:42:58,803][19739] Avg episode reward: [(0, '4.840'), (1, '5.350')] +[2023-10-08 15:42:58,972][21195] Updated weights for policy 0, policy_version 590 (0.0007) +[2023-10-08 15:42:59,267][21194] Updated weights for policy 1, policy_version 580 (0.0007) +[2023-10-08 15:42:59,352][21195] Updated weights for policy 0, policy_version 600 (0.0009) +[2023-10-08 15:42:59,634][21194] Updated weights for policy 1, policy_version 590 (0.0008) +[2023-10-08 15:43:00,008][21194] Updated weights for policy 1, policy_version 600 (0.0008) +[2023-10-08 15:43:03,368][21195] Updated weights for policy 0, policy_version 610 (0.0010) +[2023-10-08 15:43:03,730][21195] Updated weights for policy 0, policy_version 620 (0.0008) +[2023-10-08 15:43:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 12712.5). Total num frames: 1245184. Throughput: 0: 1744.3, 1: 1696.4. Samples: 324580. Policy #0 lag: (min: 17.0, avg: 18.5, max: 43.0) +[2023-10-08 15:43:03,803][19739] Avg episode reward: [(0, '4.250'), (1, '5.060')] +[2023-10-08 15:43:04,061][21194] Updated weights for policy 1, policy_version 610 (0.0008) +[2023-10-08 15:43:04,104][21195] Updated weights for policy 0, policy_version 630 (0.0008) +[2023-10-08 15:43:04,467][21194] Updated weights for policy 1, policy_version 620 (0.0007) +[2023-10-08 15:43:04,472][21195] Updated weights for policy 0, policy_version 640 (0.0009) +[2023-10-08 15:43:04,840][21194] Updated weights for policy 1, policy_version 630 (0.0007) +[2023-10-08 15:43:05,201][21194] Updated weights for policy 1, policy_version 640 (0.0008) +[2023-10-08 15:43:08,369][21195] Updated weights for policy 0, policy_version 650 (0.0007) +[2023-10-08 15:43:08,744][21195] Updated weights for policy 0, policy_version 660 (0.0008) +[2023-10-08 15:43:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 12731.7). Total num frames: 1310720. Throughput: 0: 1749.1, 1: 1731.5. Samples: 340650. Policy #0 lag: (min: 28.0, avg: 33.2, max: 60.0) +[2023-10-08 15:43:08,803][19739] Avg episode reward: [(0, '4.560'), (1, '5.660')] +[2023-10-08 15:43:09,067][21194] Updated weights for policy 1, policy_version 650 (0.0009) +[2023-10-08 15:43:09,111][21195] Updated weights for policy 0, policy_version 670 (0.0007) +[2023-10-08 15:43:09,443][21194] Updated weights for policy 1, policy_version 660 (0.0010) +[2023-10-08 15:43:09,809][21194] Updated weights for policy 1, policy_version 670 (0.0008) +[2023-10-08 15:43:09,878][20836] Saving new best policy, reward=5.660! +[2023-10-08 15:43:13,188][21195] Updated weights for policy 0, policy_version 680 (0.0009) +[2023-10-08 15:43:13,562][21195] Updated weights for policy 0, policy_version 690 (0.0008) +[2023-10-08 15:43:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 12749.1). Total num frames: 1376256. Throughput: 0: 1759.4, 1: 1735.4. Samples: 362040. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:43:13,803][19739] Avg episode reward: [(0, '5.340'), (1, '5.890')] +[2023-10-08 15:43:13,810][21194] Updated weights for policy 1, policy_version 680 (0.0008) +[2023-10-08 15:43:13,927][21195] Updated weights for policy 0, policy_version 700 (0.0007) +[2023-10-08 15:43:14,078][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000000704_720896.pth... +[2023-10-08 15:43:14,108][20740] Saving new best policy, reward=5.340! +[2023-10-08 15:43:14,189][21194] Updated weights for policy 1, policy_version 690 (0.0009) +[2023-10-08 15:43:14,562][21194] Updated weights for policy 1, policy_version 700 (0.0011) +[2023-10-08 15:43:14,701][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000000704_720896.pth... +[2023-10-08 15:43:14,730][20836] Saving new best policy, reward=5.890! +[2023-10-08 15:43:17,618][21195] Updated weights for policy 0, policy_version 710 (0.0008) +[2023-10-08 15:43:17,994][21195] Updated weights for policy 0, policy_version 720 (0.0009) +[2023-10-08 15:43:18,354][21195] Updated weights for policy 0, policy_version 730 (0.0008) +[2023-10-08 15:43:18,362][21194] Updated weights for policy 1, policy_version 710 (0.0008) +[2023-10-08 15:43:18,740][21194] Updated weights for policy 1, policy_version 720 (0.0009) +[2023-10-08 15:43:18,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13055.1). Total num frames: 1474560. Throughput: 0: 1718.9, 1: 1714.5. Samples: 375608. Policy #0 lag: (min: 4.0, avg: 7.2, max: 36.0) +[2023-10-08 15:43:18,803][19739] Avg episode reward: [(0, '5.790'), (1, '5.650')] +[2023-10-08 15:43:18,804][20740] Saving new best policy, reward=5.790! +[2023-10-08 15:43:19,103][21194] Updated weights for policy 1, policy_version 730 (0.0009) +[2023-10-08 15:43:22,323][21195] Updated weights for policy 0, policy_version 740 (0.0008) +[2023-10-08 15:43:22,698][21195] Updated weights for policy 0, policy_version 750 (0.0010) +[2023-10-08 15:43:22,969][21194] Updated weights for policy 1, policy_version 740 (0.0007) +[2023-10-08 15:43:23,064][21195] Updated weights for policy 0, policy_version 760 (0.0008) +[2023-10-08 15:43:23,330][21194] Updated weights for policy 1, policy_version 750 (0.0008) +[2023-10-08 15:43:23,698][21194] Updated weights for policy 1, policy_version 760 (0.0007) +[2023-10-08 15:43:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13057.3). Total num frames: 1540096. Throughput: 0: 1747.4, 1: 1727.4. Samples: 392360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 36.0) +[2023-10-08 15:43:23,803][19739] Avg episode reward: [(0, '6.760'), (1, '6.210')] +[2023-10-08 15:43:23,804][20740] Saving new best policy, reward=6.760! +[2023-10-08 15:43:23,991][20836] Saving new best policy, reward=6.210! +[2023-10-08 15:43:27,123][21195] Updated weights for policy 0, policy_version 770 (0.0008) +[2023-10-08 15:43:27,492][21195] Updated weights for policy 0, policy_version 780 (0.0009) +[2023-10-08 15:43:27,581][21194] Updated weights for policy 1, policy_version 770 (0.0007) +[2023-10-08 15:43:27,867][21195] Updated weights for policy 0, policy_version 790 (0.0007) +[2023-10-08 15:43:27,940][21194] Updated weights for policy 1, policy_version 780 (0.0008) +[2023-10-08 15:43:28,238][21195] Updated weights for policy 0, policy_version 800 (0.0007) +[2023-10-08 15:43:28,312][21194] Updated weights for policy 1, policy_version 790 (0.0008) +[2023-10-08 15:43:28,675][21194] Updated weights for policy 1, policy_version 800 (0.0009) +[2023-10-08 15:43:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13325.8). Total num frames: 1638400. Throughput: 0: 1718.8, 1: 1719.0. Samples: 412352. Policy #0 lag: (min: 15.0, avg: 18.8, max: 47.0) +[2023-10-08 15:43:28,803][19739] Avg episode reward: [(0, '6.770'), (1, '6.540')] +[2023-10-08 15:43:28,810][20740] Saving new best policy, reward=6.770! +[2023-10-08 15:43:28,810][20836] Saving new best policy, reward=6.540! +[2023-10-08 15:43:32,209][21195] Updated weights for policy 0, policy_version 810 (0.0009) +[2023-10-08 15:43:32,556][21194] Updated weights for policy 1, policy_version 810 (0.0008) +[2023-10-08 15:43:32,586][21195] Updated weights for policy 0, policy_version 820 (0.0008) +[2023-10-08 15:43:32,922][21194] Updated weights for policy 1, policy_version 820 (0.0008) +[2023-10-08 15:43:32,964][21195] Updated weights for policy 0, policy_version 830 (0.0007) +[2023-10-08 15:43:33,290][21194] Updated weights for policy 1, policy_version 830 (0.0007) +[2023-10-08 15:43:33,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13317.3). Total num frames: 1703936. Throughput: 0: 1705.4, 1: 1732.7. Samples: 427828. Policy #0 lag: (min: 12.0, avg: 23.4, max: 44.0) +[2023-10-08 15:43:33,804][19739] Avg episode reward: [(0, '6.980'), (1, '6.140')] +[2023-10-08 15:43:33,805][20740] Saving new best policy, reward=6.980! +[2023-10-08 15:43:36,989][21195] Updated weights for policy 0, policy_version 840 (0.0009) +[2023-10-08 15:43:37,287][21194] Updated weights for policy 1, policy_version 840 (0.0009) +[2023-10-08 15:43:37,361][21195] Updated weights for policy 0, policy_version 850 (0.0009) +[2023-10-08 15:43:37,651][21194] Updated weights for policy 1, policy_version 850 (0.0010) +[2023-10-08 15:43:37,730][21195] Updated weights for policy 0, policy_version 860 (0.0008) +[2023-10-08 15:43:38,017][21194] Updated weights for policy 1, policy_version 860 (0.0008) +[2023-10-08 15:43:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13309.4). Total num frames: 1769472. Throughput: 0: 1728.9, 1: 1741.7. Samples: 444406. Policy #0 lag: (min: 8.0, avg: 33.3, max: 40.0) +[2023-10-08 15:43:38,803][19739] Avg episode reward: [(0, '6.620'), (1, '5.510')] +[2023-10-08 15:43:41,688][21195] Updated weights for policy 0, policy_version 870 (0.0009) +[2023-10-08 15:43:41,877][21194] Updated weights for policy 1, policy_version 870 (0.0010) +[2023-10-08 15:43:42,060][21195] Updated weights for policy 0, policy_version 880 (0.0009) +[2023-10-08 15:43:42,244][21194] Updated weights for policy 1, policy_version 880 (0.0007) +[2023-10-08 15:43:42,433][21195] Updated weights for policy 0, policy_version 890 (0.0008) +[2023-10-08 15:43:42,614][21194] Updated weights for policy 1, policy_version 890 (0.0007) +[2023-10-08 15:43:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13302.0). Total num frames: 1835008. Throughput: 0: 1692.7, 1: 1716.9. Samples: 463306. Policy #0 lag: (min: 16.0, avg: 36.2, max: 48.0) +[2023-10-08 15:43:43,803][19739] Avg episode reward: [(0, '5.280'), (1, '5.230')] +[2023-10-08 15:43:46,362][21195] Updated weights for policy 0, policy_version 900 (0.0009) +[2023-10-08 15:43:46,572][21194] Updated weights for policy 1, policy_version 900 (0.0007) +[2023-10-08 15:43:46,729][21195] Updated weights for policy 0, policy_version 910 (0.0010) +[2023-10-08 15:43:46,950][21194] Updated weights for policy 1, policy_version 910 (0.0009) +[2023-10-08 15:43:47,101][21195] Updated weights for policy 0, policy_version 920 (0.0009) +[2023-10-08 15:43:47,314][21194] Updated weights for policy 1, policy_version 920 (0.0010) +[2023-10-08 15:43:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13295.2). Total num frames: 1900544. Throughput: 0: 1703.5, 1: 1747.2. Samples: 479864. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 15:43:48,803][19739] Avg episode reward: [(0, '5.870'), (1, '6.240')] +[2023-10-08 15:43:51,207][21195] Updated weights for policy 0, policy_version 930 (0.0010) +[2023-10-08 15:43:51,423][21194] Updated weights for policy 1, policy_version 930 (0.0010) +[2023-10-08 15:43:51,572][21195] Updated weights for policy 0, policy_version 940 (0.0007) +[2023-10-08 15:43:51,810][21194] Updated weights for policy 1, policy_version 940 (0.0008) +[2023-10-08 15:43:51,932][21195] Updated weights for policy 0, policy_version 950 (0.0007) +[2023-10-08 15:43:52,174][21194] Updated weights for policy 1, policy_version 950 (0.0007) +[2023-10-08 15:43:52,312][21195] Updated weights for policy 0, policy_version 960 (0.0007) +[2023-10-08 15:43:52,543][21194] Updated weights for policy 1, policy_version 960 (0.0007) +[2023-10-08 15:43:53,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13288.9). Total num frames: 1966080. Throughput: 0: 1702.9, 1: 1723.0. Samples: 494816. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:43:53,803][19739] Avg episode reward: [(0, '5.810'), (1, '6.680')] +[2023-10-08 15:43:53,804][20836] Saving new best policy, reward=6.680! +[2023-10-08 15:43:56,210][21195] Updated weights for policy 0, policy_version 970 (0.0009) +[2023-10-08 15:43:56,520][21194] Updated weights for policy 1, policy_version 970 (0.0007) +[2023-10-08 15:43:56,574][21195] Updated weights for policy 0, policy_version 980 (0.0007) +[2023-10-08 15:43:56,897][21194] Updated weights for policy 1, policy_version 980 (0.0008) +[2023-10-08 15:43:56,949][21195] Updated weights for policy 0, policy_version 990 (0.0007) +[2023-10-08 15:43:57,272][21194] Updated weights for policy 1, policy_version 990 (0.0010) +[2023-10-08 15:43:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13282.9). Total num frames: 2031616. Throughput: 0: 1688.1, 1: 1709.6. Samples: 514938. Policy #0 lag: (min: 21.0, avg: 22.5, max: 48.0) +[2023-10-08 15:43:58,803][19739] Avg episode reward: [(0, '7.770'), (1, '7.380')] +[2023-10-08 15:43:58,811][20740] Saving new best policy, reward=7.770! +[2023-10-08 15:43:58,811][20836] Saving new best policy, reward=7.380! +[2023-10-08 15:44:00,923][21195] Updated weights for policy 0, policy_version 1000 (0.0009) +[2023-10-08 15:44:01,029][21194] Updated weights for policy 1, policy_version 1000 (0.0008) +[2023-10-08 15:44:01,302][21195] Updated weights for policy 0, policy_version 1010 (0.0010) +[2023-10-08 15:44:01,398][21194] Updated weights for policy 1, policy_version 1010 (0.0007) +[2023-10-08 15:44:01,663][21195] Updated weights for policy 0, policy_version 1020 (0.0008) +[2023-10-08 15:44:01,769][21194] Updated weights for policy 1, policy_version 1020 (0.0008) +[2023-10-08 15:44:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13277.4). Total num frames: 2097152. Throughput: 0: 1724.8, 1: 1738.2. Samples: 531444. Policy #0 lag: (min: 13.0, avg: 20.9, max: 45.0) +[2023-10-08 15:44:03,803][19739] Avg episode reward: [(0, '6.330'), (1, '7.160')] +[2023-10-08 15:44:05,609][21195] Updated weights for policy 0, policy_version 1030 (0.0010) +[2023-10-08 15:44:05,902][21194] Updated weights for policy 1, policy_version 1030 (0.0008) +[2023-10-08 15:44:05,981][21195] Updated weights for policy 0, policy_version 1040 (0.0007) +[2023-10-08 15:44:06,271][21194] Updated weights for policy 1, policy_version 1040 (0.0008) +[2023-10-08 15:44:06,344][21195] Updated weights for policy 0, policy_version 1050 (0.0007) +[2023-10-08 15:44:06,633][21194] Updated weights for policy 1, policy_version 1050 (0.0008) +[2023-10-08 15:44:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13272.2). Total num frames: 2162688. Throughput: 0: 1692.8, 1: 1713.2. Samples: 545632. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:44:08,803][19739] Avg episode reward: [(0, '6.360'), (1, '5.670')] +[2023-10-08 15:44:10,214][21195] Updated weights for policy 0, policy_version 1060 (0.0008) +[2023-10-08 15:44:10,581][21195] Updated weights for policy 0, policy_version 1070 (0.0011) +[2023-10-08 15:44:10,654][21194] Updated weights for policy 1, policy_version 1060 (0.0009) +[2023-10-08 15:44:10,949][21195] Updated weights for policy 0, policy_version 1080 (0.0009) +[2023-10-08 15:44:11,024][21194] Updated weights for policy 1, policy_version 1070 (0.0010) +[2023-10-08 15:44:11,392][21194] Updated weights for policy 1, policy_version 1080 (0.0009) +[2023-10-08 15:44:13,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13267.2). Total num frames: 2228224. Throughput: 0: 1721.7, 1: 1713.2. Samples: 566924. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:44:13,803][19739] Avg episode reward: [(0, '5.470'), (1, '5.720')] +[2023-10-08 15:44:14,808][21195] Updated weights for policy 0, policy_version 1090 (0.0009) +[2023-10-08 15:44:15,180][21195] Updated weights for policy 0, policy_version 1100 (0.0007) +[2023-10-08 15:44:15,485][21194] Updated weights for policy 1, policy_version 1090 (0.0008) +[2023-10-08 15:44:15,547][21195] Updated weights for policy 0, policy_version 1110 (0.0009) +[2023-10-08 15:44:15,855][21194] Updated weights for policy 1, policy_version 1100 (0.0008) +[2023-10-08 15:44:15,918][21195] Updated weights for policy 0, policy_version 1120 (0.0009) +[2023-10-08 15:44:16,220][21194] Updated weights for policy 1, policy_version 1110 (0.0008) +[2023-10-08 15:44:16,587][21194] Updated weights for policy 1, policy_version 1120 (0.0007) +[2023-10-08 15:44:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13262.6). Total num frames: 2293760. Throughput: 0: 1738.4, 1: 1711.0. Samples: 583050. Policy #0 lag: (min: 6.0, avg: 8.0, max: 38.0) +[2023-10-08 15:44:18,803][19739] Avg episode reward: [(0, '7.330'), (1, '6.900')] +[2023-10-08 15:44:19,797][21195] Updated weights for policy 0, policy_version 1130 (0.0007) +[2023-10-08 15:44:20,182][21195] Updated weights for policy 0, policy_version 1140 (0.0008) +[2023-10-08 15:44:20,552][21195] Updated weights for policy 0, policy_version 1150 (0.0010) +[2023-10-08 15:44:20,657][21194] Updated weights for policy 1, policy_version 1130 (0.0009) +[2023-10-08 15:44:21,032][21194] Updated weights for policy 1, policy_version 1140 (0.0008) +[2023-10-08 15:44:21,395][21194] Updated weights for policy 1, policy_version 1150 (0.0009) +[2023-10-08 15:44:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13258.2). Total num frames: 2359296. Throughput: 0: 1713.8, 1: 1690.2. Samples: 597586. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:44:23,803][19739] Avg episode reward: [(0, '7.740'), (1, '7.590')] +[2023-10-08 15:44:23,804][20836] Saving new best policy, reward=7.590! +[2023-10-08 15:44:24,471][21195] Updated weights for policy 0, policy_version 1160 (0.0010) +[2023-10-08 15:44:24,847][21195] Updated weights for policy 0, policy_version 1170 (0.0007) +[2023-10-08 15:44:25,129][21194] Updated weights for policy 1, policy_version 1160 (0.0009) +[2023-10-08 15:44:25,216][21195] Updated weights for policy 0, policy_version 1180 (0.0007) +[2023-10-08 15:44:25,492][21194] Updated weights for policy 1, policy_version 1170 (0.0009) +[2023-10-08 15:44:25,859][21194] Updated weights for policy 1, policy_version 1180 (0.0009) +[2023-10-08 15:44:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13254.1). Total num frames: 2424832. Throughput: 0: 1745.2, 1: 1720.4. Samples: 619260. Policy #0 lag: (min: 31.0, avg: 35.6, max: 63.0) +[2023-10-08 15:44:28,803][19739] Avg episode reward: [(0, '6.200'), (1, '7.550')] +[2023-10-08 15:44:29,163][21195] Updated weights for policy 0, policy_version 1190 (0.0008) +[2023-10-08 15:44:29,542][21195] Updated weights for policy 0, policy_version 1200 (0.0008) +[2023-10-08 15:44:29,838][21194] Updated weights for policy 1, policy_version 1190 (0.0008) +[2023-10-08 15:44:29,914][21195] Updated weights for policy 0, policy_version 1210 (0.0009) +[2023-10-08 15:44:30,200][21194] Updated weights for policy 1, policy_version 1200 (0.0008) +[2023-10-08 15:44:30,565][21194] Updated weights for policy 1, policy_version 1210 (0.0010) +[2023-10-08 15:44:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13250.2). Total num frames: 2490368. Throughput: 0: 1737.0, 1: 1692.5. Samples: 634192. Policy #0 lag: (min: 31.0, avg: 35.4, max: 63.0) +[2023-10-08 15:44:33,803][19739] Avg episode reward: [(0, '5.970'), (1, '5.700')] +[2023-10-08 15:44:33,833][21195] Updated weights for policy 0, policy_version 1220 (0.0009) +[2023-10-08 15:44:34,199][21195] Updated weights for policy 0, policy_version 1230 (0.0007) +[2023-10-08 15:44:34,405][21194] Updated weights for policy 1, policy_version 1220 (0.0008) +[2023-10-08 15:44:34,563][21195] Updated weights for policy 0, policy_version 1240 (0.0007) +[2023-10-08 15:44:34,775][21194] Updated weights for policy 1, policy_version 1230 (0.0008) +[2023-10-08 15:44:35,134][21194] Updated weights for policy 1, policy_version 1240 (0.0009) +[2023-10-08 15:44:38,416][21195] Updated weights for policy 0, policy_version 1250 (0.0008) +[2023-10-08 15:44:38,795][21195] Updated weights for policy 0, policy_version 1260 (0.0009) +[2023-10-08 15:44:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13246.5). Total num frames: 2555904. Throughput: 0: 1730.7, 1: 1708.7. Samples: 649586. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 15:44:38,803][19739] Avg episode reward: [(0, '6.050'), (1, '5.900')] +[2023-10-08 15:44:39,154][21195] Updated weights for policy 0, policy_version 1270 (0.0007) +[2023-10-08 15:44:39,260][21194] Updated weights for policy 1, policy_version 1250 (0.0009) +[2023-10-08 15:44:39,529][21195] Updated weights for policy 0, policy_version 1280 (0.0008) +[2023-10-08 15:44:39,649][21194] Updated weights for policy 1, policy_version 1260 (0.0009) +[2023-10-08 15:44:40,023][21194] Updated weights for policy 1, policy_version 1270 (0.0008) +[2023-10-08 15:44:40,394][21194] Updated weights for policy 1, policy_version 1280 (0.0009) +[2023-10-08 15:44:43,385][21195] Updated weights for policy 0, policy_version 1290 (0.0008) +[2023-10-08 15:44:43,763][21195] Updated weights for policy 0, policy_version 1300 (0.0009) +[2023-10-08 15:44:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13243.0). Total num frames: 2621440. Throughput: 0: 1748.8, 1: 1720.9. Samples: 671078. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:44:43,803][19739] Avg episode reward: [(0, '7.870'), (1, '5.690')] +[2023-10-08 15:44:44,132][21195] Updated weights for policy 0, policy_version 1310 (0.0010) +[2023-10-08 15:44:44,205][20740] Saving new best policy, reward=7.870! +[2023-10-08 15:44:44,258][21194] Updated weights for policy 1, policy_version 1290 (0.0008) +[2023-10-08 15:44:44,631][21194] Updated weights for policy 1, policy_version 1300 (0.0011) +[2023-10-08 15:44:45,003][21194] Updated weights for policy 1, policy_version 1310 (0.0011) +[2023-10-08 15:44:48,364][21195] Updated weights for policy 0, policy_version 1320 (0.0011) +[2023-10-08 15:44:48,733][21195] Updated weights for policy 0, policy_version 1330 (0.0007) +[2023-10-08 15:44:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13239.6). Total num frames: 2686976. Throughput: 0: 1726.4, 1: 1695.4. Samples: 685426. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 15:44:48,803][19739] Avg episode reward: [(0, '7.750'), (1, '6.970')] +[2023-10-08 15:44:49,114][21195] Updated weights for policy 0, policy_version 1340 (0.0009) +[2023-10-08 15:44:49,162][21194] Updated weights for policy 1, policy_version 1320 (0.0008) +[2023-10-08 15:44:49,537][21194] Updated weights for policy 1, policy_version 1330 (0.0008) +[2023-10-08 15:44:49,912][21194] Updated weights for policy 1, policy_version 1340 (0.0007) +[2023-10-08 15:44:52,954][21195] Updated weights for policy 0, policy_version 1350 (0.0007) +[2023-10-08 15:44:53,332][21195] Updated weights for policy 0, policy_version 1360 (0.0009) +[2023-10-08 15:44:53,704][21195] Updated weights for policy 0, policy_version 1370 (0.0007) +[2023-10-08 15:44:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13236.5). Total num frames: 2752512. Throughput: 0: 1746.4, 1: 1714.7. Samples: 701380. Policy #0 lag: (min: 28.0, avg: 31.3, max: 60.0) +[2023-10-08 15:44:53,803][19739] Avg episode reward: [(0, '7.160'), (1, '7.720')] +[2023-10-08 15:44:53,872][21194] Updated weights for policy 1, policy_version 1350 (0.0007) +[2023-10-08 15:44:54,242][21194] Updated weights for policy 1, policy_version 1360 (0.0007) +[2023-10-08 15:44:54,605][21194] Updated weights for policy 1, policy_version 1370 (0.0007) +[2023-10-08 15:44:54,821][20836] Saving new best policy, reward=7.720! +[2023-10-08 15:44:57,583][21195] Updated weights for policy 0, policy_version 1380 (0.0009) +[2023-10-08 15:44:57,965][21195] Updated weights for policy 0, policy_version 1390 (0.0008) +[2023-10-08 15:44:58,328][21195] Updated weights for policy 0, policy_version 1400 (0.0009) +[2023-10-08 15:44:58,467][21194] Updated weights for policy 1, policy_version 1380 (0.0007) +[2023-10-08 15:44:58,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13387.3). Total num frames: 2850816. Throughput: 0: 1733.5, 1: 1726.4. Samples: 722620. Policy #0 lag: (min: 10.0, avg: 13.0, max: 42.0) +[2023-10-08 15:44:58,803][19739] Avg episode reward: [(0, '6.150'), (1, '7.730')] +[2023-10-08 15:44:58,839][21194] Updated weights for policy 1, policy_version 1390 (0.0007) +[2023-10-08 15:44:59,215][21194] Updated weights for policy 1, policy_version 1400 (0.0008) +[2023-10-08 15:44:59,506][20836] Saving new best policy, reward=7.730! +[2023-10-08 15:45:02,353][21195] Updated weights for policy 0, policy_version 1410 (0.0010) +[2023-10-08 15:45:02,730][21195] Updated weights for policy 0, policy_version 1420 (0.0008) +[2023-10-08 15:45:03,100][21195] Updated weights for policy 0, policy_version 1430 (0.0007) +[2023-10-08 15:45:03,421][21194] Updated weights for policy 1, policy_version 1410 (0.0009) +[2023-10-08 15:45:03,469][21195] Updated weights for policy 0, policy_version 1440 (0.0007) +[2023-10-08 15:45:03,780][21194] Updated weights for policy 1, policy_version 1420 (0.0008) +[2023-10-08 15:45:03,802][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13380.9). Total num frames: 2916352. Throughput: 0: 1705.7, 1: 1709.7. Samples: 736746. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 15:45:03,803][19739] Avg episode reward: [(0, '6.380'), (1, '6.770')] +[2023-10-08 15:45:04,152][21194] Updated weights for policy 1, policy_version 1430 (0.0010) +[2023-10-08 15:45:04,530][21194] Updated weights for policy 1, policy_version 1440 (0.0011) +[2023-10-08 15:45:07,310][21195] Updated weights for policy 0, policy_version 1450 (0.0009) +[2023-10-08 15:45:07,684][21195] Updated weights for policy 0, policy_version 1460 (0.0009) +[2023-10-08 15:45:08,051][21195] Updated weights for policy 0, policy_version 1470 (0.0009) +[2023-10-08 15:45:08,465][21194] Updated weights for policy 1, policy_version 1450 (0.0010) +[2023-10-08 15:45:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13374.7). Total num frames: 2981888. Throughput: 0: 1735.7, 1: 1724.6. Samples: 753300. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 15:45:08,803][19739] Avg episode reward: [(0, '7.250'), (1, '6.480')] +[2023-10-08 15:45:08,834][21194] Updated weights for policy 1, policy_version 1460 (0.0010) +[2023-10-08 15:45:09,200][21194] Updated weights for policy 1, policy_version 1470 (0.0011) +[2023-10-08 15:45:11,979][21195] Updated weights for policy 0, policy_version 1480 (0.0008) +[2023-10-08 15:45:12,350][21195] Updated weights for policy 0, policy_version 1490 (0.0008) +[2023-10-08 15:45:12,725][21195] Updated weights for policy 0, policy_version 1500 (0.0008) +[2023-10-08 15:45:13,232][21194] Updated weights for policy 1, policy_version 1480 (0.0010) +[2023-10-08 15:45:13,601][21194] Updated weights for policy 1, policy_version 1490 (0.0007) +[2023-10-08 15:45:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13368.9). Total num frames: 3047424. Throughput: 0: 1707.2, 1: 1717.3. Samples: 773362. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:45:13,803][19739] Avg episode reward: [(0, '7.880'), (1, '7.190')] +[2023-10-08 15:45:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000001504_1540096.pth... +[2023-10-08 15:45:13,846][20740] Saving new best policy, reward=7.880! +[2023-10-08 15:45:13,969][21194] Updated weights for policy 1, policy_version 1500 (0.0008) +[2023-10-08 15:45:14,117][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000001504_1540096.pth... +[2023-10-08 15:45:16,487][21195] Updated weights for policy 0, policy_version 1510 (0.0009) +[2023-10-08 15:45:16,865][21195] Updated weights for policy 0, policy_version 1520 (0.0007) +[2023-10-08 15:45:17,241][21195] Updated weights for policy 0, policy_version 1530 (0.0008) +[2023-10-08 15:45:17,786][21194] Updated weights for policy 1, policy_version 1510 (0.0009) +[2023-10-08 15:45:18,156][21194] Updated weights for policy 1, policy_version 1520 (0.0008) +[2023-10-08 15:45:18,513][21194] Updated weights for policy 1, policy_version 1530 (0.0008) +[2023-10-08 15:45:18,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13503.9). Total num frames: 3145728. Throughput: 0: 1722.6, 1: 1718.7. Samples: 789050. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 15:45:18,803][19739] Avg episode reward: [(0, '7.090'), (1, '8.340')] +[2023-10-08 15:45:18,804][20836] Saving new best policy, reward=8.340! +[2023-10-08 15:45:21,114][21195] Updated weights for policy 0, policy_version 1540 (0.0009) +[2023-10-08 15:45:21,492][21195] Updated weights for policy 0, policy_version 1550 (0.0007) +[2023-10-08 15:45:21,869][21195] Updated weights for policy 0, policy_version 1560 (0.0011) +[2023-10-08 15:45:22,410][21194] Updated weights for policy 1, policy_version 1540 (0.0008) +[2023-10-08 15:45:22,778][21194] Updated weights for policy 1, policy_version 1550 (0.0007) +[2023-10-08 15:45:23,157][21194] Updated weights for policy 1, policy_version 1560 (0.0009) +[2023-10-08 15:45:23,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13495.6). Total num frames: 3211264. Throughput: 0: 1728.3, 1: 1722.0. Samples: 804848. Policy #0 lag: (min: 17.0, avg: 27.8, max: 49.0) +[2023-10-08 15:45:23,804][19739] Avg episode reward: [(0, '6.210'), (1, '8.490')] +[2023-10-08 15:45:23,805][20836] Saving new best policy, reward=8.490! +[2023-10-08 15:45:25,875][21195] Updated weights for policy 0, policy_version 1570 (0.0007) +[2023-10-08 15:45:26,247][21195] Updated weights for policy 0, policy_version 1580 (0.0007) +[2023-10-08 15:45:26,621][21195] Updated weights for policy 0, policy_version 1590 (0.0008) +[2023-10-08 15:45:27,001][21195] Updated weights for policy 0, policy_version 1600 (0.0009) +[2023-10-08 15:45:27,128][21194] Updated weights for policy 1, policy_version 1570 (0.0010) +[2023-10-08 15:45:27,515][21194] Updated weights for policy 1, policy_version 1580 (0.0008) +[2023-10-08 15:45:27,885][21194] Updated weights for policy 1, policy_version 1590 (0.0011) +[2023-10-08 15:45:28,264][21194] Updated weights for policy 1, policy_version 1600 (0.0009) +[2023-10-08 15:45:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13487.6). Total num frames: 3276800. Throughput: 0: 1713.0, 1: 1700.2. Samples: 824670. Policy #0 lag: (min: 30.0, avg: 31.8, max: 57.0) +[2023-10-08 15:45:28,803][19739] Avg episode reward: [(0, '6.420'), (1, '6.450')] +[2023-10-08 15:45:30,819][21195] Updated weights for policy 0, policy_version 1610 (0.0008) +[2023-10-08 15:45:31,197][21195] Updated weights for policy 0, policy_version 1620 (0.0008) +[2023-10-08 15:45:31,568][21195] Updated weights for policy 0, policy_version 1630 (0.0008) +[2023-10-08 15:45:32,212][21194] Updated weights for policy 1, policy_version 1610 (0.0007) +[2023-10-08 15:45:32,578][21194] Updated weights for policy 1, policy_version 1620 (0.0011) +[2023-10-08 15:45:32,946][21194] Updated weights for policy 1, policy_version 1630 (0.0008) +[2023-10-08 15:45:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13479.9). Total num frames: 3342336. Throughput: 0: 1739.6, 1: 1722.5. Samples: 841220. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 15:45:33,803][19739] Avg episode reward: [(0, '8.050'), (1, '6.430')] +[2023-10-08 15:45:33,804][20740] Saving new best policy, reward=8.050! +[2023-10-08 15:45:35,483][21195] Updated weights for policy 0, policy_version 1640 (0.0009) +[2023-10-08 15:45:35,851][21195] Updated weights for policy 0, policy_version 1650 (0.0010) +[2023-10-08 15:45:36,213][21195] Updated weights for policy 0, policy_version 1660 (0.0009) +[2023-10-08 15:45:36,931][21194] Updated weights for policy 1, policy_version 1640 (0.0009) +[2023-10-08 15:45:37,295][21194] Updated weights for policy 1, policy_version 1650 (0.0009) +[2023-10-08 15:45:37,666][21194] Updated weights for policy 1, policy_version 1660 (0.0008) +[2023-10-08 15:45:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13472.6). Total num frames: 3407872. Throughput: 0: 1717.6, 1: 1722.3. Samples: 856176. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:45:38,803][19739] Avg episode reward: [(0, '8.870'), (1, '8.370')] +[2023-10-08 15:45:38,804][20740] Saving new best policy, reward=8.870! +[2023-10-08 15:45:40,149][21195] Updated weights for policy 0, policy_version 1670 (0.0010) +[2023-10-08 15:45:40,515][21195] Updated weights for policy 0, policy_version 1680 (0.0008) +[2023-10-08 15:45:40,881][21195] Updated weights for policy 0, policy_version 1690 (0.0009) +[2023-10-08 15:45:41,531][21194] Updated weights for policy 1, policy_version 1670 (0.0007) +[2023-10-08 15:45:41,904][21194] Updated weights for policy 1, policy_version 1680 (0.0008) +[2023-10-08 15:45:42,275][21194] Updated weights for policy 1, policy_version 1690 (0.0008) +[2023-10-08 15:45:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13465.5). Total num frames: 3473408. Throughput: 0: 1733.1, 1: 1694.3. Samples: 876852. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:45:43,803][19739] Avg episode reward: [(0, '8.940'), (1, '8.450')] +[2023-10-08 15:45:43,813][20740] Saving new best policy, reward=8.940! +[2023-10-08 15:45:44,732][21195] Updated weights for policy 0, policy_version 1700 (0.0009) +[2023-10-08 15:45:45,106][21195] Updated weights for policy 0, policy_version 1710 (0.0009) +[2023-10-08 15:45:45,478][21195] Updated weights for policy 0, policy_version 1720 (0.0009) +[2023-10-08 15:45:46,292][21194] Updated weights for policy 1, policy_version 1700 (0.0008) +[2023-10-08 15:45:46,658][21194] Updated weights for policy 1, policy_version 1710 (0.0008) +[2023-10-08 15:45:47,020][21194] Updated weights for policy 1, policy_version 1720 (0.0008) +[2023-10-08 15:45:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13458.7). Total num frames: 3538944. Throughput: 0: 1755.1, 1: 1725.2. Samples: 893360. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:45:48,803][19739] Avg episode reward: [(0, '7.040'), (1, '7.090')] +[2023-10-08 15:45:49,444][21195] Updated weights for policy 0, policy_version 1730 (0.0008) +[2023-10-08 15:45:49,816][21195] Updated weights for policy 0, policy_version 1740 (0.0008) +[2023-10-08 15:45:50,199][21195] Updated weights for policy 0, policy_version 1750 (0.0010) +[2023-10-08 15:45:50,566][21195] Updated weights for policy 0, policy_version 1760 (0.0008) +[2023-10-08 15:45:50,982][21194] Updated weights for policy 1, policy_version 1730 (0.0008) +[2023-10-08 15:45:51,344][21194] Updated weights for policy 1, policy_version 1740 (0.0010) +[2023-10-08 15:45:51,717][21194] Updated weights for policy 1, policy_version 1750 (0.0010) +[2023-10-08 15:45:52,084][21194] Updated weights for policy 1, policy_version 1760 (0.0011) +[2023-10-08 15:45:53,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13452.1). Total num frames: 3604480. Throughput: 0: 1722.3, 1: 1701.7. Samples: 907380. Policy #0 lag: (min: 31.0, avg: 31.3, max: 44.0) +[2023-10-08 15:45:53,803][19739] Avg episode reward: [(0, '6.640'), (1, '6.590')] +[2023-10-08 15:45:54,395][21195] Updated weights for policy 0, policy_version 1770 (0.0007) +[2023-10-08 15:45:54,772][21195] Updated weights for policy 0, policy_version 1780 (0.0007) +[2023-10-08 15:45:55,146][21195] Updated weights for policy 0, policy_version 1790 (0.0008) +[2023-10-08 15:45:56,058][21194] Updated weights for policy 1, policy_version 1770 (0.0009) +[2023-10-08 15:45:56,430][21194] Updated weights for policy 1, policy_version 1780 (0.0009) +[2023-10-08 15:45:56,798][21194] Updated weights for policy 1, policy_version 1790 (0.0008) +[2023-10-08 15:45:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13445.8). Total num frames: 3670016. Throughput: 0: 1751.8, 1: 1703.1. Samples: 928830. Policy #0 lag: (min: 8.0, avg: 33.6, max: 40.0) +[2023-10-08 15:45:58,803][19739] Avg episode reward: [(0, '5.650'), (1, '6.740')] +[2023-10-08 15:45:59,015][21195] Updated weights for policy 0, policy_version 1800 (0.0010) +[2023-10-08 15:45:59,396][21195] Updated weights for policy 0, policy_version 1810 (0.0011) +[2023-10-08 15:45:59,774][21195] Updated weights for policy 0, policy_version 1820 (0.0009) +[2023-10-08 15:46:00,669][21194] Updated weights for policy 1, policy_version 1800 (0.0010) +[2023-10-08 15:46:01,037][21194] Updated weights for policy 1, policy_version 1810 (0.0011) +[2023-10-08 15:46:01,418][21194] Updated weights for policy 1, policy_version 1820 (0.0009) +[2023-10-08 15:46:03,775][21195] Updated weights for policy 0, policy_version 1830 (0.0009) +[2023-10-08 15:46:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13439.7). Total num frames: 3735552. Throughput: 0: 1738.7, 1: 1721.2. Samples: 944748. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:46:03,803][19739] Avg episode reward: [(0, '6.630'), (1, '7.770')] +[2023-10-08 15:46:04,142][21195] Updated weights for policy 0, policy_version 1840 (0.0007) +[2023-10-08 15:46:04,516][21195] Updated weights for policy 0, policy_version 1850 (0.0008) +[2023-10-08 15:46:05,409][21194] Updated weights for policy 1, policy_version 1830 (0.0009) +[2023-10-08 15:46:05,776][21194] Updated weights for policy 1, policy_version 1840 (0.0008) +[2023-10-08 15:46:06,149][21194] Updated weights for policy 1, policy_version 1850 (0.0007) +[2023-10-08 15:46:08,452][21195] Updated weights for policy 0, policy_version 1860 (0.0007) +[2023-10-08 15:46:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13433.8). Total num frames: 3801088. Throughput: 0: 1736.4, 1: 1704.3. Samples: 959676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:46:08,803][19739] Avg episode reward: [(0, '6.500'), (1, '8.820')] +[2023-10-08 15:46:08,804][20836] Saving new best policy, reward=8.820! +[2023-10-08 15:46:08,824][21195] Updated weights for policy 0, policy_version 1870 (0.0008) +[2023-10-08 15:46:09,200][21195] Updated weights for policy 0, policy_version 1880 (0.0008) +[2023-10-08 15:46:10,090][21194] Updated weights for policy 1, policy_version 1860 (0.0008) +[2023-10-08 15:46:10,449][21194] Updated weights for policy 1, policy_version 1870 (0.0009) +[2023-10-08 15:46:10,826][21194] Updated weights for policy 1, policy_version 1880 (0.0009) +[2023-10-08 15:46:13,259][21195] Updated weights for policy 0, policy_version 1890 (0.0008) +[2023-10-08 15:46:13,632][21195] Updated weights for policy 0, policy_version 1900 (0.0007) +[2023-10-08 15:46:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13428.1). Total num frames: 3866624. Throughput: 0: 1749.3, 1: 1729.4. Samples: 981210. Policy #0 lag: (min: 26.0, avg: 29.3, max: 58.0) +[2023-10-08 15:46:13,803][19739] Avg episode reward: [(0, '7.320'), (1, '7.660')] +[2023-10-08 15:46:14,011][21195] Updated weights for policy 0, policy_version 1910 (0.0010) +[2023-10-08 15:46:14,385][21195] Updated weights for policy 0, policy_version 1920 (0.0007) +[2023-10-08 15:46:14,782][21194] Updated weights for policy 1, policy_version 1890 (0.0010) +[2023-10-08 15:46:15,196][21194] Updated weights for policy 1, policy_version 1900 (0.0009) +[2023-10-08 15:46:15,553][21194] Updated weights for policy 1, policy_version 1910 (0.0009) +[2023-10-08 15:46:15,930][21194] Updated weights for policy 1, policy_version 1920 (0.0008) +[2023-10-08 15:46:18,148][21195] Updated weights for policy 0, policy_version 1930 (0.0010) +[2023-10-08 15:46:18,516][21195] Updated weights for policy 0, policy_version 1940 (0.0009) +[2023-10-08 15:46:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13422.7). Total num frames: 3932160. Throughput: 0: 1726.4, 1: 1705.2. Samples: 995646. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:46:18,803][19739] Avg episode reward: [(0, '7.630'), (1, '6.200')] +[2023-10-08 15:46:18,881][21195] Updated weights for policy 0, policy_version 1950 (0.0010) +[2023-10-08 15:46:20,032][21194] Updated weights for policy 1, policy_version 1930 (0.0008) +[2023-10-08 15:46:20,410][21194] Updated weights for policy 1, policy_version 1940 (0.0010) +[2023-10-08 15:46:20,775][21194] Updated weights for policy 1, policy_version 1950 (0.0010) +[2023-10-08 15:46:23,031][21195] Updated weights for policy 0, policy_version 1960 (0.0008) +[2023-10-08 15:46:23,409][21195] Updated weights for policy 0, policy_version 1970 (0.0008) +[2023-10-08 15:46:23,773][21195] Updated weights for policy 0, policy_version 1980 (0.0009) +[2023-10-08 15:46:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13551.5). Total num frames: 3997696. Throughput: 0: 1750.4, 1: 1709.7. Samples: 1011882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:46:23,804][19739] Avg episode reward: [(0, '9.310'), (1, '6.870')] +[2023-10-08 15:46:23,924][20740] Saving new best policy, reward=9.310! +[2023-10-08 15:46:24,614][21194] Updated weights for policy 1, policy_version 1960 (0.0008) +[2023-10-08 15:46:24,987][21194] Updated weights for policy 1, policy_version 1970 (0.0007) +[2023-10-08 15:46:25,351][21194] Updated weights for policy 1, policy_version 1980 (0.0010) +[2023-10-08 15:46:27,588][21195] Updated weights for policy 0, policy_version 1990 (0.0007) +[2023-10-08 15:46:27,950][21195] Updated weights for policy 0, policy_version 2000 (0.0007) +[2023-10-08 15:46:28,324][21195] Updated weights for policy 0, policy_version 2010 (0.0009) +[2023-10-08 15:46:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 4096000. Throughput: 0: 1731.9, 1: 1740.8. Samples: 1033124. Policy #0 lag: (min: 1.0, avg: 22.2, max: 33.0) +[2023-10-08 15:46:28,803][19739] Avg episode reward: [(0, '8.470'), (1, '7.830')] +[2023-10-08 15:46:29,097][21194] Updated weights for policy 1, policy_version 1990 (0.0010) +[2023-10-08 15:46:29,463][21194] Updated weights for policy 1, policy_version 2000 (0.0010) +[2023-10-08 15:46:29,837][21194] Updated weights for policy 1, policy_version 2010 (0.0010) +[2023-10-08 15:46:32,160][21195] Updated weights for policy 0, policy_version 2020 (0.0009) +[2023-10-08 15:46:32,521][21195] Updated weights for policy 0, policy_version 2030 (0.0010) +[2023-10-08 15:46:32,889][21195] Updated weights for policy 0, policy_version 2040 (0.0010) +[2023-10-08 15:46:33,778][21194] Updated weights for policy 1, policy_version 2020 (0.0007) +[2023-10-08 15:46:33,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 4161536. Throughput: 0: 1716.8, 1: 1712.2. Samples: 1047666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:46:33,803][19739] Avg episode reward: [(0, '8.360'), (1, '8.760')] +[2023-10-08 15:46:34,139][21194] Updated weights for policy 1, policy_version 2030 (0.0010) +[2023-10-08 15:46:34,514][21194] Updated weights for policy 1, policy_version 2040 (0.0008) +[2023-10-08 15:46:36,918][21195] Updated weights for policy 0, policy_version 2050 (0.0011) +[2023-10-08 15:46:37,290][21195] Updated weights for policy 0, policy_version 2060 (0.0010) +[2023-10-08 15:46:37,666][21195] Updated weights for policy 0, policy_version 2070 (0.0009) +[2023-10-08 15:46:38,038][21195] Updated weights for policy 0, policy_version 2080 (0.0010) +[2023-10-08 15:46:38,424][21194] Updated weights for policy 1, policy_version 2050 (0.0008) +[2023-10-08 15:46:38,802][21194] Updated weights for policy 1, policy_version 2060 (0.0009) +[2023-10-08 15:46:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 4227072. Throughput: 0: 1747.2, 1: 1742.2. Samples: 1064406. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:46:38,803][19739] Avg episode reward: [(0, '7.900'), (1, '8.900')] +[2023-10-08 15:46:39,162][21194] Updated weights for policy 1, policy_version 2070 (0.0010) +[2023-10-08 15:46:39,529][20836] Saving new best policy, reward=8.900! +[2023-10-08 15:46:39,531][21194] Updated weights for policy 1, policy_version 2080 (0.0011) +[2023-10-08 15:46:41,882][21195] Updated weights for policy 0, policy_version 2090 (0.0008) +[2023-10-08 15:46:42,250][21195] Updated weights for policy 0, policy_version 2100 (0.0007) +[2023-10-08 15:46:42,636][21195] Updated weights for policy 0, policy_version 2110 (0.0007) +[2023-10-08 15:46:43,537][21194] Updated weights for policy 1, policy_version 2090 (0.0009) +[2023-10-08 15:46:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 4292608. Throughput: 0: 1712.6, 1: 1744.5. Samples: 1084400. Policy #0 lag: (min: 26.0, avg: 28.9, max: 47.0) +[2023-10-08 15:46:43,803][19739] Avg episode reward: [(0, '9.020'), (1, '7.880')] +[2023-10-08 15:46:43,902][21194] Updated weights for policy 1, policy_version 2100 (0.0009) +[2023-10-08 15:46:44,269][21194] Updated weights for policy 1, policy_version 2110 (0.0011) +[2023-10-08 15:46:46,384][21195] Updated weights for policy 0, policy_version 2120 (0.0007) +[2023-10-08 15:46:46,761][21195] Updated weights for policy 0, policy_version 2130 (0.0009) +[2023-10-08 15:46:47,127][21195] Updated weights for policy 0, policy_version 2140 (0.0007) +[2023-10-08 15:46:48,215][21194] Updated weights for policy 1, policy_version 2120 (0.0008) +[2023-10-08 15:46:48,587][21194] Updated weights for policy 1, policy_version 2130 (0.0007) +[2023-10-08 15:46:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 4358144. Throughput: 0: 1723.0, 1: 1722.2. Samples: 1099780. Policy #0 lag: (min: 31.0, avg: 45.0, max: 63.0) +[2023-10-08 15:46:48,803][19739] Avg episode reward: [(0, '9.170'), (1, '7.290')] +[2023-10-08 15:46:48,958][21194] Updated weights for policy 1, policy_version 2140 (0.0009) +[2023-10-08 15:46:51,001][21195] Updated weights for policy 0, policy_version 2150 (0.0008) +[2023-10-08 15:46:51,378][21195] Updated weights for policy 0, policy_version 2160 (0.0008) +[2023-10-08 15:46:51,750][21195] Updated weights for policy 0, policy_version 2170 (0.0008) +[2023-10-08 15:46:52,947][21194] Updated weights for policy 1, policy_version 2150 (0.0008) +[2023-10-08 15:46:53,312][21194] Updated weights for policy 1, policy_version 2160 (0.0008) +[2023-10-08 15:46:53,678][21194] Updated weights for policy 1, policy_version 2170 (0.0009) +[2023-10-08 15:46:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 4423680. Throughput: 0: 1719.5, 1: 1740.7. Samples: 1115382. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 15:46:53,803][19739] Avg episode reward: [(0, '6.760'), (1, '7.640')] +[2023-10-08 15:46:55,674][21195] Updated weights for policy 0, policy_version 2180 (0.0008) +[2023-10-08 15:46:56,031][21195] Updated weights for policy 0, policy_version 2190 (0.0007) +[2023-10-08 15:46:56,408][21195] Updated weights for policy 0, policy_version 2200 (0.0007) +[2023-10-08 15:46:57,466][21194] Updated weights for policy 1, policy_version 2180 (0.0008) +[2023-10-08 15:46:57,835][21194] Updated weights for policy 1, policy_version 2190 (0.0007) +[2023-10-08 15:46:58,206][21194] Updated weights for policy 1, policy_version 2200 (0.0007) +[2023-10-08 15:46:58,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 4521984. Throughput: 0: 1712.6, 1: 1723.5. Samples: 1135832. Policy #0 lag: (min: 31.0, avg: 34.9, max: 63.0) +[2023-10-08 15:46:58,803][19739] Avg episode reward: [(0, '6.910'), (1, '7.100')] +[2023-10-08 15:47:00,354][21195] Updated weights for policy 0, policy_version 2210 (0.0007) +[2023-10-08 15:47:00,725][21195] Updated weights for policy 0, policy_version 2220 (0.0008) +[2023-10-08 15:47:01,083][21195] Updated weights for policy 0, policy_version 2230 (0.0009) +[2023-10-08 15:47:01,460][21195] Updated weights for policy 0, policy_version 2240 (0.0008) +[2023-10-08 15:47:02,182][21194] Updated weights for policy 1, policy_version 2210 (0.0008) +[2023-10-08 15:47:02,588][21194] Updated weights for policy 1, policy_version 2220 (0.0008) +[2023-10-08 15:47:02,949][21194] Updated weights for policy 1, policy_version 2230 (0.0007) +[2023-10-08 15:47:03,320][21194] Updated weights for policy 1, policy_version 2240 (0.0007) +[2023-10-08 15:47:03,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 4587520. Throughput: 0: 1739.2, 1: 1742.6. Samples: 1152328. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:47:03,803][19739] Avg episode reward: [(0, '7.320'), (1, '8.800')] +[2023-10-08 15:47:05,372][21195] Updated weights for policy 0, policy_version 2250 (0.0010) +[2023-10-08 15:47:05,744][21195] Updated weights for policy 0, policy_version 2260 (0.0009) +[2023-10-08 15:47:06,116][21195] Updated weights for policy 0, policy_version 2270 (0.0012) +[2023-10-08 15:47:07,331][21194] Updated weights for policy 1, policy_version 2250 (0.0008) +[2023-10-08 15:47:07,698][21194] Updated weights for policy 1, policy_version 2260 (0.0007) +[2023-10-08 15:47:08,064][21194] Updated weights for policy 1, policy_version 2270 (0.0009) +[2023-10-08 15:47:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 4653056. Throughput: 0: 1716.4, 1: 1740.9. Samples: 1167460. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:47:08,804][19739] Avg episode reward: [(0, '8.930'), (1, '8.980')] +[2023-10-08 15:47:08,805][20836] Saving new best policy, reward=8.980! +[2023-10-08 15:47:10,001][21195] Updated weights for policy 0, policy_version 2280 (0.0009) +[2023-10-08 15:47:10,365][21195] Updated weights for policy 0, policy_version 2290 (0.0009) +[2023-10-08 15:47:10,736][21195] Updated weights for policy 0, policy_version 2300 (0.0010) +[2023-10-08 15:47:11,984][21194] Updated weights for policy 1, policy_version 2280 (0.0008) +[2023-10-08 15:47:12,366][21194] Updated weights for policy 1, policy_version 2290 (0.0009) +[2023-10-08 15:47:12,739][21194] Updated weights for policy 1, policy_version 2300 (0.0009) +[2023-10-08 15:47:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 4718592. Throughput: 0: 1727.2, 1: 1704.8. Samples: 1187568. Policy #0 lag: (min: 9.0, avg: 13.8, max: 41.0) +[2023-10-08 15:47:13,804][19739] Avg episode reward: [(0, '8.910'), (1, '7.920')] +[2023-10-08 15:47:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000002304_2359296.pth... +[2023-10-08 15:47:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000002304_2359296.pth... +[2023-10-08 15:47:13,859][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000000704_720896.pth +[2023-10-08 15:47:13,860][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000000704_720896.pth +[2023-10-08 15:47:14,743][21195] Updated weights for policy 0, policy_version 2310 (0.0007) +[2023-10-08 15:47:15,121][21195] Updated weights for policy 0, policy_version 2320 (0.0007) +[2023-10-08 15:47:15,488][21195] Updated weights for policy 0, policy_version 2330 (0.0008) +[2023-10-08 15:47:16,600][21194] Updated weights for policy 1, policy_version 2310 (0.0007) +[2023-10-08 15:47:16,969][21194] Updated weights for policy 1, policy_version 2320 (0.0008) +[2023-10-08 15:47:17,342][21194] Updated weights for policy 1, policy_version 2330 (0.0009) +[2023-10-08 15:47:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 4784128. Throughput: 0: 1746.9, 1: 1740.9. Samples: 1204616. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 15:47:18,804][19739] Avg episode reward: [(0, '6.830'), (1, '8.760')] +[2023-10-08 15:47:19,432][21195] Updated weights for policy 0, policy_version 2340 (0.0007) +[2023-10-08 15:47:19,804][21195] Updated weights for policy 0, policy_version 2350 (0.0009) +[2023-10-08 15:47:20,175][21195] Updated weights for policy 0, policy_version 2360 (0.0008) +[2023-10-08 15:47:21,225][21194] Updated weights for policy 1, policy_version 2340 (0.0010) +[2023-10-08 15:47:21,595][21194] Updated weights for policy 1, policy_version 2350 (0.0010) +[2023-10-08 15:47:21,958][21194] Updated weights for policy 1, policy_version 2360 (0.0010) +[2023-10-08 15:47:23,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 4849664. Throughput: 0: 1716.3, 1: 1714.5. Samples: 1218792. Policy #0 lag: (min: 14.0, avg: 14.1, max: 22.0) +[2023-10-08 15:47:23,803][19739] Avg episode reward: [(0, '6.870'), (1, '6.840')] +[2023-10-08 15:47:24,346][21195] Updated weights for policy 0, policy_version 2370 (0.0008) +[2023-10-08 15:47:24,721][21195] Updated weights for policy 0, policy_version 2380 (0.0007) +[2023-10-08 15:47:25,104][21195] Updated weights for policy 0, policy_version 2390 (0.0009) +[2023-10-08 15:47:25,469][21195] Updated weights for policy 0, policy_version 2400 (0.0008) +[2023-10-08 15:47:25,959][21194] Updated weights for policy 1, policy_version 2370 (0.0009) +[2023-10-08 15:47:26,327][21194] Updated weights for policy 1, policy_version 2380 (0.0008) +[2023-10-08 15:47:26,702][21194] Updated weights for policy 1, policy_version 2390 (0.0009) +[2023-10-08 15:47:27,068][21194] Updated weights for policy 1, policy_version 2400 (0.0007) +[2023-10-08 15:47:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 4915200. Throughput: 0: 1749.9, 1: 1705.6. Samples: 1239900. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 15:47:28,803][19739] Avg episode reward: [(0, '7.470'), (1, '6.920')] +[2023-10-08 15:47:29,130][21195] Updated weights for policy 0, policy_version 2410 (0.0008) +[2023-10-08 15:47:29,504][21195] Updated weights for policy 0, policy_version 2420 (0.0009) +[2023-10-08 15:47:29,866][21195] Updated weights for policy 0, policy_version 2430 (0.0008) +[2023-10-08 15:47:30,918][21194] Updated weights for policy 1, policy_version 2410 (0.0010) +[2023-10-08 15:47:31,292][21194] Updated weights for policy 1, policy_version 2420 (0.0011) +[2023-10-08 15:47:31,669][21194] Updated weights for policy 1, policy_version 2430 (0.0011) +[2023-10-08 15:47:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 4980736. Throughput: 0: 1738.1, 1: 1727.6. Samples: 1255734. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 15:47:33,803][19739] Avg episode reward: [(0, '8.880'), (1, '7.290')] +[2023-10-08 15:47:33,806][21195] Updated weights for policy 0, policy_version 2440 (0.0008) +[2023-10-08 15:47:34,175][21195] Updated weights for policy 0, policy_version 2450 (0.0009) +[2023-10-08 15:47:34,545][21195] Updated weights for policy 0, policy_version 2460 (0.0009) +[2023-10-08 15:47:35,622][21194] Updated weights for policy 1, policy_version 2440 (0.0009) +[2023-10-08 15:47:35,992][21194] Updated weights for policy 1, policy_version 2450 (0.0007) +[2023-10-08 15:47:36,360][21194] Updated weights for policy 1, policy_version 2460 (0.0007) +[2023-10-08 15:47:38,415][21195] Updated weights for policy 0, policy_version 2470 (0.0007) +[2023-10-08 15:47:38,785][21195] Updated weights for policy 0, policy_version 2480 (0.0009) +[2023-10-08 15:47:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 5046272. Throughput: 0: 1745.1, 1: 1710.6. Samples: 1270888. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:47:38,803][19739] Avg episode reward: [(0, '10.170'), (1, '8.690')] +[2023-10-08 15:47:39,157][21195] Updated weights for policy 0, policy_version 2490 (0.0009) +[2023-10-08 15:47:39,380][20740] Saving new best policy, reward=10.170! +[2023-10-08 15:47:40,186][21194] Updated weights for policy 1, policy_version 2470 (0.0007) +[2023-10-08 15:47:40,565][21194] Updated weights for policy 1, policy_version 2480 (0.0007) +[2023-10-08 15:47:40,927][21194] Updated weights for policy 1, policy_version 2490 (0.0008) +[2023-10-08 15:47:43,114][21195] Updated weights for policy 0, policy_version 2500 (0.0010) +[2023-10-08 15:47:43,486][21195] Updated weights for policy 0, policy_version 2510 (0.0008) +[2023-10-08 15:47:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 5111808. Throughput: 0: 1750.2, 1: 1727.7. Samples: 1292340. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:47:43,803][19739] Avg episode reward: [(0, '9.090'), (1, '9.790')] +[2023-10-08 15:47:43,814][20836] Saving new best policy, reward=9.790! +[2023-10-08 15:47:43,859][21195] Updated weights for policy 0, policy_version 2520 (0.0009) +[2023-10-08 15:47:45,002][21194] Updated weights for policy 1, policy_version 2500 (0.0009) +[2023-10-08 15:47:45,377][21194] Updated weights for policy 1, policy_version 2510 (0.0011) +[2023-10-08 15:47:45,735][21194] Updated weights for policy 1, policy_version 2520 (0.0007) +[2023-10-08 15:47:47,734][21195] Updated weights for policy 0, policy_version 2530 (0.0009) +[2023-10-08 15:47:48,112][21195] Updated weights for policy 0, policy_version 2540 (0.0007) +[2023-10-08 15:47:48,475][21195] Updated weights for policy 0, policy_version 2550 (0.0008) +[2023-10-08 15:47:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 5177344. Throughput: 0: 1720.4, 1: 1710.8. Samples: 1306728. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:47:48,803][19739] Avg episode reward: [(0, '8.100'), (1, '10.950')] +[2023-10-08 15:47:48,804][20836] Saving new best policy, reward=10.950! +[2023-10-08 15:47:48,849][21195] Updated weights for policy 0, policy_version 2560 (0.0008) +[2023-10-08 15:47:49,496][21194] Updated weights for policy 1, policy_version 2530 (0.0010) +[2023-10-08 15:47:49,861][21194] Updated weights for policy 1, policy_version 2540 (0.0007) +[2023-10-08 15:47:50,232][21194] Updated weights for policy 1, policy_version 2550 (0.0008) +[2023-10-08 15:47:50,603][21194] Updated weights for policy 1, policy_version 2560 (0.0007) +[2023-10-08 15:47:52,746][21195] Updated weights for policy 0, policy_version 2570 (0.0010) +[2023-10-08 15:47:53,115][21195] Updated weights for policy 0, policy_version 2580 (0.0007) +[2023-10-08 15:47:53,486][21195] Updated weights for policy 0, policy_version 2590 (0.0007) +[2023-10-08 15:47:53,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 5275648. Throughput: 0: 1750.7, 1: 1714.8. Samples: 1323406. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 15:47:53,804][19739] Avg episode reward: [(0, '7.640'), (1, '10.180')] +[2023-10-08 15:47:54,741][21194] Updated weights for policy 1, policy_version 2570 (0.0008) +[2023-10-08 15:47:55,120][21194] Updated weights for policy 1, policy_version 2580 (0.0007) +[2023-10-08 15:47:55,486][21194] Updated weights for policy 1, policy_version 2590 (0.0008) +[2023-10-08 15:47:57,324][21195] Updated weights for policy 0, policy_version 2600 (0.0007) +[2023-10-08 15:47:57,700][21195] Updated weights for policy 0, policy_version 2610 (0.0007) +[2023-10-08 15:47:58,074][21195] Updated weights for policy 0, policy_version 2620 (0.0009) +[2023-10-08 15:47:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 5341184. Throughput: 0: 1738.5, 1: 1749.1. Samples: 1344510. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 15:47:58,803][19739] Avg episode reward: [(0, '9.410'), (1, '9.730')] +[2023-10-08 15:47:59,283][21194] Updated weights for policy 1, policy_version 2600 (0.0008) +[2023-10-08 15:47:59,666][21194] Updated weights for policy 1, policy_version 2610 (0.0008) +[2023-10-08 15:48:00,032][21194] Updated weights for policy 1, policy_version 2620 (0.0009) +[2023-10-08 15:48:01,849][21195] Updated weights for policy 0, policy_version 2630 (0.0009) +[2023-10-08 15:48:02,225][21195] Updated weights for policy 0, policy_version 2640 (0.0008) +[2023-10-08 15:48:02,595][21195] Updated weights for policy 0, policy_version 2650 (0.0010) +[2023-10-08 15:48:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 5406720. Throughput: 0: 1726.9, 1: 1709.9. Samples: 1359274. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:48:03,803][19739] Avg episode reward: [(0, '11.270'), (1, '9.480')] +[2023-10-08 15:48:03,804][20740] Saving new best policy, reward=11.270! +[2023-10-08 15:48:03,972][21194] Updated weights for policy 1, policy_version 2630 (0.0008) +[2023-10-08 15:48:04,331][21194] Updated weights for policy 1, policy_version 2640 (0.0011) +[2023-10-08 15:48:04,716][21194] Updated weights for policy 1, policy_version 2650 (0.0009) +[2023-10-08 15:48:06,503][21195] Updated weights for policy 0, policy_version 2660 (0.0008) +[2023-10-08 15:48:06,883][21195] Updated weights for policy 0, policy_version 2670 (0.0008) +[2023-10-08 15:48:07,254][21195] Updated weights for policy 0, policy_version 2680 (0.0008) +[2023-10-08 15:48:08,618][21194] Updated weights for policy 1, policy_version 2660 (0.0008) +[2023-10-08 15:48:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 5472256. Throughput: 0: 1749.7, 1: 1737.4. Samples: 1375710. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:48:08,803][19739] Avg episode reward: [(0, '13.010'), (1, '9.120')] +[2023-10-08 15:48:08,804][20740] Saving new best policy, reward=13.010! +[2023-10-08 15:48:08,988][21194] Updated weights for policy 1, policy_version 2670 (0.0011) +[2023-10-08 15:48:09,347][21194] Updated weights for policy 1, policy_version 2680 (0.0009) +[2023-10-08 15:48:11,171][21195] Updated weights for policy 0, policy_version 2690 (0.0008) +[2023-10-08 15:48:11,532][21195] Updated weights for policy 0, policy_version 2700 (0.0009) +[2023-10-08 15:48:11,914][21195] Updated weights for policy 0, policy_version 2710 (0.0007) +[2023-10-08 15:48:12,284][21195] Updated weights for policy 0, policy_version 2720 (0.0008) +[2023-10-08 15:48:13,320][21194] Updated weights for policy 1, policy_version 2690 (0.0007) +[2023-10-08 15:48:13,699][21194] Updated weights for policy 1, policy_version 2700 (0.0009) +[2023-10-08 15:48:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 5537792. Throughput: 0: 1730.4, 1: 1748.3. Samples: 1396442. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 15:48:13,804][19739] Avg episode reward: [(0, '8.740'), (1, '7.540')] +[2023-10-08 15:48:14,061][21194] Updated weights for policy 1, policy_version 2710 (0.0007) +[2023-10-08 15:48:14,427][21194] Updated weights for policy 1, policy_version 2720 (0.0007) +[2023-10-08 15:48:16,154][21195] Updated weights for policy 0, policy_version 2730 (0.0009) +[2023-10-08 15:48:16,530][21195] Updated weights for policy 0, policy_version 2740 (0.0009) +[2023-10-08 15:48:16,901][21195] Updated weights for policy 0, policy_version 2750 (0.0007) +[2023-10-08 15:48:18,509][21194] Updated weights for policy 1, policy_version 2730 (0.0009) +[2023-10-08 15:48:18,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 5603328. Throughput: 0: 1741.4, 1: 1727.0. Samples: 1411814. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 15:48:18,804][19739] Avg episode reward: [(0, '7.300'), (1, '8.720')] +[2023-10-08 15:48:18,889][21194] Updated weights for policy 1, policy_version 2740 (0.0008) +[2023-10-08 15:48:19,251][21194] Updated weights for policy 1, policy_version 2750 (0.0009) +[2023-10-08 15:48:20,788][21195] Updated weights for policy 0, policy_version 2760 (0.0009) +[2023-10-08 15:48:21,163][21195] Updated weights for policy 0, policy_version 2770 (0.0008) +[2023-10-08 15:48:21,545][21195] Updated weights for policy 0, policy_version 2780 (0.0008) +[2023-10-08 15:48:23,230][21194] Updated weights for policy 1, policy_version 2760 (0.0011) +[2023-10-08 15:48:23,593][21194] Updated weights for policy 1, policy_version 2770 (0.0008) +[2023-10-08 15:48:23,802][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 5668864. Throughput: 0: 1730.8, 1: 1742.3. Samples: 1427178. Policy #0 lag: (min: 25.0, avg: 39.6, max: 57.0) +[2023-10-08 15:48:23,803][19739] Avg episode reward: [(0, '7.000'), (1, '10.300')] +[2023-10-08 15:48:23,960][21194] Updated weights for policy 1, policy_version 2780 (0.0007) +[2023-10-08 15:48:25,490][21195] Updated weights for policy 0, policy_version 2790 (0.0009) +[2023-10-08 15:48:25,860][21195] Updated weights for policy 0, policy_version 2800 (0.0009) +[2023-10-08 15:48:26,240][21195] Updated weights for policy 0, policy_version 2810 (0.0009) +[2023-10-08 15:48:27,884][21194] Updated weights for policy 1, policy_version 2790 (0.0009) +[2023-10-08 15:48:28,263][21194] Updated weights for policy 1, policy_version 2800 (0.0010) +[2023-10-08 15:48:28,632][21194] Updated weights for policy 1, policy_version 2810 (0.0009) +[2023-10-08 15:48:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 5734400. Throughput: 0: 1730.3, 1: 1730.7. Samples: 1448084. Policy #0 lag: (min: 19.0, avg: 34.3, max: 51.0) +[2023-10-08 15:48:28,803][19739] Avg episode reward: [(0, '8.400'), (1, '10.620')] +[2023-10-08 15:48:30,041][21195] Updated weights for policy 0, policy_version 2820 (0.0009) +[2023-10-08 15:48:30,420][21195] Updated weights for policy 0, policy_version 2830 (0.0009) +[2023-10-08 15:48:30,784][21195] Updated weights for policy 0, policy_version 2840 (0.0009) +[2023-10-08 15:48:32,568][21194] Updated weights for policy 1, policy_version 2820 (0.0008) +[2023-10-08 15:48:32,933][21194] Updated weights for policy 1, policy_version 2830 (0.0008) +[2023-10-08 15:48:33,302][21194] Updated weights for policy 1, policy_version 2840 (0.0007) +[2023-10-08 15:48:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 5832704. Throughput: 0: 1762.1, 1: 1738.3. Samples: 1464244. Policy #0 lag: (min: 31.0, avg: 39.4, max: 63.0) +[2023-10-08 15:48:33,803][19739] Avg episode reward: [(0, '10.200'), (1, '12.030')] +[2023-10-08 15:48:33,804][20836] Saving new best policy, reward=12.030! +[2023-10-08 15:48:34,598][21195] Updated weights for policy 0, policy_version 2850 (0.0010) +[2023-10-08 15:48:34,970][21195] Updated weights for policy 0, policy_version 2860 (0.0009) +[2023-10-08 15:48:35,344][21195] Updated weights for policy 0, policy_version 2870 (0.0007) +[2023-10-08 15:48:35,717][21195] Updated weights for policy 0, policy_version 2880 (0.0007) +[2023-10-08 15:48:37,245][21194] Updated weights for policy 1, policy_version 2850 (0.0007) +[2023-10-08 15:48:37,620][21194] Updated weights for policy 1, policy_version 2860 (0.0009) +[2023-10-08 15:48:37,988][21194] Updated weights for policy 1, policy_version 2870 (0.0010) +[2023-10-08 15:48:38,360][21194] Updated weights for policy 1, policy_version 2880 (0.0007) +[2023-10-08 15:48:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 5898240. Throughput: 0: 1731.2, 1: 1738.6. Samples: 1479546. Policy #0 lag: (min: 31.0, avg: 39.4, max: 63.0) +[2023-10-08 15:48:38,803][19739] Avg episode reward: [(0, '12.940'), (1, '9.480')] +[2023-10-08 15:48:39,652][21195] Updated weights for policy 0, policy_version 2890 (0.0007) +[2023-10-08 15:48:40,023][21195] Updated weights for policy 0, policy_version 2900 (0.0007) +[2023-10-08 15:48:40,401][21195] Updated weights for policy 0, policy_version 2910 (0.0009) +[2023-10-08 15:48:42,018][21194] Updated weights for policy 1, policy_version 2890 (0.0007) +[2023-10-08 15:48:42,387][21194] Updated weights for policy 1, policy_version 2900 (0.0007) +[2023-10-08 15:48:42,753][21194] Updated weights for policy 1, policy_version 2910 (0.0007) +[2023-10-08 15:48:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 5963776. Throughput: 0: 1749.2, 1: 1703.6. Samples: 1499888. Policy #0 lag: (min: 15.0, avg: 21.9, max: 47.0) +[2023-10-08 15:48:43,803][19739] Avg episode reward: [(0, '14.390'), (1, '7.540')] +[2023-10-08 15:48:43,811][20740] Saving new best policy, reward=14.390! +[2023-10-08 15:48:44,433][21195] Updated weights for policy 0, policy_version 2920 (0.0009) +[2023-10-08 15:48:44,814][21195] Updated weights for policy 0, policy_version 2930 (0.0007) +[2023-10-08 15:48:45,187][21195] Updated weights for policy 0, policy_version 2940 (0.0008) +[2023-10-08 15:48:46,708][21194] Updated weights for policy 1, policy_version 2920 (0.0010) +[2023-10-08 15:48:47,087][21194] Updated weights for policy 1, policy_version 2930 (0.0009) +[2023-10-08 15:48:47,449][21194] Updated weights for policy 1, policy_version 2940 (0.0009) +[2023-10-08 15:48:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 6029312. Throughput: 0: 1755.1, 1: 1736.9. Samples: 1516414. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:48:48,803][19739] Avg episode reward: [(0, '12.510'), (1, '8.330')] +[2023-10-08 15:48:48,987][21195] Updated weights for policy 0, policy_version 2950 (0.0008) +[2023-10-08 15:48:49,364][21195] Updated weights for policy 0, policy_version 2960 (0.0007) +[2023-10-08 15:48:49,744][21195] Updated weights for policy 0, policy_version 2970 (0.0008) +[2023-10-08 15:48:51,552][21194] Updated weights for policy 1, policy_version 2950 (0.0009) +[2023-10-08 15:48:51,923][21194] Updated weights for policy 1, policy_version 2960 (0.0007) +[2023-10-08 15:48:52,296][21194] Updated weights for policy 1, policy_version 2970 (0.0008) +[2023-10-08 15:48:53,713][21195] Updated weights for policy 0, policy_version 2980 (0.0011) +[2023-10-08 15:48:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 6094848. Throughput: 0: 1735.3, 1: 1713.2. Samples: 1530896. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:48:53,803][19739] Avg episode reward: [(0, '9.180'), (1, '9.640')] +[2023-10-08 15:48:54,079][21195] Updated weights for policy 0, policy_version 2990 (0.0011) +[2023-10-08 15:48:54,457][21195] Updated weights for policy 0, policy_version 3000 (0.0010) +[2023-10-08 15:48:56,252][21194] Updated weights for policy 1, policy_version 2980 (0.0007) +[2023-10-08 15:48:56,617][21194] Updated weights for policy 1, policy_version 2990 (0.0007) +[2023-10-08 15:48:56,997][21194] Updated weights for policy 1, policy_version 3000 (0.0010) +[2023-10-08 15:48:58,311][21195] Updated weights for policy 0, policy_version 3010 (0.0010) +[2023-10-08 15:48:58,677][21195] Updated weights for policy 0, policy_version 3020 (0.0010) +[2023-10-08 15:48:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 6160384. Throughput: 0: 1753.7, 1: 1698.4. Samples: 1551782. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:48:58,803][19739] Avg episode reward: [(0, '8.750'), (1, '10.750')] +[2023-10-08 15:48:59,045][21195] Updated weights for policy 0, policy_version 3030 (0.0011) +[2023-10-08 15:48:59,420][21195] Updated weights for policy 0, policy_version 3040 (0.0008) +[2023-10-08 15:49:00,981][21194] Updated weights for policy 1, policy_version 3010 (0.0010) +[2023-10-08 15:49:01,363][21194] Updated weights for policy 1, policy_version 3020 (0.0007) +[2023-10-08 15:49:01,728][21194] Updated weights for policy 1, policy_version 3030 (0.0009) +[2023-10-08 15:49:02,098][21194] Updated weights for policy 1, policy_version 3040 (0.0009) +[2023-10-08 15:49:03,307][21195] Updated weights for policy 0, policy_version 3050 (0.0008) +[2023-10-08 15:49:03,675][21195] Updated weights for policy 0, policy_version 3060 (0.0009) +[2023-10-08 15:49:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 6225920. Throughput: 0: 1733.7, 1: 1727.7. Samples: 1567580. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 15:49:03,803][19739] Avg episode reward: [(0, '10.480'), (1, '10.820')] +[2023-10-08 15:49:04,043][21195] Updated weights for policy 0, policy_version 3070 (0.0011) +[2023-10-08 15:49:05,971][21194] Updated weights for policy 1, policy_version 3050 (0.0010) +[2023-10-08 15:49:06,343][21194] Updated weights for policy 1, policy_version 3060 (0.0010) +[2023-10-08 15:49:06,709][21194] Updated weights for policy 1, policy_version 3070 (0.0007) +[2023-10-08 15:49:07,820][21195] Updated weights for policy 0, policy_version 3080 (0.0007) +[2023-10-08 15:49:08,190][21195] Updated weights for policy 0, policy_version 3090 (0.0010) +[2023-10-08 15:49:08,556][21195] Updated weights for policy 0, policy_version 3100 (0.0007) +[2023-10-08 15:49:08,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 6324224. Throughput: 0: 1757.6, 1: 1702.6. Samples: 1582884. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:49:08,804][19739] Avg episode reward: [(0, '10.320'), (1, '9.080')] +[2023-10-08 15:49:10,661][21194] Updated weights for policy 1, policy_version 3080 (0.0008) +[2023-10-08 15:49:11,025][21194] Updated weights for policy 1, policy_version 3090 (0.0008) +[2023-10-08 15:49:11,399][21194] Updated weights for policy 1, policy_version 3100 (0.0007) +[2023-10-08 15:49:12,439][21195] Updated weights for policy 0, policy_version 3110 (0.0007) +[2023-10-08 15:49:12,816][21195] Updated weights for policy 0, policy_version 3120 (0.0008) +[2023-10-08 15:49:13,193][21195] Updated weights for policy 0, policy_version 3130 (0.0008) +[2023-10-08 15:49:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 6389760. Throughput: 0: 1748.1, 1: 1716.8. Samples: 1604008. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 15:49:13,803][19739] Avg episode reward: [(0, '11.550'), (1, '8.160')] +[2023-10-08 15:49:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000003104_3178496.pth... +[2023-10-08 15:49:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000003136_3211264.pth... +[2023-10-08 15:49:13,848][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000001504_1540096.pth +[2023-10-08 15:49:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000001504_1540096.pth +[2023-10-08 15:49:15,322][21194] Updated weights for policy 1, policy_version 3110 (0.0008) +[2023-10-08 15:49:15,686][21194] Updated weights for policy 1, policy_version 3120 (0.0008) +[2023-10-08 15:49:16,050][21194] Updated weights for policy 1, policy_version 3130 (0.0009) +[2023-10-08 15:49:17,032][21195] Updated weights for policy 0, policy_version 3140 (0.0009) +[2023-10-08 15:49:17,407][21195] Updated weights for policy 0, policy_version 3150 (0.0008) +[2023-10-08 15:49:17,772][21195] Updated weights for policy 0, policy_version 3160 (0.0007) +[2023-10-08 15:49:18,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 6455296. Throughput: 0: 1727.7, 1: 1715.7. Samples: 1619200. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 15:49:18,803][19739] Avg episode reward: [(0, '10.400'), (1, '9.920')] +[2023-10-08 15:49:19,945][21194] Updated weights for policy 1, policy_version 3140 (0.0009) +[2023-10-08 15:49:20,310][21194] Updated weights for policy 1, policy_version 3150 (0.0011) +[2023-10-08 15:49:20,680][21194] Updated weights for policy 1, policy_version 3160 (0.0010) +[2023-10-08 15:49:21,693][21195] Updated weights for policy 0, policy_version 3170 (0.0007) +[2023-10-08 15:49:22,069][21195] Updated weights for policy 0, policy_version 3180 (0.0009) +[2023-10-08 15:49:22,447][21195] Updated weights for policy 0, policy_version 3190 (0.0008) +[2023-10-08 15:49:22,815][21195] Updated weights for policy 0, policy_version 3200 (0.0010) +[2023-10-08 15:49:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 6520832. Throughput: 0: 1754.9, 1: 1711.1. Samples: 1635516. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 15:49:23,803][19739] Avg episode reward: [(0, '10.860'), (1, '11.850')] +[2023-10-08 15:49:24,542][21194] Updated weights for policy 1, policy_version 3170 (0.0011) +[2023-10-08 15:49:24,903][21194] Updated weights for policy 1, policy_version 3180 (0.0009) +[2023-10-08 15:49:25,272][21194] Updated weights for policy 1, policy_version 3190 (0.0010) +[2023-10-08 15:49:25,648][21194] Updated weights for policy 1, policy_version 3200 (0.0009) +[2023-10-08 15:49:26,778][21195] Updated weights for policy 0, policy_version 3210 (0.0007) +[2023-10-08 15:49:27,148][21195] Updated weights for policy 0, policy_version 3220 (0.0009) +[2023-10-08 15:49:27,517][21195] Updated weights for policy 0, policy_version 3230 (0.0007) +[2023-10-08 15:49:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 6586368. Throughput: 0: 1725.6, 1: 1744.1. Samples: 1656022. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 15:49:28,803][19739] Avg episode reward: [(0, '12.790'), (1, '13.110')] +[2023-10-08 15:49:28,811][20836] Saving new best policy, reward=13.110! +[2023-10-08 15:49:29,847][21194] Updated weights for policy 1, policy_version 3210 (0.0007) +[2023-10-08 15:49:30,221][21194] Updated weights for policy 1, policy_version 3220 (0.0007) +[2023-10-08 15:49:30,588][21194] Updated weights for policy 1, policy_version 3230 (0.0007) +[2023-10-08 15:49:31,316][21195] Updated weights for policy 0, policy_version 3240 (0.0008) +[2023-10-08 15:49:31,688][21195] Updated weights for policy 0, policy_version 3250 (0.0010) +[2023-10-08 15:49:32,067][21195] Updated weights for policy 0, policy_version 3260 (0.0010) +[2023-10-08 15:49:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 6651904. Throughput: 0: 1736.7, 1: 1706.0. Samples: 1671336. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 15:49:33,803][19739] Avg episode reward: [(0, '14.190'), (1, '11.830')] +[2023-10-08 15:49:34,450][21194] Updated weights for policy 1, policy_version 3240 (0.0007) +[2023-10-08 15:49:34,820][21194] Updated weights for policy 1, policy_version 3250 (0.0012) +[2023-10-08 15:49:35,189][21194] Updated weights for policy 1, policy_version 3260 (0.0009) +[2023-10-08 15:49:35,841][21195] Updated weights for policy 0, policy_version 3270 (0.0009) +[2023-10-08 15:49:36,222][21195] Updated weights for policy 0, policy_version 3280 (0.0007) +[2023-10-08 15:49:36,603][21195] Updated weights for policy 0, policy_version 3290 (0.0008) +[2023-10-08 15:49:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 6717440. Throughput: 0: 1740.0, 1: 1731.5. Samples: 1687112. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 15:49:38,803][19739] Avg episode reward: [(0, '17.040'), (1, '11.100')] +[2023-10-08 15:49:38,804][20740] Saving new best policy, reward=17.040! +[2023-10-08 15:49:39,043][21194] Updated weights for policy 1, policy_version 3270 (0.0009) +[2023-10-08 15:49:39,408][21194] Updated weights for policy 1, policy_version 3280 (0.0010) +[2023-10-08 15:49:39,770][21194] Updated weights for policy 1, policy_version 3290 (0.0010) +[2023-10-08 15:49:40,415][21195] Updated weights for policy 0, policy_version 3300 (0.0009) +[2023-10-08 15:49:40,780][21195] Updated weights for policy 0, policy_version 3310 (0.0009) +[2023-10-08 15:49:41,157][21195] Updated weights for policy 0, policy_version 3320 (0.0008) +[2023-10-08 15:49:43,792][21194] Updated weights for policy 1, policy_version 3300 (0.0008) +[2023-10-08 15:49:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 6782976. Throughput: 0: 1742.5, 1: 1744.5. Samples: 1708698. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 15:49:43,803][19739] Avg episode reward: [(0, '18.980'), (1, '10.120')] +[2023-10-08 15:49:43,810][20740] Saving new best policy, reward=18.980! +[2023-10-08 15:49:44,170][21194] Updated weights for policy 1, policy_version 3310 (0.0009) +[2023-10-08 15:49:44,537][21194] Updated weights for policy 1, policy_version 3320 (0.0009) +[2023-10-08 15:49:45,060][21195] Updated weights for policy 0, policy_version 3330 (0.0007) +[2023-10-08 15:49:45,425][21195] Updated weights for policy 0, policy_version 3340 (0.0009) +[2023-10-08 15:49:45,797][21195] Updated weights for policy 0, policy_version 3350 (0.0007) +[2023-10-08 15:49:46,166][21195] Updated weights for policy 0, policy_version 3360 (0.0007) +[2023-10-08 15:49:48,458][21194] Updated weights for policy 1, policy_version 3330 (0.0009) +[2023-10-08 15:49:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 6848512. Throughput: 0: 1767.0, 1: 1717.2. Samples: 1724372. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 15:49:48,803][19739] Avg episode reward: [(0, '18.520'), (1, '10.380')] +[2023-10-08 15:49:48,822][21194] Updated weights for policy 1, policy_version 3340 (0.0010) +[2023-10-08 15:49:49,181][21194] Updated weights for policy 1, policy_version 3350 (0.0009) +[2023-10-08 15:49:49,551][21194] Updated weights for policy 1, policy_version 3360 (0.0009) +[2023-10-08 15:49:49,982][21195] Updated weights for policy 0, policy_version 3370 (0.0007) +[2023-10-08 15:49:50,359][21195] Updated weights for policy 0, policy_version 3380 (0.0008) +[2023-10-08 15:49:50,735][21195] Updated weights for policy 0, policy_version 3390 (0.0007) +[2023-10-08 15:49:53,405][21194] Updated weights for policy 1, policy_version 3370 (0.0007) +[2023-10-08 15:49:53,771][21194] Updated weights for policy 1, policy_version 3380 (0.0007) +[2023-10-08 15:49:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 6914048. Throughput: 0: 1744.0, 1: 1741.9. Samples: 1739752. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:49:53,804][19739] Avg episode reward: [(0, '15.750'), (1, '10.980')] +[2023-10-08 15:49:54,141][21194] Updated weights for policy 1, policy_version 3390 (0.0009) +[2023-10-08 15:49:54,654][21195] Updated weights for policy 0, policy_version 3400 (0.0009) +[2023-10-08 15:49:55,034][21195] Updated weights for policy 0, policy_version 3410 (0.0009) +[2023-10-08 15:49:55,400][21195] Updated weights for policy 0, policy_version 3420 (0.0009) +[2023-10-08 15:49:58,039][21194] Updated weights for policy 1, policy_version 3400 (0.0010) +[2023-10-08 15:49:58,404][21194] Updated weights for policy 1, policy_version 3410 (0.0009) +[2023-10-08 15:49:58,779][21194] Updated weights for policy 1, policy_version 3420 (0.0007) +[2023-10-08 15:49:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 6979584. Throughput: 0: 1757.9, 1: 1738.9. Samples: 1761360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:49:58,803][19739] Avg episode reward: [(0, '12.550'), (1, '13.990')] +[2023-10-08 15:49:58,926][20836] Saving new best policy, reward=13.990! +[2023-10-08 15:49:59,261][21195] Updated weights for policy 0, policy_version 3430 (0.0009) +[2023-10-08 15:49:59,628][21195] Updated weights for policy 0, policy_version 3440 (0.0008) +[2023-10-08 15:50:00,004][21195] Updated weights for policy 0, policy_version 3450 (0.0008) +[2023-10-08 15:50:02,596][21194] Updated weights for policy 1, policy_version 3430 (0.0009) +[2023-10-08 15:50:02,966][21194] Updated weights for policy 1, policy_version 3440 (0.0009) +[2023-10-08 15:50:03,336][21194] Updated weights for policy 1, policy_version 3450 (0.0009) +[2023-10-08 15:50:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 7077888. Throughput: 0: 1774.4, 1: 1738.0. Samples: 1777258. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:03,804][19739] Avg episode reward: [(0, '12.170'), (1, '14.890')] +[2023-10-08 15:50:03,805][20836] Saving new best policy, reward=14.890! +[2023-10-08 15:50:03,828][21195] Updated weights for policy 0, policy_version 3460 (0.0008) +[2023-10-08 15:50:04,199][21195] Updated weights for policy 0, policy_version 3470 (0.0010) +[2023-10-08 15:50:04,563][21195] Updated weights for policy 0, policy_version 3480 (0.0007) +[2023-10-08 15:50:07,244][21194] Updated weights for policy 1, policy_version 3460 (0.0009) +[2023-10-08 15:50:07,626][21194] Updated weights for policy 1, policy_version 3470 (0.0010) +[2023-10-08 15:50:07,993][21194] Updated weights for policy 1, policy_version 3480 (0.0010) +[2023-10-08 15:50:08,186][21195] Updated weights for policy 0, policy_version 3490 (0.0007) +[2023-10-08 15:50:08,556][21195] Updated weights for policy 0, policy_version 3500 (0.0008) +[2023-10-08 15:50:08,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 7143424. Throughput: 0: 1754.8, 1: 1747.1. Samples: 1793102. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:08,803][19739] Avg episode reward: [(0, '13.760'), (1, '16.090')] +[2023-10-08 15:50:08,804][20836] Saving new best policy, reward=16.090! +[2023-10-08 15:50:08,931][21195] Updated weights for policy 0, policy_version 3510 (0.0010) +[2023-10-08 15:50:09,310][21195] Updated weights for policy 0, policy_version 3520 (0.0008) +[2023-10-08 15:50:11,818][21194] Updated weights for policy 1, policy_version 3490 (0.0009) +[2023-10-08 15:50:12,179][21194] Updated weights for policy 1, policy_version 3500 (0.0007) +[2023-10-08 15:50:12,545][21194] Updated weights for policy 1, policy_version 3510 (0.0011) +[2023-10-08 15:50:12,923][21194] Updated weights for policy 1, policy_version 3520 (0.0009) +[2023-10-08 15:50:13,124][21195] Updated weights for policy 0, policy_version 3530 (0.0007) +[2023-10-08 15:50:13,495][21195] Updated weights for policy 0, policy_version 3540 (0.0008) +[2023-10-08 15:50:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 7208960. Throughput: 0: 1782.5, 1: 1710.4. Samples: 1813202. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:13,803][19739] Avg episode reward: [(0, '14.500'), (1, '14.090')] +[2023-10-08 15:50:13,863][21195] Updated weights for policy 0, policy_version 3550 (0.0008) +[2023-10-08 15:50:17,076][21194] Updated weights for policy 1, policy_version 3530 (0.0007) +[2023-10-08 15:50:17,444][21194] Updated weights for policy 1, policy_version 3540 (0.0007) +[2023-10-08 15:50:17,706][21195] Updated weights for policy 0, policy_version 3560 (0.0008) +[2023-10-08 15:50:17,805][21194] Updated weights for policy 1, policy_version 3550 (0.0008) +[2023-10-08 15:50:18,069][21195] Updated weights for policy 0, policy_version 3570 (0.0009) +[2023-10-08 15:50:18,450][21195] Updated weights for policy 0, policy_version 3580 (0.0010) +[2023-10-08 15:50:18,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 7307264. Throughput: 0: 1750.0, 1: 1747.9. Samples: 1828742. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:18,803][19739] Avg episode reward: [(0, '14.060'), (1, '11.340')] +[2023-10-08 15:50:21,571][21194] Updated weights for policy 1, policy_version 3560 (0.0008) +[2023-10-08 15:50:21,932][21194] Updated weights for policy 1, policy_version 3570 (0.0010) +[2023-10-08 15:50:22,255][21195] Updated weights for policy 0, policy_version 3590 (0.0007) +[2023-10-08 15:50:22,295][21194] Updated weights for policy 1, policy_version 3580 (0.0008) +[2023-10-08 15:50:22,626][21195] Updated weights for policy 0, policy_version 3600 (0.0010) +[2023-10-08 15:50:22,998][21195] Updated weights for policy 0, policy_version 3610 (0.0007) +[2023-10-08 15:50:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 7372800. Throughput: 0: 1780.3, 1: 1724.6. Samples: 1844830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:23,803][19739] Avg episode reward: [(0, '18.480'), (1, '9.390')] +[2023-10-08 15:50:26,268][21194] Updated weights for policy 1, policy_version 3590 (0.0009) +[2023-10-08 15:50:26,640][21194] Updated weights for policy 1, policy_version 3600 (0.0010) +[2023-10-08 15:50:26,901][21195] Updated weights for policy 0, policy_version 3620 (0.0007) +[2023-10-08 15:50:27,011][21194] Updated weights for policy 1, policy_version 3610 (0.0009) +[2023-10-08 15:50:27,278][21195] Updated weights for policy 0, policy_version 3630 (0.0007) +[2023-10-08 15:50:27,649][21195] Updated weights for policy 0, policy_version 3640 (0.0010) +[2023-10-08 15:50:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 7438336. Throughput: 0: 1753.7, 1: 1715.2. Samples: 1864796. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:28,803][19739] Avg episode reward: [(0, '19.320'), (1, '9.930')] +[2023-10-08 15:50:28,811][20740] Saving new best policy, reward=19.320! +[2023-10-08 15:50:30,875][21194] Updated weights for policy 1, policy_version 3620 (0.0008) +[2023-10-08 15:50:31,241][21194] Updated weights for policy 1, policy_version 3630 (0.0010) +[2023-10-08 15:50:31,517][21195] Updated weights for policy 0, policy_version 3650 (0.0008) +[2023-10-08 15:50:31,607][21194] Updated weights for policy 1, policy_version 3640 (0.0008) +[2023-10-08 15:50:31,890][21195] Updated weights for policy 0, policy_version 3660 (0.0009) +[2023-10-08 15:50:32,262][21195] Updated weights for policy 0, policy_version 3670 (0.0008) +[2023-10-08 15:50:32,643][21195] Updated weights for policy 0, policy_version 3680 (0.0007) +[2023-10-08 15:50:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 7503872. Throughput: 0: 1741.5, 1: 1739.2. Samples: 1881000. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:33,803][19739] Avg episode reward: [(0, '21.630'), (1, '9.710')] +[2023-10-08 15:50:33,804][20740] Saving new best policy, reward=21.630! +[2023-10-08 15:50:35,668][21194] Updated weights for policy 1, policy_version 3650 (0.0009) +[2023-10-08 15:50:36,045][21194] Updated weights for policy 1, policy_version 3660 (0.0010) +[2023-10-08 15:50:36,422][21194] Updated weights for policy 1, policy_version 3670 (0.0009) +[2023-10-08 15:50:36,697][21195] Updated weights for policy 0, policy_version 3690 (0.0008) +[2023-10-08 15:50:36,786][21194] Updated weights for policy 1, policy_version 3680 (0.0009) +[2023-10-08 15:50:37,067][21195] Updated weights for policy 0, policy_version 3700 (0.0008) +[2023-10-08 15:50:37,443][21195] Updated weights for policy 0, policy_version 3710 (0.0010) +[2023-10-08 15:50:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 7569408. Throughput: 0: 1760.2, 1: 1714.0. Samples: 1896090. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:38,803][19739] Avg episode reward: [(0, '23.920'), (1, '12.290')] +[2023-10-08 15:50:38,804][20740] Saving new best policy, reward=23.920! +[2023-10-08 15:50:40,689][21194] Updated weights for policy 1, policy_version 3690 (0.0007) +[2023-10-08 15:50:41,064][21194] Updated weights for policy 1, policy_version 3700 (0.0007) +[2023-10-08 15:50:41,429][21194] Updated weights for policy 1, policy_version 3710 (0.0009) +[2023-10-08 15:50:41,491][21195] Updated weights for policy 0, policy_version 3720 (0.0007) +[2023-10-08 15:50:41,854][21195] Updated weights for policy 0, policy_version 3730 (0.0010) +[2023-10-08 15:50:42,230][21195] Updated weights for policy 0, policy_version 3740 (0.0008) +[2023-10-08 15:50:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 7634944. Throughput: 0: 1738.1, 1: 1715.5. Samples: 1916772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:50:43,803][19739] Avg episode reward: [(0, '24.630'), (1, '12.850')] +[2023-10-08 15:50:43,813][20740] Saving new best policy, reward=24.630! +[2023-10-08 15:50:45,374][21194] Updated weights for policy 1, policy_version 3720 (0.0008) +[2023-10-08 15:50:45,742][21194] Updated weights for policy 1, policy_version 3730 (0.0011) +[2023-10-08 15:50:45,962][21195] Updated weights for policy 0, policy_version 3750 (0.0009) +[2023-10-08 15:50:46,104][21194] Updated weights for policy 1, policy_version 3740 (0.0009) +[2023-10-08 15:50:46,337][21195] Updated weights for policy 0, policy_version 3760 (0.0008) +[2023-10-08 15:50:46,712][21195] Updated weights for policy 0, policy_version 3770 (0.0009) +[2023-10-08 15:50:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 7700480. Throughput: 0: 1738.7, 1: 1714.3. Samples: 1932640. Policy #0 lag: (min: 16.0, avg: 37.4, max: 48.0) +[2023-10-08 15:50:48,803][19739] Avg episode reward: [(0, '26.080'), (1, '13.940')] +[2023-10-08 15:50:48,804][20740] Saving new best policy, reward=26.080! +[2023-10-08 15:50:50,200][21194] Updated weights for policy 1, policy_version 3750 (0.0008) +[2023-10-08 15:50:50,560][21194] Updated weights for policy 1, policy_version 3760 (0.0010) +[2023-10-08 15:50:50,599][21195] Updated weights for policy 0, policy_version 3780 (0.0008) +[2023-10-08 15:50:50,930][21194] Updated weights for policy 1, policy_version 3770 (0.0009) +[2023-10-08 15:50:50,967][21195] Updated weights for policy 0, policy_version 3790 (0.0008) +[2023-10-08 15:50:51,340][21195] Updated weights for policy 0, policy_version 3800 (0.0007) +[2023-10-08 15:50:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 7766016. Throughput: 0: 1732.0, 1: 1701.9. Samples: 1947626. Policy #0 lag: (min: 16.0, avg: 37.4, max: 48.0) +[2023-10-08 15:50:53,803][19739] Avg episode reward: [(0, '24.070'), (1, '15.190')] +[2023-10-08 15:50:54,886][21194] Updated weights for policy 1, policy_version 3780 (0.0009) +[2023-10-08 15:50:55,170][21195] Updated weights for policy 0, policy_version 3810 (0.0009) +[2023-10-08 15:50:55,248][21194] Updated weights for policy 1, policy_version 3790 (0.0008) +[2023-10-08 15:50:55,540][21195] Updated weights for policy 0, policy_version 3820 (0.0008) +[2023-10-08 15:50:55,617][21194] Updated weights for policy 1, policy_version 3800 (0.0008) +[2023-10-08 15:50:55,906][21195] Updated weights for policy 0, policy_version 3830 (0.0007) +[2023-10-08 15:50:56,277][21195] Updated weights for policy 0, policy_version 3840 (0.0007) +[2023-10-08 15:50:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 7831552. Throughput: 0: 1733.0, 1: 1737.5. Samples: 1969374. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 15:50:58,803][19739] Avg episode reward: [(0, '21.450'), (1, '13.060')] +[2023-10-08 15:50:59,616][21194] Updated weights for policy 1, policy_version 3810 (0.0008) +[2023-10-08 15:50:59,984][21194] Updated weights for policy 1, policy_version 3820 (0.0007) +[2023-10-08 15:51:00,086][21195] Updated weights for policy 0, policy_version 3850 (0.0007) +[2023-10-08 15:51:00,355][21194] Updated weights for policy 1, policy_version 3830 (0.0009) +[2023-10-08 15:51:00,456][21195] Updated weights for policy 0, policy_version 3860 (0.0008) +[2023-10-08 15:51:00,718][21194] Updated weights for policy 1, policy_version 3840 (0.0008) +[2023-10-08 15:51:00,836][21195] Updated weights for policy 0, policy_version 3870 (0.0008) +[2023-10-08 15:51:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 7897088. Throughput: 0: 1761.6, 1: 1705.7. Samples: 1984772. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 15:51:03,803][19739] Avg episode reward: [(0, '13.560'), (1, '14.230')] +[2023-10-08 15:51:04,776][21194] Updated weights for policy 1, policy_version 3850 (0.0009) +[2023-10-08 15:51:04,788][21195] Updated weights for policy 0, policy_version 3880 (0.0008) +[2023-10-08 15:51:05,145][21194] Updated weights for policy 1, policy_version 3860 (0.0008) +[2023-10-08 15:51:05,159][21195] Updated weights for policy 0, policy_version 3890 (0.0007) +[2023-10-08 15:51:05,514][21194] Updated weights for policy 1, policy_version 3870 (0.0008) +[2023-10-08 15:51:05,531][21195] Updated weights for policy 0, policy_version 3900 (0.0009) +[2023-10-08 15:51:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 7962624. Throughput: 0: 1726.7, 1: 1717.4. Samples: 1999816. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 15:51:08,803][19739] Avg episode reward: [(0, '14.670'), (1, '13.750')] +[2023-10-08 15:51:09,409][21195] Updated weights for policy 0, policy_version 3910 (0.0008) +[2023-10-08 15:51:09,416][21194] Updated weights for policy 1, policy_version 3880 (0.0009) +[2023-10-08 15:51:09,779][21194] Updated weights for policy 1, policy_version 3890 (0.0008) +[2023-10-08 15:51:09,783][21195] Updated weights for policy 0, policy_version 3920 (0.0007) +[2023-10-08 15:51:10,150][21194] Updated weights for policy 1, policy_version 3900 (0.0009) +[2023-10-08 15:51:10,152][21195] Updated weights for policy 0, policy_version 3930 (0.0008) +[2023-10-08 15:51:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 8028160. Throughput: 0: 1755.2, 1: 1731.6. Samples: 2021702. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 15:51:13,803][19739] Avg episode reward: [(0, '15.680'), (1, '14.280')] +[2023-10-08 15:51:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000003936_4030464.pth... +[2023-10-08 15:51:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000002304_2359296.pth +[2023-10-08 15:51:14,068][21194] Updated weights for policy 1, policy_version 3910 (0.0008) +[2023-10-08 15:51:14,140][21195] Updated weights for policy 0, policy_version 3940 (0.0008) +[2023-10-08 15:51:14,431][21194] Updated weights for policy 1, policy_version 3920 (0.0009) +[2023-10-08 15:51:14,503][21195] Updated weights for policy 0, policy_version 3950 (0.0009) +[2023-10-08 15:51:14,796][21194] Updated weights for policy 1, policy_version 3930 (0.0009) +[2023-10-08 15:51:14,872][21195] Updated weights for policy 0, policy_version 3960 (0.0008) +[2023-10-08 15:51:15,016][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000003936_4030464.pth... +[2023-10-08 15:51:15,056][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000002304_2359296.pth +[2023-10-08 15:51:18,660][21194] Updated weights for policy 1, policy_version 3940 (0.0008) +[2023-10-08 15:51:18,691][21195] Updated weights for policy 0, policy_version 3970 (0.0009) +[2023-10-08 15:51:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13884.8). Total num frames: 8093696. Throughput: 0: 1763.5, 1: 1706.8. Samples: 2037164. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 15:51:18,803][19739] Avg episode reward: [(0, '14.970'), (1, '14.280')] +[2023-10-08 15:51:19,019][21194] Updated weights for policy 1, policy_version 3950 (0.0008) +[2023-10-08 15:51:19,054][21195] Updated weights for policy 0, policy_version 3980 (0.0009) +[2023-10-08 15:51:19,389][21194] Updated weights for policy 1, policy_version 3960 (0.0008) +[2023-10-08 15:51:19,425][21195] Updated weights for policy 0, policy_version 3990 (0.0007) +[2023-10-08 15:51:19,803][21195] Updated weights for policy 0, policy_version 4000 (0.0008) +[2023-10-08 15:51:23,477][21194] Updated weights for policy 1, policy_version 3970 (0.0007) +[2023-10-08 15:51:23,558][21195] Updated weights for policy 0, policy_version 4010 (0.0007) +[2023-10-08 15:51:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 8159232. Throughput: 0: 1752.5, 1: 1729.1. Samples: 2052762. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 15:51:23,803][19739] Avg episode reward: [(0, '16.330'), (1, '17.530')] +[2023-10-08 15:51:23,849][21194] Updated weights for policy 1, policy_version 3980 (0.0009) +[2023-10-08 15:51:23,933][21195] Updated weights for policy 0, policy_version 4020 (0.0007) +[2023-10-08 15:51:24,220][21194] Updated weights for policy 1, policy_version 3990 (0.0008) +[2023-10-08 15:51:24,312][21195] Updated weights for policy 0, policy_version 4030 (0.0007) +[2023-10-08 15:51:24,582][20836] Saving new best policy, reward=17.530! +[2023-10-08 15:51:24,585][21194] Updated weights for policy 1, policy_version 4000 (0.0007) +[2023-10-08 15:51:28,021][21195] Updated weights for policy 0, policy_version 4040 (0.0009) +[2023-10-08 15:51:28,390][21194] Updated weights for policy 1, policy_version 4010 (0.0007) +[2023-10-08 15:51:28,396][21195] Updated weights for policy 0, policy_version 4050 (0.0008) +[2023-10-08 15:51:28,758][21194] Updated weights for policy 1, policy_version 4020 (0.0007) +[2023-10-08 15:51:28,768][21195] Updated weights for policy 0, policy_version 4060 (0.0010) +[2023-10-08 15:51:28,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 8224768. Throughput: 0: 1777.5, 1: 1731.3. Samples: 2074666. Policy #0 lag: (min: 31.0, avg: 32.5, max: 58.0) +[2023-10-08 15:51:28,804][19739] Avg episode reward: [(0, '20.070'), (1, '18.980')] +[2023-10-08 15:51:29,123][21194] Updated weights for policy 1, policy_version 4030 (0.0010) +[2023-10-08 15:51:29,198][20836] Saving new best policy, reward=18.980! +[2023-10-08 15:51:32,602][21195] Updated weights for policy 0, policy_version 4070 (0.0009) +[2023-10-08 15:51:32,973][21195] Updated weights for policy 0, policy_version 4080 (0.0007) +[2023-10-08 15:51:33,161][21194] Updated weights for policy 1, policy_version 4040 (0.0008) +[2023-10-08 15:51:33,334][21195] Updated weights for policy 0, policy_version 4090 (0.0007) +[2023-10-08 15:51:33,527][21194] Updated weights for policy 1, policy_version 4050 (0.0007) +[2023-10-08 15:51:33,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 8323072. Throughput: 0: 1747.9, 1: 1727.4. Samples: 2089028. Policy #0 lag: (min: 2.0, avg: 2.2, max: 10.0) +[2023-10-08 15:51:33,803][19739] Avg episode reward: [(0, '20.480'), (1, '21.150')] +[2023-10-08 15:51:33,891][21194] Updated weights for policy 1, policy_version 4060 (0.0007) +[2023-10-08 15:51:34,036][20836] Saving new best policy, reward=21.150! +[2023-10-08 15:51:37,108][21195] Updated weights for policy 0, policy_version 4100 (0.0008) +[2023-10-08 15:51:37,479][21195] Updated weights for policy 0, policy_version 4110 (0.0008) +[2023-10-08 15:51:37,849][21195] Updated weights for policy 0, policy_version 4120 (0.0008) +[2023-10-08 15:51:37,896][21194] Updated weights for policy 1, policy_version 4070 (0.0007) +[2023-10-08 15:51:38,258][21194] Updated weights for policy 1, policy_version 4080 (0.0007) +[2023-10-08 15:51:38,633][21194] Updated weights for policy 1, policy_version 4090 (0.0007) +[2023-10-08 15:51:38,803][19739] Fps is (10 sec: 16384.6, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 8388608. Throughput: 0: 1781.8, 1: 1731.4. Samples: 2105718. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 15:51:38,803][19739] Avg episode reward: [(0, '20.030'), (1, '22.290')] +[2023-10-08 15:51:38,848][20836] Saving new best policy, reward=22.290! +[2023-10-08 15:51:41,506][21195] Updated weights for policy 0, policy_version 4130 (0.0008) +[2023-10-08 15:51:41,872][21195] Updated weights for policy 0, policy_version 4140 (0.0009) +[2023-10-08 15:51:42,247][21195] Updated weights for policy 0, policy_version 4150 (0.0008) +[2023-10-08 15:51:42,531][21194] Updated weights for policy 1, policy_version 4100 (0.0008) +[2023-10-08 15:51:42,615][21195] Updated weights for policy 0, policy_version 4160 (0.0009) +[2023-10-08 15:51:42,902][21194] Updated weights for policy 1, policy_version 4110 (0.0007) +[2023-10-08 15:51:43,277][21194] Updated weights for policy 1, policy_version 4120 (0.0008) +[2023-10-08 15:51:43,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 8486912. Throughput: 0: 1753.2, 1: 1712.5. Samples: 2125334. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 15:51:43,803][19739] Avg episode reward: [(0, '19.420'), (1, '23.380')] +[2023-10-08 15:51:43,812][20836] Saving new best policy, reward=23.380! +[2023-10-08 15:51:46,427][21195] Updated weights for policy 0, policy_version 4170 (0.0007) +[2023-10-08 15:51:46,795][21195] Updated weights for policy 0, policy_version 4180 (0.0008) +[2023-10-08 15:51:47,174][21195] Updated weights for policy 0, policy_version 4190 (0.0008) +[2023-10-08 15:51:47,281][21194] Updated weights for policy 1, policy_version 4130 (0.0008) +[2023-10-08 15:51:47,646][21194] Updated weights for policy 1, policy_version 4140 (0.0007) +[2023-10-08 15:51:48,017][21194] Updated weights for policy 1, policy_version 4150 (0.0008) +[2023-10-08 15:51:48,379][21194] Updated weights for policy 1, policy_version 4160 (0.0009) +[2023-10-08 15:51:48,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 8552448. Throughput: 0: 1757.8, 1: 1729.6. Samples: 2141704. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:51:48,803][19739] Avg episode reward: [(0, '20.910'), (1, '23.840')] +[2023-10-08 15:51:48,804][20836] Saving new best policy, reward=23.840! +[2023-10-08 15:51:51,042][21195] Updated weights for policy 0, policy_version 4200 (0.0008) +[2023-10-08 15:51:51,417][21195] Updated weights for policy 0, policy_version 4210 (0.0009) +[2023-10-08 15:51:51,795][21195] Updated weights for policy 0, policy_version 4220 (0.0010) +[2023-10-08 15:51:52,294][21194] Updated weights for policy 1, policy_version 4170 (0.0008) +[2023-10-08 15:51:52,667][21194] Updated weights for policy 1, policy_version 4180 (0.0009) +[2023-10-08 15:51:53,038][21194] Updated weights for policy 1, policy_version 4190 (0.0010) +[2023-10-08 15:51:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 8617984. Throughput: 0: 1762.4, 1: 1734.8. Samples: 2157188. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:51:53,804][19739] Avg episode reward: [(0, '19.330'), (1, '25.890')] +[2023-10-08 15:51:53,805][20836] Saving new best policy, reward=25.890! +[2023-10-08 15:51:55,723][21195] Updated weights for policy 0, policy_version 4230 (0.0009) +[2023-10-08 15:51:56,110][21195] Updated weights for policy 0, policy_version 4240 (0.0009) +[2023-10-08 15:51:56,482][21195] Updated weights for policy 0, policy_version 4250 (0.0010) +[2023-10-08 15:51:57,113][21194] Updated weights for policy 1, policy_version 4200 (0.0011) +[2023-10-08 15:51:57,491][21194] Updated weights for policy 1, policy_version 4210 (0.0010) +[2023-10-08 15:51:57,851][21194] Updated weights for policy 1, policy_version 4220 (0.0010) +[2023-10-08 15:51:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 8683520. Throughput: 0: 1758.3, 1: 1700.0. Samples: 2177326. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:51:58,803][19739] Avg episode reward: [(0, '20.360'), (1, '21.740')] +[2023-10-08 15:52:00,476][21195] Updated weights for policy 0, policy_version 4260 (0.0009) +[2023-10-08 15:52:00,843][21195] Updated weights for policy 0, policy_version 4270 (0.0008) +[2023-10-08 15:52:01,217][21195] Updated weights for policy 0, policy_version 4280 (0.0007) +[2023-10-08 15:52:01,897][21194] Updated weights for policy 1, policy_version 4230 (0.0009) +[2023-10-08 15:52:02,265][21194] Updated weights for policy 1, policy_version 4240 (0.0009) +[2023-10-08 15:52:02,627][21194] Updated weights for policy 1, policy_version 4250 (0.0007) +[2023-10-08 15:52:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 8749056. Throughput: 0: 1760.1, 1: 1730.5. Samples: 2194242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:52:03,803][19739] Avg episode reward: [(0, '18.540'), (1, '20.980')] +[2023-10-08 15:52:05,091][21195] Updated weights for policy 0, policy_version 4290 (0.0009) +[2023-10-08 15:52:05,455][21195] Updated weights for policy 0, policy_version 4300 (0.0007) +[2023-10-08 15:52:05,827][21195] Updated weights for policy 0, policy_version 4310 (0.0008) +[2023-10-08 15:52:06,202][21195] Updated weights for policy 0, policy_version 4320 (0.0008) +[2023-10-08 15:52:06,587][21194] Updated weights for policy 1, policy_version 4260 (0.0007) +[2023-10-08 15:52:06,957][21194] Updated weights for policy 1, policy_version 4270 (0.0007) +[2023-10-08 15:52:07,323][21194] Updated weights for policy 1, policy_version 4280 (0.0008) +[2023-10-08 15:52:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 8814592. Throughput: 0: 1752.4, 1: 1720.1. Samples: 2209022. Policy #0 lag: (min: 11.0, avg: 30.6, max: 32.0) +[2023-10-08 15:52:08,803][19739] Avg episode reward: [(0, '19.790'), (1, '21.070')] +[2023-10-08 15:52:09,832][21195] Updated weights for policy 0, policy_version 4330 (0.0007) +[2023-10-08 15:52:10,206][21195] Updated weights for policy 0, policy_version 4340 (0.0007) +[2023-10-08 15:52:10,572][21195] Updated weights for policy 0, policy_version 4350 (0.0009) +[2023-10-08 15:52:11,237][21194] Updated weights for policy 1, policy_version 4290 (0.0008) +[2023-10-08 15:52:11,600][21194] Updated weights for policy 1, policy_version 4300 (0.0009) +[2023-10-08 15:52:11,974][21194] Updated weights for policy 1, policy_version 4310 (0.0010) +[2023-10-08 15:52:12,338][21194] Updated weights for policy 1, policy_version 4320 (0.0008) +[2023-10-08 15:52:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 8880128. Throughput: 0: 1753.5, 1: 1703.2. Samples: 2230214. Policy #0 lag: (min: 11.0, avg: 30.6, max: 32.0) +[2023-10-08 15:52:13,803][19739] Avg episode reward: [(0, '19.710'), (1, '20.220')] +[2023-10-08 15:52:14,382][21195] Updated weights for policy 0, policy_version 4360 (0.0010) +[2023-10-08 15:52:14,761][21195] Updated weights for policy 0, policy_version 4370 (0.0008) +[2023-10-08 15:52:15,130][21195] Updated weights for policy 0, policy_version 4380 (0.0010) +[2023-10-08 15:52:16,333][21194] Updated weights for policy 1, policy_version 4330 (0.0009) +[2023-10-08 15:52:16,708][21194] Updated weights for policy 1, policy_version 4340 (0.0008) +[2023-10-08 15:52:17,078][21194] Updated weights for policy 1, policy_version 4350 (0.0008) +[2023-10-08 15:52:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 8945664. Throughput: 0: 1781.6, 1: 1728.4. Samples: 2246978. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 15:52:18,803][19739] Avg episode reward: [(0, '19.080'), (1, '20.920')] +[2023-10-08 15:52:18,882][21195] Updated weights for policy 0, policy_version 4390 (0.0009) +[2023-10-08 15:52:19,260][21195] Updated weights for policy 0, policy_version 4400 (0.0008) +[2023-10-08 15:52:19,641][21195] Updated weights for policy 0, policy_version 4410 (0.0010) +[2023-10-08 15:52:20,880][21194] Updated weights for policy 1, policy_version 4360 (0.0011) +[2023-10-08 15:52:21,249][21194] Updated weights for policy 1, policy_version 4370 (0.0007) +[2023-10-08 15:52:21,616][21194] Updated weights for policy 1, policy_version 4380 (0.0009) +[2023-10-08 15:52:23,471][21195] Updated weights for policy 0, policy_version 4420 (0.0008) +[2023-10-08 15:52:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 9011200. Throughput: 0: 1752.0, 1: 1703.8. Samples: 2261230. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 15:52:23,803][19739] Avg episode reward: [(0, '18.690'), (1, '20.610')] +[2023-10-08 15:52:23,845][21195] Updated weights for policy 0, policy_version 4430 (0.0009) +[2023-10-08 15:52:24,223][21195] Updated weights for policy 0, policy_version 4440 (0.0010) +[2023-10-08 15:52:25,423][21194] Updated weights for policy 1, policy_version 4390 (0.0010) +[2023-10-08 15:52:25,786][21194] Updated weights for policy 1, policy_version 4400 (0.0010) +[2023-10-08 15:52:26,153][21194] Updated weights for policy 1, policy_version 4410 (0.0009) +[2023-10-08 15:52:28,144][21195] Updated weights for policy 0, policy_version 4450 (0.0009) +[2023-10-08 15:52:28,509][21195] Updated weights for policy 0, policy_version 4460 (0.0007) +[2023-10-08 15:52:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 9076736. Throughput: 0: 1782.4, 1: 1716.5. Samples: 2282782. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:52:28,803][19739] Avg episode reward: [(0, '20.180'), (1, '24.470')] +[2023-10-08 15:52:28,882][21195] Updated weights for policy 0, policy_version 4470 (0.0007) +[2023-10-08 15:52:29,258][21195] Updated weights for policy 0, policy_version 4480 (0.0007) +[2023-10-08 15:52:30,303][21194] Updated weights for policy 1, policy_version 4420 (0.0010) +[2023-10-08 15:52:30,655][21194] Updated weights for policy 1, policy_version 4430 (0.0009) +[2023-10-08 15:52:31,024][21194] Updated weights for policy 1, policy_version 4440 (0.0008) +[2023-10-08 15:52:33,133][21195] Updated weights for policy 0, policy_version 4490 (0.0008) +[2023-10-08 15:52:33,504][21195] Updated weights for policy 0, policy_version 4500 (0.0009) +[2023-10-08 15:52:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 9142272. Throughput: 0: 1756.7, 1: 1710.4. Samples: 2297722. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:52:33,803][19739] Avg episode reward: [(0, '18.440'), (1, '24.130')] +[2023-10-08 15:52:33,871][21195] Updated weights for policy 0, policy_version 4510 (0.0009) +[2023-10-08 15:52:34,965][21194] Updated weights for policy 1, policy_version 4450 (0.0008) +[2023-10-08 15:52:35,334][21194] Updated weights for policy 1, policy_version 4460 (0.0008) +[2023-10-08 15:52:35,689][21194] Updated weights for policy 1, policy_version 4470 (0.0009) +[2023-10-08 15:52:36,065][21194] Updated weights for policy 1, policy_version 4480 (0.0008) +[2023-10-08 15:52:37,763][21195] Updated weights for policy 0, policy_version 4520 (0.0009) +[2023-10-08 15:52:38,139][21195] Updated weights for policy 0, policy_version 4530 (0.0007) +[2023-10-08 15:52:38,511][21195] Updated weights for policy 0, policy_version 4540 (0.0009) +[2023-10-08 15:52:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13995.8). Total num frames: 9240576. Throughput: 0: 1780.5, 1: 1701.2. Samples: 2313866. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:52:38,803][19739] Avg episode reward: [(0, '17.580'), (1, '23.950')] +[2023-10-08 15:52:40,273][21194] Updated weights for policy 1, policy_version 4490 (0.0007) +[2023-10-08 15:52:40,639][21194] Updated weights for policy 1, policy_version 4500 (0.0008) +[2023-10-08 15:52:41,007][21194] Updated weights for policy 1, policy_version 4510 (0.0008) +[2023-10-08 15:52:42,252][21195] Updated weights for policy 0, policy_version 4550 (0.0007) +[2023-10-08 15:52:42,638][21195] Updated weights for policy 0, policy_version 4560 (0.0007) +[2023-10-08 15:52:43,022][21195] Updated weights for policy 0, policy_version 4570 (0.0009) +[2023-10-08 15:52:43,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13995.8). Total num frames: 9306112. Throughput: 0: 1766.0, 1: 1725.6. Samples: 2334448. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 15:52:43,803][19739] Avg episode reward: [(0, '19.200'), (1, '22.360')] +[2023-10-08 15:52:44,966][21194] Updated weights for policy 1, policy_version 4520 (0.0007) +[2023-10-08 15:52:45,327][21194] Updated weights for policy 1, policy_version 4530 (0.0009) +[2023-10-08 15:52:45,693][21194] Updated weights for policy 1, policy_version 4540 (0.0011) +[2023-10-08 15:52:46,893][21195] Updated weights for policy 0, policy_version 4580 (0.0008) +[2023-10-08 15:52:47,262][21195] Updated weights for policy 0, policy_version 4590 (0.0010) +[2023-10-08 15:52:47,645][21195] Updated weights for policy 0, policy_version 4600 (0.0009) +[2023-10-08 15:52:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 9371648. Throughput: 0: 1751.8, 1: 1692.8. Samples: 2349248. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 15:52:48,803][19739] Avg episode reward: [(0, '19.090'), (1, '24.360')] +[2023-10-08 15:52:49,518][21194] Updated weights for policy 1, policy_version 4550 (0.0010) +[2023-10-08 15:52:49,882][21194] Updated weights for policy 1, policy_version 4560 (0.0010) +[2023-10-08 15:52:50,252][21194] Updated weights for policy 1, policy_version 4570 (0.0009) +[2023-10-08 15:52:51,531][21195] Updated weights for policy 0, policy_version 4610 (0.0008) +[2023-10-08 15:52:51,916][21195] Updated weights for policy 0, policy_version 4620 (0.0009) +[2023-10-08 15:52:52,294][21195] Updated weights for policy 0, policy_version 4630 (0.0011) +[2023-10-08 15:52:52,658][21195] Updated weights for policy 0, policy_version 4640 (0.0008) +[2023-10-08 15:52:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 9437184. Throughput: 0: 1775.2, 1: 1712.0. Samples: 2365942. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 15:52:53,803][19739] Avg episode reward: [(0, '17.590'), (1, '24.140')] +[2023-10-08 15:52:54,296][21194] Updated weights for policy 1, policy_version 4580 (0.0010) +[2023-10-08 15:52:54,673][21194] Updated weights for policy 1, policy_version 4590 (0.0008) +[2023-10-08 15:52:55,037][21194] Updated weights for policy 1, policy_version 4600 (0.0009) +[2023-10-08 15:52:56,586][21195] Updated weights for policy 0, policy_version 4650 (0.0008) +[2023-10-08 15:52:56,960][21195] Updated weights for policy 0, policy_version 4660 (0.0008) +[2023-10-08 15:52:57,335][21195] Updated weights for policy 0, policy_version 4670 (0.0008) +[2023-10-08 15:52:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 9502720. Throughput: 0: 1745.4, 1: 1725.3. Samples: 2386396. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 15:52:58,804][19739] Avg episode reward: [(0, '19.710'), (1, '22.470')] +[2023-10-08 15:52:58,892][21194] Updated weights for policy 1, policy_version 4610 (0.0009) +[2023-10-08 15:52:59,257][21194] Updated weights for policy 1, policy_version 4620 (0.0008) +[2023-10-08 15:52:59,634][21194] Updated weights for policy 1, policy_version 4630 (0.0009) +[2023-10-08 15:53:00,012][21194] Updated weights for policy 1, policy_version 4640 (0.0008) +[2023-10-08 15:53:01,133][21195] Updated weights for policy 0, policy_version 4680 (0.0009) +[2023-10-08 15:53:01,505][21195] Updated weights for policy 0, policy_version 4690 (0.0009) +[2023-10-08 15:53:01,888][21195] Updated weights for policy 0, policy_version 4700 (0.0008) +[2023-10-08 15:53:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 9568256. Throughput: 0: 1749.0, 1: 1697.3. Samples: 2402062. Policy #0 lag: (min: 31.0, avg: 31.7, max: 50.0) +[2023-10-08 15:53:03,803][19739] Avg episode reward: [(0, '20.590'), (1, '24.600')] +[2023-10-08 15:53:03,882][21194] Updated weights for policy 1, policy_version 4650 (0.0009) +[2023-10-08 15:53:04,256][21194] Updated weights for policy 1, policy_version 4660 (0.0007) +[2023-10-08 15:53:04,618][21194] Updated weights for policy 1, policy_version 4670 (0.0007) +[2023-10-08 15:53:05,499][21195] Updated weights for policy 0, policy_version 4710 (0.0010) +[2023-10-08 15:53:05,869][21195] Updated weights for policy 0, policy_version 4720 (0.0009) +[2023-10-08 15:53:06,248][21195] Updated weights for policy 0, policy_version 4730 (0.0008) +[2023-10-08 15:53:08,615][21194] Updated weights for policy 1, policy_version 4680 (0.0008) +[2023-10-08 15:53:08,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 9633792. Throughput: 0: 1747.2, 1: 1727.1. Samples: 2417572. Policy #0 lag: (min: 31.0, avg: 31.7, max: 50.0) +[2023-10-08 15:53:08,803][19739] Avg episode reward: [(0, '20.930'), (1, '24.870')] +[2023-10-08 15:53:08,990][21194] Updated weights for policy 1, policy_version 4690 (0.0009) +[2023-10-08 15:53:09,363][21194] Updated weights for policy 1, policy_version 4700 (0.0007) +[2023-10-08 15:53:10,148][21195] Updated weights for policy 0, policy_version 4740 (0.0008) +[2023-10-08 15:53:10,518][21195] Updated weights for policy 0, policy_version 4750 (0.0010) +[2023-10-08 15:53:10,890][21195] Updated weights for policy 0, policy_version 4760 (0.0009) +[2023-10-08 15:53:13,349][21194] Updated weights for policy 1, policy_version 4710 (0.0008) +[2023-10-08 15:53:13,707][21194] Updated weights for policy 1, policy_version 4720 (0.0010) +[2023-10-08 15:53:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 9699328. Throughput: 0: 1744.3, 1: 1727.2. Samples: 2438998. Policy #0 lag: (min: 0.0, avg: 25.2, max: 32.0) +[2023-10-08 15:53:13,803][19739] Avg episode reward: [(0, '20.430'), (1, '25.510')] +[2023-10-08 15:53:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000004768_4882432.pth... +[2023-10-08 15:53:13,846][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000003136_3211264.pth +[2023-10-08 15:53:14,078][21194] Updated weights for policy 1, policy_version 4730 (0.0010) +[2023-10-08 15:53:14,304][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000004736_4849664.pth... +[2023-10-08 15:53:14,342][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000003104_3178496.pth +[2023-10-08 15:53:14,795][21195] Updated weights for policy 0, policy_version 4770 (0.0009) +[2023-10-08 15:53:15,175][21195] Updated weights for policy 0, policy_version 4780 (0.0008) +[2023-10-08 15:53:15,548][21195] Updated weights for policy 0, policy_version 4790 (0.0010) +[2023-10-08 15:53:15,921][21195] Updated weights for policy 0, policy_version 4800 (0.0008) +[2023-10-08 15:53:17,924][21194] Updated weights for policy 1, policy_version 4740 (0.0008) +[2023-10-08 15:53:18,294][21194] Updated weights for policy 1, policy_version 4750 (0.0009) +[2023-10-08 15:53:18,654][21194] Updated weights for policy 1, policy_version 4760 (0.0010) +[2023-10-08 15:53:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 9764864. Throughput: 0: 1763.5, 1: 1721.7. Samples: 2454556. Policy #0 lag: (min: 0.0, avg: 25.2, max: 32.0) +[2023-10-08 15:53:18,803][19739] Avg episode reward: [(0, '22.010'), (1, '28.250')] +[2023-10-08 15:53:18,949][20836] Saving new best policy, reward=28.250! +[2023-10-08 15:53:19,889][21195] Updated weights for policy 0, policy_version 4810 (0.0008) +[2023-10-08 15:53:20,269][21195] Updated weights for policy 0, policy_version 4820 (0.0009) +[2023-10-08 15:53:20,642][21195] Updated weights for policy 0, policy_version 4830 (0.0010) +[2023-10-08 15:53:22,684][21194] Updated weights for policy 1, policy_version 4770 (0.0010) +[2023-10-08 15:53:23,054][21194] Updated weights for policy 1, policy_version 4780 (0.0008) +[2023-10-08 15:53:23,432][21194] Updated weights for policy 1, policy_version 4790 (0.0009) +[2023-10-08 15:53:23,797][21194] Updated weights for policy 1, policy_version 4800 (0.0008) +[2023-10-08 15:53:23,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 9863168. Throughput: 0: 1734.6, 1: 1735.3. Samples: 2470010. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:53:23,803][19739] Avg episode reward: [(0, '22.650'), (1, '28.700')] +[2023-10-08 15:53:23,804][20836] Saving new best policy, reward=28.700! +[2023-10-08 15:53:24,540][21195] Updated weights for policy 0, policy_version 4840 (0.0007) +[2023-10-08 15:53:24,920][21195] Updated weights for policy 0, policy_version 4850 (0.0010) +[2023-10-08 15:53:25,283][21195] Updated weights for policy 0, policy_version 4860 (0.0010) +[2023-10-08 15:53:27,809][21194] Updated weights for policy 1, policy_version 4810 (0.0009) +[2023-10-08 15:53:28,184][21194] Updated weights for policy 1, policy_version 4820 (0.0010) +[2023-10-08 15:53:28,562][21194] Updated weights for policy 1, policy_version 4830 (0.0011) +[2023-10-08 15:53:28,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 9928704. Throughput: 0: 1750.0, 1: 1719.8. Samples: 2490588. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:53:28,803][19739] Avg episode reward: [(0, '20.080'), (1, '29.350')] +[2023-10-08 15:53:28,811][20836] Saving new best policy, reward=29.350! +[2023-10-08 15:53:29,196][21195] Updated weights for policy 0, policy_version 4870 (0.0009) +[2023-10-08 15:53:29,587][21195] Updated weights for policy 0, policy_version 4880 (0.0007) +[2023-10-08 15:53:29,957][21195] Updated weights for policy 0, policy_version 4890 (0.0007) +[2023-10-08 15:53:32,435][21194] Updated weights for policy 1, policy_version 4840 (0.0008) +[2023-10-08 15:53:32,814][21194] Updated weights for policy 1, policy_version 4850 (0.0008) +[2023-10-08 15:53:33,179][21194] Updated weights for policy 1, policy_version 4860 (0.0008) +[2023-10-08 15:53:33,722][21195] Updated weights for policy 0, policy_version 4900 (0.0009) +[2023-10-08 15:53:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 9994240. Throughput: 0: 1759.5, 1: 1735.0. Samples: 2506500. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:53:33,803][19739] Avg episode reward: [(0, '19.550'), (1, '29.870')] +[2023-10-08 15:53:33,804][20836] Saving new best policy, reward=29.870! +[2023-10-08 15:53:34,089][21195] Updated weights for policy 0, policy_version 4910 (0.0011) +[2023-10-08 15:53:34,459][21195] Updated weights for policy 0, policy_version 4920 (0.0011) +[2023-10-08 15:53:37,131][21194] Updated weights for policy 1, policy_version 4870 (0.0010) +[2023-10-08 15:53:37,507][21194] Updated weights for policy 1, policy_version 4880 (0.0009) +[2023-10-08 15:53:37,885][21194] Updated weights for policy 1, policy_version 4890 (0.0009) +[2023-10-08 15:53:38,367][21195] Updated weights for policy 0, policy_version 4930 (0.0011) +[2023-10-08 15:53:38,738][21195] Updated weights for policy 0, policy_version 4940 (0.0007) +[2023-10-08 15:53:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10059776. Throughput: 0: 1740.1, 1: 1730.3. Samples: 2522108. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:53:38,803][19739] Avg episode reward: [(0, '20.280'), (1, '31.040')] +[2023-10-08 15:53:38,804][20836] Saving new best policy, reward=31.040! +[2023-10-08 15:53:39,119][21195] Updated weights for policy 0, policy_version 4950 (0.0008) +[2023-10-08 15:53:39,481][21195] Updated weights for policy 0, policy_version 4960 (0.0007) +[2023-10-08 15:53:41,719][21194] Updated weights for policy 1, policy_version 4900 (0.0007) +[2023-10-08 15:53:42,094][21194] Updated weights for policy 1, policy_version 4910 (0.0007) +[2023-10-08 15:53:42,469][21194] Updated weights for policy 1, policy_version 4920 (0.0009) +[2023-10-08 15:53:43,403][21195] Updated weights for policy 0, policy_version 4970 (0.0008) +[2023-10-08 15:53:43,770][21195] Updated weights for policy 0, policy_version 4980 (0.0010) +[2023-10-08 15:53:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10125312. Throughput: 0: 1764.5, 1: 1702.5. Samples: 2542412. Policy #0 lag: (min: 5.0, avg: 8.5, max: 37.0) +[2023-10-08 15:53:43,803][19739] Avg episode reward: [(0, '19.390'), (1, '34.150')] +[2023-10-08 15:53:43,814][20836] Saving new best policy, reward=34.150! +[2023-10-08 15:53:44,148][21195] Updated weights for policy 0, policy_version 4990 (0.0011) +[2023-10-08 15:53:46,304][21194] Updated weights for policy 1, policy_version 4930 (0.0008) +[2023-10-08 15:53:46,660][21194] Updated weights for policy 1, policy_version 4940 (0.0011) +[2023-10-08 15:53:47,032][21194] Updated weights for policy 1, policy_version 4950 (0.0007) +[2023-10-08 15:53:47,397][21194] Updated weights for policy 1, policy_version 4960 (0.0007) +[2023-10-08 15:53:48,118][21195] Updated weights for policy 0, policy_version 5000 (0.0009) +[2023-10-08 15:53:48,501][21195] Updated weights for policy 0, policy_version 5010 (0.0008) +[2023-10-08 15:53:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 10190848. Throughput: 0: 1730.7, 1: 1735.5. Samples: 2558042. Policy #0 lag: (min: 5.0, avg: 8.5, max: 37.0) +[2023-10-08 15:53:48,803][19739] Avg episode reward: [(0, '17.770'), (1, '34.420')] +[2023-10-08 15:53:48,804][20836] Saving new best policy, reward=34.420! +[2023-10-08 15:53:48,869][21195] Updated weights for policy 0, policy_version 5020 (0.0010) +[2023-10-08 15:53:51,510][21194] Updated weights for policy 1, policy_version 4970 (0.0008) +[2023-10-08 15:53:51,885][21194] Updated weights for policy 1, policy_version 4980 (0.0008) +[2023-10-08 15:53:52,248][21194] Updated weights for policy 1, policy_version 4990 (0.0008) +[2023-10-08 15:53:52,783][21195] Updated weights for policy 0, policy_version 5030 (0.0008) +[2023-10-08 15:53:53,159][21195] Updated weights for policy 0, policy_version 5040 (0.0007) +[2023-10-08 15:53:53,524][21195] Updated weights for policy 0, policy_version 5050 (0.0008) +[2023-10-08 15:53:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 10289152. Throughput: 0: 1751.3, 1: 1709.3. Samples: 2573300. Policy #0 lag: (min: 22.0, avg: 29.0, max: 54.0) +[2023-10-08 15:53:53,803][19739] Avg episode reward: [(0, '19.980'), (1, '32.580')] +[2023-10-08 15:53:56,314][21194] Updated weights for policy 1, policy_version 5000 (0.0008) +[2023-10-08 15:53:56,680][21194] Updated weights for policy 1, policy_version 5010 (0.0008) +[2023-10-08 15:53:57,051][21194] Updated weights for policy 1, policy_version 5020 (0.0009) +[2023-10-08 15:53:57,309][21195] Updated weights for policy 0, policy_version 5060 (0.0008) +[2023-10-08 15:53:57,675][21195] Updated weights for policy 0, policy_version 5070 (0.0008) +[2023-10-08 15:53:58,042][21195] Updated weights for policy 0, policy_version 5080 (0.0011) +[2023-10-08 15:53:58,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 10354688. Throughput: 0: 1737.2, 1: 1700.3. Samples: 2593686. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:53:58,803][19739] Avg episode reward: [(0, '20.980'), (1, '32.420')] +[2023-10-08 15:54:01,059][21194] Updated weights for policy 1, policy_version 5030 (0.0008) +[2023-10-08 15:54:01,438][21194] Updated weights for policy 1, policy_version 5040 (0.0008) +[2023-10-08 15:54:01,801][21194] Updated weights for policy 1, policy_version 5050 (0.0008) +[2023-10-08 15:54:01,931][21195] Updated weights for policy 0, policy_version 5090 (0.0011) +[2023-10-08 15:54:02,309][21195] Updated weights for policy 0, policy_version 5100 (0.0009) +[2023-10-08 15:54:02,680][21195] Updated weights for policy 0, policy_version 5110 (0.0008) +[2023-10-08 15:54:03,044][21195] Updated weights for policy 0, policy_version 5120 (0.0008) +[2023-10-08 15:54:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 10420224. Throughput: 0: 1720.9, 1: 1720.9. Samples: 2609440. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:54:03,804][19739] Avg episode reward: [(0, '19.830'), (1, '33.190')] +[2023-10-08 15:54:05,659][21194] Updated weights for policy 1, policy_version 5060 (0.0010) +[2023-10-08 15:54:06,031][21194] Updated weights for policy 1, policy_version 5070 (0.0010) +[2023-10-08 15:54:06,400][21194] Updated weights for policy 1, policy_version 5080 (0.0008) +[2023-10-08 15:54:07,121][21195] Updated weights for policy 0, policy_version 5130 (0.0008) +[2023-10-08 15:54:07,481][21195] Updated weights for policy 0, policy_version 5140 (0.0010) +[2023-10-08 15:54:07,860][21195] Updated weights for policy 0, policy_version 5150 (0.0010) +[2023-10-08 15:54:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 10485760. Throughput: 0: 1750.2, 1: 1696.1. Samples: 2625094. Policy #0 lag: (min: 0.0, avg: 25.4, max: 32.0) +[2023-10-08 15:54:08,803][19739] Avg episode reward: [(0, '21.090'), (1, '33.630')] +[2023-10-08 15:54:10,485][21194] Updated weights for policy 1, policy_version 5090 (0.0008) +[2023-10-08 15:54:10,853][21194] Updated weights for policy 1, policy_version 5100 (0.0007) +[2023-10-08 15:54:11,218][21194] Updated weights for policy 1, policy_version 5110 (0.0010) +[2023-10-08 15:54:11,588][21194] Updated weights for policy 1, policy_version 5120 (0.0008) +[2023-10-08 15:54:11,804][21195] Updated weights for policy 0, policy_version 5160 (0.0009) +[2023-10-08 15:54:12,168][21195] Updated weights for policy 0, policy_version 5170 (0.0011) +[2023-10-08 15:54:12,544][21195] Updated weights for policy 0, policy_version 5180 (0.0011) +[2023-10-08 15:54:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 10551296. Throughput: 0: 1720.0, 1: 1715.9. Samples: 2645204. Policy #0 lag: (min: 0.0, avg: 25.4, max: 32.0) +[2023-10-08 15:54:13,803][19739] Avg episode reward: [(0, '22.310'), (1, '35.240')] +[2023-10-08 15:54:13,809][20836] Saving new best policy, reward=35.240! +[2023-10-08 15:54:15,714][21194] Updated weights for policy 1, policy_version 5130 (0.0010) +[2023-10-08 15:54:16,081][21194] Updated weights for policy 1, policy_version 5140 (0.0007) +[2023-10-08 15:54:16,443][21194] Updated weights for policy 1, policy_version 5150 (0.0007) +[2023-10-08 15:54:16,707][21195] Updated weights for policy 0, policy_version 5190 (0.0009) +[2023-10-08 15:54:17,080][21195] Updated weights for policy 0, policy_version 5200 (0.0009) +[2023-10-08 15:54:17,446][21195] Updated weights for policy 0, policy_version 5210 (0.0010) +[2023-10-08 15:54:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 10616832. Throughput: 0: 1712.8, 1: 1713.0. Samples: 2660662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:54:18,803][19739] Avg episode reward: [(0, '25.430'), (1, '35.180')] +[2023-10-08 15:54:20,192][21194] Updated weights for policy 1, policy_version 5160 (0.0007) +[2023-10-08 15:54:20,560][21194] Updated weights for policy 1, policy_version 5170 (0.0011) +[2023-10-08 15:54:20,937][21194] Updated weights for policy 1, policy_version 5180 (0.0007) +[2023-10-08 15:54:21,203][21195] Updated weights for policy 0, policy_version 5220 (0.0008) +[2023-10-08 15:54:21,574][21195] Updated weights for policy 0, policy_version 5230 (0.0008) +[2023-10-08 15:54:21,950][21195] Updated weights for policy 0, policy_version 5240 (0.0009) +[2023-10-08 15:54:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10682368. Throughput: 0: 1722.4, 1: 1702.3. Samples: 2676218. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:54:23,803][19739] Avg episode reward: [(0, '25.950'), (1, '35.680')] +[2023-10-08 15:54:23,805][20836] Saving new best policy, reward=35.680! +[2023-10-08 15:54:24,915][21194] Updated weights for policy 1, policy_version 5190 (0.0010) +[2023-10-08 15:54:25,287][21194] Updated weights for policy 1, policy_version 5200 (0.0010) +[2023-10-08 15:54:25,650][21194] Updated weights for policy 1, policy_version 5210 (0.0009) +[2023-10-08 15:54:25,904][21195] Updated weights for policy 0, policy_version 5250 (0.0007) +[2023-10-08 15:54:26,283][21195] Updated weights for policy 0, policy_version 5260 (0.0007) +[2023-10-08 15:54:26,646][21195] Updated weights for policy 0, policy_version 5270 (0.0010) +[2023-10-08 15:54:27,022][21195] Updated weights for policy 0, policy_version 5280 (0.0007) +[2023-10-08 15:54:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10747904. Throughput: 0: 1708.8, 1: 1727.6. Samples: 2697052. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 15:54:28,803][19739] Avg episode reward: [(0, '25.810'), (1, '35.100')] +[2023-10-08 15:54:29,721][21194] Updated weights for policy 1, policy_version 5220 (0.0010) +[2023-10-08 15:54:30,080][21194] Updated weights for policy 1, policy_version 5230 (0.0009) +[2023-10-08 15:54:30,448][21194] Updated weights for policy 1, policy_version 5240 (0.0009) +[2023-10-08 15:54:30,958][21195] Updated weights for policy 0, policy_version 5290 (0.0007) +[2023-10-08 15:54:31,336][21195] Updated weights for policy 0, policy_version 5300 (0.0008) +[2023-10-08 15:54:31,700][21195] Updated weights for policy 0, policy_version 5310 (0.0008) +[2023-10-08 15:54:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10813440. Throughput: 0: 1734.8, 1: 1693.8. Samples: 2712332. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 15:54:33,803][19739] Avg episode reward: [(0, '27.280'), (1, '40.370')] +[2023-10-08 15:54:33,804][20740] Saving new best policy, reward=27.280! +[2023-10-08 15:54:33,804][20836] Saving new best policy, reward=40.370! +[2023-10-08 15:54:34,346][21194] Updated weights for policy 1, policy_version 5250 (0.0010) +[2023-10-08 15:54:34,723][21194] Updated weights for policy 1, policy_version 5260 (0.0009) +[2023-10-08 15:54:35,093][21194] Updated weights for policy 1, policy_version 5270 (0.0011) +[2023-10-08 15:54:35,467][21194] Updated weights for policy 1, policy_version 5280 (0.0010) +[2023-10-08 15:54:35,797][21195] Updated weights for policy 0, policy_version 5320 (0.0010) +[2023-10-08 15:54:36,173][21195] Updated weights for policy 0, policy_version 5330 (0.0008) +[2023-10-08 15:54:36,553][21195] Updated weights for policy 0, policy_version 5340 (0.0008) +[2023-10-08 15:54:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10878976. Throughput: 0: 1713.0, 1: 1719.9. Samples: 2727782. Policy #0 lag: (min: 19.0, avg: 31.8, max: 51.0) +[2023-10-08 15:54:38,803][19739] Avg episode reward: [(0, '31.040'), (1, '42.880')] +[2023-10-08 15:54:38,804][20740] Saving new best policy, reward=31.040! +[2023-10-08 15:54:38,804][20836] Saving new best policy, reward=42.880! +[2023-10-08 15:54:39,466][21194] Updated weights for policy 1, policy_version 5290 (0.0008) +[2023-10-08 15:54:39,836][21194] Updated weights for policy 1, policy_version 5300 (0.0008) +[2023-10-08 15:54:40,212][21194] Updated weights for policy 1, policy_version 5310 (0.0007) +[2023-10-08 15:54:40,467][21195] Updated weights for policy 0, policy_version 5350 (0.0009) +[2023-10-08 15:54:40,841][21195] Updated weights for policy 0, policy_version 5360 (0.0008) +[2023-10-08 15:54:41,214][21195] Updated weights for policy 0, policy_version 5370 (0.0007) +[2023-10-08 15:54:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 10944512. Throughput: 0: 1721.6, 1: 1733.5. Samples: 2749168. Policy #0 lag: (min: 19.0, avg: 31.8, max: 51.0) +[2023-10-08 15:54:43,804][19739] Avg episode reward: [(0, '30.500'), (1, '42.740')] +[2023-10-08 15:54:44,201][21194] Updated weights for policy 1, policy_version 5320 (0.0008) +[2023-10-08 15:54:44,567][21194] Updated weights for policy 1, policy_version 5330 (0.0007) +[2023-10-08 15:54:44,948][21194] Updated weights for policy 1, policy_version 5340 (0.0007) +[2023-10-08 15:54:45,196][21195] Updated weights for policy 0, policy_version 5380 (0.0011) +[2023-10-08 15:54:45,560][21195] Updated weights for policy 0, policy_version 5390 (0.0010) +[2023-10-08 15:54:45,933][21195] Updated weights for policy 0, policy_version 5400 (0.0008) +[2023-10-08 15:54:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 11010048. Throughput: 0: 1732.3, 1: 1708.0. Samples: 2764252. Policy #0 lag: (min: 3.0, avg: 5.4, max: 31.0) +[2023-10-08 15:54:48,803][19739] Avg episode reward: [(0, '37.940'), (1, '45.700')] +[2023-10-08 15:54:48,804][20740] Saving new best policy, reward=37.940! +[2023-10-08 15:54:48,980][21194] Updated weights for policy 1, policy_version 5350 (0.0008) +[2023-10-08 15:54:49,352][21194] Updated weights for policy 1, policy_version 5360 (0.0008) +[2023-10-08 15:54:49,723][21194] Updated weights for policy 1, policy_version 5370 (0.0007) +[2023-10-08 15:54:49,942][20836] Saving new best policy, reward=45.700! +[2023-10-08 15:54:49,989][21195] Updated weights for policy 0, policy_version 5410 (0.0008) +[2023-10-08 15:54:50,359][21195] Updated weights for policy 0, policy_version 5420 (0.0010) +[2023-10-08 15:54:50,728][21195] Updated weights for policy 0, policy_version 5430 (0.0010) +[2023-10-08 15:54:51,100][21195] Updated weights for policy 0, policy_version 5440 (0.0011) +[2023-10-08 15:54:53,707][21194] Updated weights for policy 1, policy_version 5380 (0.0008) +[2023-10-08 15:54:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13884.7). Total num frames: 11075584. Throughput: 0: 1701.8, 1: 1727.6. Samples: 2779416. Policy #0 lag: (min: 3.0, avg: 5.4, max: 31.0) +[2023-10-08 15:54:53,803][19739] Avg episode reward: [(0, '37.890'), (1, '48.530')] +[2023-10-08 15:54:54,078][21194] Updated weights for policy 1, policy_version 5390 (0.0007) +[2023-10-08 15:54:54,438][21194] Updated weights for policy 1, policy_version 5400 (0.0009) +[2023-10-08 15:54:54,728][20836] Saving new best policy, reward=48.530! +[2023-10-08 15:54:54,842][21195] Updated weights for policy 0, policy_version 5450 (0.0008) +[2023-10-08 15:54:55,223][21195] Updated weights for policy 0, policy_version 5460 (0.0008) +[2023-10-08 15:54:55,593][21195] Updated weights for policy 0, policy_version 5470 (0.0009) +[2023-10-08 15:54:58,343][21194] Updated weights for policy 1, policy_version 5410 (0.0009) +[2023-10-08 15:54:58,707][21194] Updated weights for policy 1, policy_version 5420 (0.0007) +[2023-10-08 15:54:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 11141120. Throughput: 0: 1730.0, 1: 1727.6. Samples: 2800796. Policy #0 lag: (min: 31.0, avg: 38.4, max: 63.0) +[2023-10-08 15:54:58,803][19739] Avg episode reward: [(0, '38.760'), (1, '49.990')] +[2023-10-08 15:54:58,810][20740] Saving new best policy, reward=38.760! +[2023-10-08 15:54:59,084][21194] Updated weights for policy 1, policy_version 5430 (0.0007) +[2023-10-08 15:54:59,403][21195] Updated weights for policy 0, policy_version 5480 (0.0008) +[2023-10-08 15:54:59,439][20836] Saving new best policy, reward=49.990! +[2023-10-08 15:54:59,442][21194] Updated weights for policy 1, policy_version 5440 (0.0009) +[2023-10-08 15:54:59,773][21195] Updated weights for policy 0, policy_version 5490 (0.0008) +[2023-10-08 15:55:00,149][21195] Updated weights for policy 0, policy_version 5500 (0.0007) +[2023-10-08 15:55:03,507][21194] Updated weights for policy 1, policy_version 5450 (0.0011) +[2023-10-08 15:55:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 11206656. Throughput: 0: 1734.0, 1: 1717.4. Samples: 2815974. Policy #0 lag: (min: 31.0, avg: 38.4, max: 63.0) +[2023-10-08 15:55:03,803][19739] Avg episode reward: [(0, '37.200'), (1, '47.320')] +[2023-10-08 15:55:03,876][21194] Updated weights for policy 1, policy_version 5460 (0.0010) +[2023-10-08 15:55:04,256][21194] Updated weights for policy 1, policy_version 5470 (0.0011) +[2023-10-08 15:55:04,405][21195] Updated weights for policy 0, policy_version 5510 (0.0008) +[2023-10-08 15:55:04,790][21195] Updated weights for policy 0, policy_version 5520 (0.0007) +[2023-10-08 15:55:05,161][21195] Updated weights for policy 0, policy_version 5530 (0.0008) +[2023-10-08 15:55:08,070][21194] Updated weights for policy 1, policy_version 5480 (0.0009) +[2023-10-08 15:55:08,443][21194] Updated weights for policy 1, policy_version 5490 (0.0007) +[2023-10-08 15:55:08,802][21194] Updated weights for policy 1, policy_version 5500 (0.0009) +[2023-10-08 15:55:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 11272192. Throughput: 0: 1715.9, 1: 1724.7. Samples: 2831046. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 15:55:08,803][19739] Avg episode reward: [(0, '39.000'), (1, '48.990')] +[2023-10-08 15:55:08,804][20740] Saving new best policy, reward=39.000! +[2023-10-08 15:55:09,172][21195] Updated weights for policy 0, policy_version 5540 (0.0008) +[2023-10-08 15:55:09,538][21195] Updated weights for policy 0, policy_version 5550 (0.0009) +[2023-10-08 15:55:09,916][21195] Updated weights for policy 0, policy_version 5560 (0.0010) +[2023-10-08 15:55:12,716][21194] Updated weights for policy 1, policy_version 5510 (0.0008) +[2023-10-08 15:55:13,077][21194] Updated weights for policy 1, policy_version 5520 (0.0007) +[2023-10-08 15:55:13,452][21194] Updated weights for policy 1, policy_version 5530 (0.0007) +[2023-10-08 15:55:13,803][19739] Fps is (10 sec: 16383.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 11370496. Throughput: 0: 1725.6, 1: 1716.6. Samples: 2851952. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 15:55:13,804][19739] Avg episode reward: [(0, '42.430'), (1, '49.400')] +[2023-10-08 15:55:13,815][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000005536_5668864.pth... +[2023-10-08 15:55:13,845][21195] Updated weights for policy 0, policy_version 5570 (0.0010) +[2023-10-08 15:55:13,847][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000003936_4030464.pth +[2023-10-08 15:55:14,223][21195] Updated weights for policy 0, policy_version 5580 (0.0010) +[2023-10-08 15:55:14,582][21195] Updated weights for policy 0, policy_version 5590 (0.0008) +[2023-10-08 15:55:14,952][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000005600_5734400.pth... +[2023-10-08 15:55:14,953][21195] Updated weights for policy 0, policy_version 5600 (0.0007) +[2023-10-08 15:55:14,991][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000003936_4030464.pth +[2023-10-08 15:55:14,996][20740] Saving new best policy, reward=42.430! +[2023-10-08 15:55:17,410][21194] Updated weights for policy 1, policy_version 5540 (0.0008) +[2023-10-08 15:55:17,777][21194] Updated weights for policy 1, policy_version 5550 (0.0008) +[2023-10-08 15:55:18,152][21194] Updated weights for policy 1, policy_version 5560 (0.0009) +[2023-10-08 15:55:18,734][21195] Updated weights for policy 0, policy_version 5610 (0.0010) +[2023-10-08 15:55:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 11436032. Throughput: 0: 1720.9, 1: 1731.6. Samples: 2867692. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:55:18,803][19739] Avg episode reward: [(0, '42.650'), (1, '52.820')] +[2023-10-08 15:55:18,804][20836] Saving new best policy, reward=52.820! +[2023-10-08 15:55:19,102][21195] Updated weights for policy 0, policy_version 5620 (0.0011) +[2023-10-08 15:55:19,472][21195] Updated weights for policy 0, policy_version 5630 (0.0009) +[2023-10-08 15:55:19,544][20740] Saving new best policy, reward=42.650! +[2023-10-08 15:55:22,163][21194] Updated weights for policy 1, policy_version 5570 (0.0008) +[2023-10-08 15:55:22,537][21194] Updated weights for policy 1, policy_version 5580 (0.0008) +[2023-10-08 15:55:22,896][21194] Updated weights for policy 1, policy_version 5590 (0.0008) +[2023-10-08 15:55:23,258][21194] Updated weights for policy 1, policy_version 5600 (0.0007) +[2023-10-08 15:55:23,314][21195] Updated weights for policy 0, policy_version 5640 (0.0009) +[2023-10-08 15:55:23,685][21195] Updated weights for policy 0, policy_version 5650 (0.0007) +[2023-10-08 15:55:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 11501568. Throughput: 0: 1727.2, 1: 1730.1. Samples: 2883360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:55:23,804][19739] Avg episode reward: [(0, '41.320'), (1, '53.320')] +[2023-10-08 15:55:23,805][20836] Saving new best policy, reward=53.320! +[2023-10-08 15:55:24,057][21195] Updated weights for policy 0, policy_version 5660 (0.0007) +[2023-10-08 15:55:27,211][21194] Updated weights for policy 1, policy_version 5610 (0.0008) +[2023-10-08 15:55:27,585][21194] Updated weights for policy 1, policy_version 5620 (0.0008) +[2023-10-08 15:55:27,953][21194] Updated weights for policy 1, policy_version 5630 (0.0008) +[2023-10-08 15:55:28,073][21195] Updated weights for policy 0, policy_version 5670 (0.0008) +[2023-10-08 15:55:28,448][21195] Updated weights for policy 0, policy_version 5680 (0.0008) +[2023-10-08 15:55:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 11567104. Throughput: 0: 1733.4, 1: 1694.6. Samples: 2903428. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:55:28,803][19739] Avg episode reward: [(0, '41.100'), (1, '52.170')] +[2023-10-08 15:55:28,815][21195] Updated weights for policy 0, policy_version 5690 (0.0008) +[2023-10-08 15:55:31,732][21194] Updated weights for policy 1, policy_version 5640 (0.0008) +[2023-10-08 15:55:32,105][21194] Updated weights for policy 1, policy_version 5650 (0.0009) +[2023-10-08 15:55:32,466][21194] Updated weights for policy 1, policy_version 5660 (0.0008) +[2023-10-08 15:55:32,700][21195] Updated weights for policy 0, policy_version 5700 (0.0010) +[2023-10-08 15:55:33,062][21195] Updated weights for policy 0, policy_version 5710 (0.0008) +[2023-10-08 15:55:33,432][21195] Updated weights for policy 0, policy_version 5720 (0.0010) +[2023-10-08 15:55:33,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 11665408. Throughput: 0: 1707.0, 1: 1726.8. Samples: 2918770. Policy #0 lag: (min: 1.0, avg: 17.5, max: 33.0) +[2023-10-08 15:55:33,803][19739] Avg episode reward: [(0, '42.770'), (1, '53.770')] +[2023-10-08 15:55:33,804][20740] Saving new best policy, reward=42.770! +[2023-10-08 15:55:33,804][20836] Saving new best policy, reward=53.770! +[2023-10-08 15:55:36,570][21194] Updated weights for policy 1, policy_version 5670 (0.0008) +[2023-10-08 15:55:36,948][21194] Updated weights for policy 1, policy_version 5680 (0.0009) +[2023-10-08 15:55:37,314][21194] Updated weights for policy 1, policy_version 5690 (0.0010) +[2023-10-08 15:55:37,334][21195] Updated weights for policy 0, policy_version 5730 (0.0008) +[2023-10-08 15:55:37,714][21195] Updated weights for policy 0, policy_version 5740 (0.0009) +[2023-10-08 15:55:38,076][21195] Updated weights for policy 0, policy_version 5750 (0.0009) +[2023-10-08 15:55:38,448][21195] Updated weights for policy 0, policy_version 5760 (0.0009) +[2023-10-08 15:55:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 11730944. Throughput: 0: 1738.7, 1: 1718.0. Samples: 2934966. Policy #0 lag: (min: 1.0, avg: 17.5, max: 33.0) +[2023-10-08 15:55:38,803][19739] Avg episode reward: [(0, '39.150'), (1, '52.060')] +[2023-10-08 15:55:41,182][21194] Updated weights for policy 1, policy_version 5700 (0.0008) +[2023-10-08 15:55:41,545][21194] Updated weights for policy 1, policy_version 5710 (0.0010) +[2023-10-08 15:55:41,918][21194] Updated weights for policy 1, policy_version 5720 (0.0008) +[2023-10-08 15:55:42,448][21195] Updated weights for policy 0, policy_version 5770 (0.0010) +[2023-10-08 15:55:42,814][21195] Updated weights for policy 0, policy_version 5780 (0.0008) +[2023-10-08 15:55:43,182][21195] Updated weights for policy 0, policy_version 5790 (0.0008) +[2023-10-08 15:55:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 11796480. Throughput: 0: 1723.3, 1: 1705.9. Samples: 2955110. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:55:43,803][19739] Avg episode reward: [(0, '38.520'), (1, '52.060')] +[2023-10-08 15:55:45,794][21194] Updated weights for policy 1, policy_version 5730 (0.0009) +[2023-10-08 15:55:46,164][21194] Updated weights for policy 1, policy_version 5740 (0.0009) +[2023-10-08 15:55:46,538][21194] Updated weights for policy 1, policy_version 5750 (0.0009) +[2023-10-08 15:55:46,902][21194] Updated weights for policy 1, policy_version 5760 (0.0007) +[2023-10-08 15:55:47,013][21195] Updated weights for policy 0, policy_version 5800 (0.0008) +[2023-10-08 15:55:47,385][21195] Updated weights for policy 0, policy_version 5810 (0.0009) +[2023-10-08 15:55:47,751][21195] Updated weights for policy 0, policy_version 5820 (0.0008) +[2023-10-08 15:55:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 11862016. Throughput: 0: 1714.9, 1: 1728.8. Samples: 2970944. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:55:48,804][19739] Avg episode reward: [(0, '38.390'), (1, '51.440')] +[2023-10-08 15:55:50,916][21194] Updated weights for policy 1, policy_version 5770 (0.0012) +[2023-10-08 15:55:51,288][21194] Updated weights for policy 1, policy_version 5780 (0.0009) +[2023-10-08 15:55:51,655][21194] Updated weights for policy 1, policy_version 5790 (0.0009) +[2023-10-08 15:55:51,870][21195] Updated weights for policy 0, policy_version 5830 (0.0008) +[2023-10-08 15:55:52,250][21195] Updated weights for policy 0, policy_version 5840 (0.0009) +[2023-10-08 15:55:52,625][21195] Updated weights for policy 0, policy_version 5850 (0.0008) +[2023-10-08 15:55:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 11927552. Throughput: 0: 1742.1, 1: 1710.9. Samples: 2986430. Policy #0 lag: (min: 17.0, avg: 25.0, max: 49.0) +[2023-10-08 15:55:53,803][19739] Avg episode reward: [(0, '40.420'), (1, '52.590')] +[2023-10-08 15:55:55,625][21194] Updated weights for policy 1, policy_version 5800 (0.0009) +[2023-10-08 15:55:56,004][21194] Updated weights for policy 1, policy_version 5810 (0.0011) +[2023-10-08 15:55:56,375][21194] Updated weights for policy 1, policy_version 5820 (0.0009) +[2023-10-08 15:55:56,409][21195] Updated weights for policy 0, policy_version 5860 (0.0009) +[2023-10-08 15:55:56,781][21195] Updated weights for policy 0, policy_version 5870 (0.0010) +[2023-10-08 15:55:57,158][21195] Updated weights for policy 0, policy_version 5880 (0.0010) +[2023-10-08 15:55:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 11993088. Throughput: 0: 1719.0, 1: 1725.5. Samples: 3006954. Policy #0 lag: (min: 17.0, avg: 25.0, max: 49.0) +[2023-10-08 15:55:58,803][19739] Avg episode reward: [(0, '40.900'), (1, '51.320')] +[2023-10-08 15:56:00,046][21194] Updated weights for policy 1, policy_version 5830 (0.0008) +[2023-10-08 15:56:00,411][21194] Updated weights for policy 1, policy_version 5840 (0.0008) +[2023-10-08 15:56:00,777][21194] Updated weights for policy 1, policy_version 5850 (0.0009) +[2023-10-08 15:56:01,060][21195] Updated weights for policy 0, policy_version 5890 (0.0009) +[2023-10-08 15:56:01,435][21195] Updated weights for policy 0, policy_version 5900 (0.0009) +[2023-10-08 15:56:01,813][21195] Updated weights for policy 0, policy_version 5910 (0.0009) +[2023-10-08 15:56:02,190][21195] Updated weights for policy 0, policy_version 5920 (0.0008) +[2023-10-08 15:56:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 12058624. Throughput: 0: 1723.2, 1: 1713.4. Samples: 3022340. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 15:56:03,803][19739] Avg episode reward: [(0, '47.170'), (1, '58.220')] +[2023-10-08 15:56:03,804][20740] Saving new best policy, reward=47.170! +[2023-10-08 15:56:03,804][20836] Saving new best policy, reward=58.220! +[2023-10-08 15:56:04,607][21194] Updated weights for policy 1, policy_version 5860 (0.0009) +[2023-10-08 15:56:04,971][21194] Updated weights for policy 1, policy_version 5870 (0.0008) +[2023-10-08 15:56:05,332][21194] Updated weights for policy 1, policy_version 5880 (0.0008) +[2023-10-08 15:56:06,096][21195] Updated weights for policy 0, policy_version 5930 (0.0008) +[2023-10-08 15:56:06,459][21195] Updated weights for policy 0, policy_version 5940 (0.0010) +[2023-10-08 15:56:06,834][21195] Updated weights for policy 0, policy_version 5950 (0.0008) +[2023-10-08 15:56:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 12124160. Throughput: 0: 1718.5, 1: 1720.6. Samples: 3038118. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 15:56:08,803][19739] Avg episode reward: [(0, '46.460'), (1, '58.220')] +[2023-10-08 15:56:09,205][21194] Updated weights for policy 1, policy_version 5890 (0.0009) +[2023-10-08 15:56:09,584][21194] Updated weights for policy 1, policy_version 5900 (0.0009) +[2023-10-08 15:56:09,956][21194] Updated weights for policy 1, policy_version 5910 (0.0007) +[2023-10-08 15:56:10,315][21194] Updated weights for policy 1, policy_version 5920 (0.0008) +[2023-10-08 15:56:10,728][21195] Updated weights for policy 0, policy_version 5960 (0.0009) +[2023-10-08 15:56:11,103][21195] Updated weights for policy 0, policy_version 5970 (0.0007) +[2023-10-08 15:56:11,465][21195] Updated weights for policy 0, policy_version 5980 (0.0007) +[2023-10-08 15:56:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 12189696. Throughput: 0: 1709.8, 1: 1756.6. Samples: 3059416. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:56:13,803][19739] Avg episode reward: [(0, '48.440'), (1, '60.400')] +[2023-10-08 15:56:13,810][20740] Saving new best policy, reward=48.440! +[2023-10-08 15:56:14,247][21194] Updated weights for policy 1, policy_version 5930 (0.0008) +[2023-10-08 15:56:14,629][21194] Updated weights for policy 1, policy_version 5940 (0.0008) +[2023-10-08 15:56:15,000][21194] Updated weights for policy 1, policy_version 5950 (0.0009) +[2023-10-08 15:56:15,065][20836] Saving new best policy, reward=60.400! +[2023-10-08 15:56:15,199][21195] Updated weights for policy 0, policy_version 5990 (0.0007) +[2023-10-08 15:56:15,567][21195] Updated weights for policy 0, policy_version 6000 (0.0009) +[2023-10-08 15:56:15,940][21195] Updated weights for policy 0, policy_version 6010 (0.0010) +[2023-10-08 15:56:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 12255232. Throughput: 0: 1744.3, 1: 1728.5. Samples: 3075046. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:56:18,803][19739] Avg episode reward: [(0, '54.080'), (1, '63.690')] +[2023-10-08 15:56:18,804][20740] Saving new best policy, reward=54.080! +[2023-10-08 15:56:18,997][21194] Updated weights for policy 1, policy_version 5960 (0.0011) +[2023-10-08 15:56:19,365][21194] Updated weights for policy 1, policy_version 5970 (0.0007) +[2023-10-08 15:56:19,730][21194] Updated weights for policy 1, policy_version 5980 (0.0007) +[2023-10-08 15:56:19,868][20836] Saving new best policy, reward=63.690! +[2023-10-08 15:56:19,892][21195] Updated weights for policy 0, policy_version 6020 (0.0007) +[2023-10-08 15:56:20,265][21195] Updated weights for policy 0, policy_version 6030 (0.0010) +[2023-10-08 15:56:20,641][21195] Updated weights for policy 0, policy_version 6040 (0.0011) +[2023-10-08 15:56:23,696][21194] Updated weights for policy 1, policy_version 5990 (0.0009) +[2023-10-08 15:56:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 12320768. Throughput: 0: 1714.0, 1: 1738.9. Samples: 3090348. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:56:23,803][19739] Avg episode reward: [(0, '54.110'), (1, '62.120')] +[2023-10-08 15:56:23,804][20740] Saving new best policy, reward=54.110! +[2023-10-08 15:56:24,060][21194] Updated weights for policy 1, policy_version 6000 (0.0011) +[2023-10-08 15:56:24,431][21194] Updated weights for policy 1, policy_version 6010 (0.0009) +[2023-10-08 15:56:24,606][21195] Updated weights for policy 0, policy_version 6050 (0.0010) +[2023-10-08 15:56:24,975][21195] Updated weights for policy 0, policy_version 6060 (0.0009) +[2023-10-08 15:56:25,346][21195] Updated weights for policy 0, policy_version 6070 (0.0010) +[2023-10-08 15:56:25,712][21195] Updated weights for policy 0, policy_version 6080 (0.0008) +[2023-10-08 15:56:28,343][21194] Updated weights for policy 1, policy_version 6020 (0.0007) +[2023-10-08 15:56:28,709][21194] Updated weights for policy 1, policy_version 6030 (0.0009) +[2023-10-08 15:56:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 12386304. Throughput: 0: 1725.2, 1: 1753.2. Samples: 3111642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:56:28,803][19739] Avg episode reward: [(0, '61.040'), (1, '61.350')] +[2023-10-08 15:56:28,812][20740] Saving new best policy, reward=61.040! +[2023-10-08 15:56:29,075][21194] Updated weights for policy 1, policy_version 6040 (0.0008) +[2023-10-08 15:56:29,764][21195] Updated weights for policy 0, policy_version 6090 (0.0007) +[2023-10-08 15:56:30,136][21195] Updated weights for policy 0, policy_version 6100 (0.0009) +[2023-10-08 15:56:30,511][21195] Updated weights for policy 0, policy_version 6110 (0.0012) +[2023-10-08 15:56:32,872][21194] Updated weights for policy 1, policy_version 6050 (0.0007) +[2023-10-08 15:56:33,245][21194] Updated weights for policy 1, policy_version 6060 (0.0007) +[2023-10-08 15:56:33,613][21194] Updated weights for policy 1, policy_version 6070 (0.0007) +[2023-10-08 15:56:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 12451840. Throughput: 0: 1737.1, 1: 1732.5. Samples: 3127074. Policy #0 lag: (min: 24.0, avg: 50.7, max: 56.0) +[2023-10-08 15:56:33,804][19739] Avg episode reward: [(0, '63.310'), (1, '62.880')] +[2023-10-08 15:56:33,805][20740] Saving new best policy, reward=63.310! +[2023-10-08 15:56:33,977][21194] Updated weights for policy 1, policy_version 6080 (0.0010) +[2023-10-08 15:56:34,346][21195] Updated weights for policy 0, policy_version 6120 (0.0011) +[2023-10-08 15:56:34,725][21195] Updated weights for policy 0, policy_version 6130 (0.0009) +[2023-10-08 15:56:35,103][21195] Updated weights for policy 0, policy_version 6140 (0.0009) +[2023-10-08 15:56:37,857][21194] Updated weights for policy 1, policy_version 6090 (0.0008) +[2023-10-08 15:56:38,227][21194] Updated weights for policy 1, policy_version 6100 (0.0007) +[2023-10-08 15:56:38,590][21194] Updated weights for policy 1, policy_version 6110 (0.0008) +[2023-10-08 15:56:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 12550144. Throughput: 0: 1712.9, 1: 1760.0. Samples: 3142712. Policy #0 lag: (min: 24.0, avg: 50.7, max: 56.0) +[2023-10-08 15:56:38,803][19739] Avg episode reward: [(0, '65.800'), (1, '65.140')] +[2023-10-08 15:56:38,804][20740] Saving new best policy, reward=65.800! +[2023-10-08 15:56:38,804][20836] Saving new best policy, reward=65.140! +[2023-10-08 15:56:39,149][21195] Updated weights for policy 0, policy_version 6150 (0.0009) +[2023-10-08 15:56:39,519][21195] Updated weights for policy 0, policy_version 6160 (0.0007) +[2023-10-08 15:56:39,891][21195] Updated weights for policy 0, policy_version 6170 (0.0007) +[2023-10-08 15:56:42,584][21194] Updated weights for policy 1, policy_version 6120 (0.0009) +[2023-10-08 15:56:42,959][21194] Updated weights for policy 1, policy_version 6130 (0.0010) +[2023-10-08 15:56:43,331][21194] Updated weights for policy 1, policy_version 6140 (0.0008) +[2023-10-08 15:56:43,802][19739] Fps is (10 sec: 16384.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 12615680. Throughput: 0: 1738.0, 1: 1735.6. Samples: 3163264. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:56:43,803][19739] Avg episode reward: [(0, '66.090'), (1, '68.430')] +[2023-10-08 15:56:43,809][20836] Saving new best policy, reward=68.430! +[2023-10-08 15:56:43,840][21195] Updated weights for policy 0, policy_version 6180 (0.0010) +[2023-10-08 15:56:44,219][21195] Updated weights for policy 0, policy_version 6190 (0.0007) +[2023-10-08 15:56:44,584][21195] Updated weights for policy 0, policy_version 6200 (0.0007) +[2023-10-08 15:56:44,883][20740] Saving new best policy, reward=66.090! +[2023-10-08 15:56:47,095][21194] Updated weights for policy 1, policy_version 6150 (0.0009) +[2023-10-08 15:56:47,462][21194] Updated weights for policy 1, policy_version 6160 (0.0010) +[2023-10-08 15:56:47,831][21194] Updated weights for policy 1, policy_version 6170 (0.0007) +[2023-10-08 15:56:48,551][21195] Updated weights for policy 0, policy_version 6210 (0.0009) +[2023-10-08 15:56:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 12681216. Throughput: 0: 1725.8, 1: 1753.1. Samples: 3178892. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:56:48,803][19739] Avg episode reward: [(0, '65.590'), (1, '69.750')] +[2023-10-08 15:56:48,804][20836] Saving new best policy, reward=69.750! +[2023-10-08 15:56:48,931][21195] Updated weights for policy 0, policy_version 6220 (0.0008) +[2023-10-08 15:56:49,293][21195] Updated weights for policy 0, policy_version 6230 (0.0009) +[2023-10-08 15:56:49,665][21195] Updated weights for policy 0, policy_version 6240 (0.0009) +[2023-10-08 15:56:51,850][21194] Updated weights for policy 1, policy_version 6180 (0.0009) +[2023-10-08 15:56:52,214][21194] Updated weights for policy 1, policy_version 6190 (0.0010) +[2023-10-08 15:56:52,579][21194] Updated weights for policy 1, policy_version 6200 (0.0010) +[2023-10-08 15:56:53,653][21195] Updated weights for policy 0, policy_version 6250 (0.0008) +[2023-10-08 15:56:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 12746752. Throughput: 0: 1725.9, 1: 1736.8. Samples: 3193940. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 15:56:53,803][19739] Avg episode reward: [(0, '64.290'), (1, '75.790')] +[2023-10-08 15:56:53,804][20836] Saving new best policy, reward=75.790! +[2023-10-08 15:56:54,020][21195] Updated weights for policy 0, policy_version 6260 (0.0009) +[2023-10-08 15:56:54,397][21195] Updated weights for policy 0, policy_version 6270 (0.0008) +[2023-10-08 15:56:56,553][21194] Updated weights for policy 1, policy_version 6210 (0.0011) +[2023-10-08 15:56:56,932][21194] Updated weights for policy 1, policy_version 6220 (0.0008) +[2023-10-08 15:56:57,300][21194] Updated weights for policy 1, policy_version 6230 (0.0008) +[2023-10-08 15:56:57,669][21194] Updated weights for policy 1, policy_version 6240 (0.0008) +[2023-10-08 15:56:58,319][21195] Updated weights for policy 0, policy_version 6280 (0.0008) +[2023-10-08 15:56:58,688][21195] Updated weights for policy 0, policy_version 6290 (0.0007) +[2023-10-08 15:56:58,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 12812288. Throughput: 0: 1733.9, 1: 1713.4. Samples: 3214544. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 15:56:58,803][19739] Avg episode reward: [(0, '68.050'), (1, '75.790')] +[2023-10-08 15:56:59,068][21195] Updated weights for policy 0, policy_version 6300 (0.0009) +[2023-10-08 15:56:59,216][20740] Saving new best policy, reward=68.050! +[2023-10-08 15:57:01,756][21194] Updated weights for policy 1, policy_version 6250 (0.0008) +[2023-10-08 15:57:02,135][21194] Updated weights for policy 1, policy_version 6260 (0.0010) +[2023-10-08 15:57:02,509][21194] Updated weights for policy 1, policy_version 6270 (0.0008) +[2023-10-08 15:57:03,151][21195] Updated weights for policy 0, policy_version 6310 (0.0009) +[2023-10-08 15:57:03,527][21195] Updated weights for policy 0, policy_version 6320 (0.0009) +[2023-10-08 15:57:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 12877824. Throughput: 0: 1704.8, 1: 1739.2. Samples: 3230026. Policy #0 lag: (min: 31.0, avg: 37.0, max: 63.0) +[2023-10-08 15:57:03,803][19739] Avg episode reward: [(0, '70.220'), (1, '75.390')] +[2023-10-08 15:57:03,895][21195] Updated weights for policy 0, policy_version 6330 (0.0011) +[2023-10-08 15:57:04,110][20740] Saving new best policy, reward=70.220! +[2023-10-08 15:57:06,468][21194] Updated weights for policy 1, policy_version 6280 (0.0007) +[2023-10-08 15:57:06,843][21194] Updated weights for policy 1, policy_version 6290 (0.0007) +[2023-10-08 15:57:07,216][21194] Updated weights for policy 1, policy_version 6300 (0.0009) +[2023-10-08 15:57:07,976][21195] Updated weights for policy 0, policy_version 6340 (0.0008) +[2023-10-08 15:57:08,350][21195] Updated weights for policy 0, policy_version 6350 (0.0009) +[2023-10-08 15:57:08,708][21195] Updated weights for policy 0, policy_version 6360 (0.0011) +[2023-10-08 15:57:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 12943360. Throughput: 0: 1722.9, 1: 1717.3. Samples: 3245156. Policy #0 lag: (min: 31.0, avg: 37.0, max: 63.0) +[2023-10-08 15:57:08,803][19739] Avg episode reward: [(0, '70.910'), (1, '78.960')] +[2023-10-08 15:57:08,804][20836] Saving new best policy, reward=78.960! +[2023-10-08 15:57:09,001][20740] Saving new best policy, reward=70.910! +[2023-10-08 15:57:11,137][21194] Updated weights for policy 1, policy_version 6310 (0.0007) +[2023-10-08 15:57:11,496][21194] Updated weights for policy 1, policy_version 6320 (0.0007) +[2023-10-08 15:57:11,861][21194] Updated weights for policy 1, policy_version 6330 (0.0010) +[2023-10-08 15:57:12,615][21195] Updated weights for policy 0, policy_version 6370 (0.0009) +[2023-10-08 15:57:12,997][21195] Updated weights for policy 0, policy_version 6380 (0.0008) +[2023-10-08 15:57:13,369][21195] Updated weights for policy 0, policy_version 6390 (0.0007) +[2023-10-08 15:57:13,731][21195] Updated weights for policy 0, policy_version 6400 (0.0007) +[2023-10-08 15:57:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 13041664. Throughput: 0: 1715.7, 1: 1708.5. Samples: 3265734. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 15:57:13,803][19739] Avg episode reward: [(0, '76.180'), (1, '78.960')] +[2023-10-08 15:57:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000006400_6553600.pth... +[2023-10-08 15:57:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000006336_6488064.pth... +[2023-10-08 15:57:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000004768_4882432.pth +[2023-10-08 15:57:13,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000004736_4849664.pth +[2023-10-08 15:57:13,853][20740] Saving new best policy, reward=76.180! +[2023-10-08 15:57:15,764][21194] Updated weights for policy 1, policy_version 6340 (0.0010) +[2023-10-08 15:57:16,139][21194] Updated weights for policy 1, policy_version 6350 (0.0007) +[2023-10-08 15:57:16,498][21194] Updated weights for policy 1, policy_version 6360 (0.0007) +[2023-10-08 15:57:17,589][21195] Updated weights for policy 0, policy_version 6410 (0.0010) +[2023-10-08 15:57:17,961][21195] Updated weights for policy 0, policy_version 6420 (0.0010) +[2023-10-08 15:57:18,336][21195] Updated weights for policy 0, policy_version 6430 (0.0011) +[2023-10-08 15:57:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 13107200. Throughput: 0: 1694.8, 1: 1727.7. Samples: 3281086. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:57:18,803][19739] Avg episode reward: [(0, '76.040'), (1, '82.830')] +[2023-10-08 15:57:18,804][20836] Saving new best policy, reward=82.830! +[2023-10-08 15:57:20,209][21194] Updated weights for policy 1, policy_version 6370 (0.0008) +[2023-10-08 15:57:20,570][21194] Updated weights for policy 1, policy_version 6380 (0.0007) +[2023-10-08 15:57:20,941][21194] Updated weights for policy 1, policy_version 6390 (0.0009) +[2023-10-08 15:57:21,313][21194] Updated weights for policy 1, policy_version 6400 (0.0009) +[2023-10-08 15:57:22,273][21195] Updated weights for policy 0, policy_version 6440 (0.0011) +[2023-10-08 15:57:22,644][21195] Updated weights for policy 0, policy_version 6450 (0.0009) +[2023-10-08 15:57:23,014][21195] Updated weights for policy 0, policy_version 6460 (0.0008) +[2023-10-08 15:57:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 13172736. Throughput: 0: 1730.6, 1: 1706.6. Samples: 3297386. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:57:23,803][19739] Avg episode reward: [(0, '71.700'), (1, '81.280')] +[2023-10-08 15:57:25,283][21194] Updated weights for policy 1, policy_version 6410 (0.0009) +[2023-10-08 15:57:25,654][21194] Updated weights for policy 1, policy_version 6420 (0.0009) +[2023-10-08 15:57:26,016][21194] Updated weights for policy 1, policy_version 6430 (0.0008) +[2023-10-08 15:57:27,033][21195] Updated weights for policy 0, policy_version 6470 (0.0009) +[2023-10-08 15:57:27,417][21195] Updated weights for policy 0, policy_version 6480 (0.0008) +[2023-10-08 15:57:27,783][21195] Updated weights for policy 0, policy_version 6490 (0.0007) +[2023-10-08 15:57:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 13238272. Throughput: 0: 1701.2, 1: 1732.5. Samples: 3317780. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 15:57:28,803][19739] Avg episode reward: [(0, '73.970'), (1, '89.480')] +[2023-10-08 15:57:28,811][20836] Saving new best policy, reward=89.480! +[2023-10-08 15:57:30,118][21194] Updated weights for policy 1, policy_version 6440 (0.0008) +[2023-10-08 15:57:30,485][21194] Updated weights for policy 1, policy_version 6450 (0.0009) +[2023-10-08 15:57:30,850][21194] Updated weights for policy 1, policy_version 6460 (0.0009) +[2023-10-08 15:57:31,621][21195] Updated weights for policy 0, policy_version 6500 (0.0008) +[2023-10-08 15:57:31,991][21195] Updated weights for policy 0, policy_version 6510 (0.0008) +[2023-10-08 15:57:32,356][21195] Updated weights for policy 0, policy_version 6520 (0.0009) +[2023-10-08 15:57:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 13303808. Throughput: 0: 1709.6, 1: 1705.6. Samples: 3332578. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 15:57:33,803][19739] Avg episode reward: [(0, '76.400'), (1, '89.480')] +[2023-10-08 15:57:33,804][20740] Saving new best policy, reward=76.400! +[2023-10-08 15:57:34,741][21194] Updated weights for policy 1, policy_version 6470 (0.0009) +[2023-10-08 15:57:35,111][21194] Updated weights for policy 1, policy_version 6480 (0.0008) +[2023-10-08 15:57:35,480][21194] Updated weights for policy 1, policy_version 6490 (0.0008) +[2023-10-08 15:57:36,324][21195] Updated weights for policy 0, policy_version 6530 (0.0007) +[2023-10-08 15:57:36,698][21195] Updated weights for policy 0, policy_version 6540 (0.0008) +[2023-10-08 15:57:37,061][21195] Updated weights for policy 0, policy_version 6550 (0.0008) +[2023-10-08 15:57:37,427][21195] Updated weights for policy 0, policy_version 6560 (0.0007) +[2023-10-08 15:57:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13369344. Throughput: 0: 1722.2, 1: 1718.8. Samples: 3348786. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 15:57:38,803][19739] Avg episode reward: [(0, '70.880'), (1, '89.480')] +[2023-10-08 15:57:39,465][21194] Updated weights for policy 1, policy_version 6500 (0.0008) +[2023-10-08 15:57:39,831][21194] Updated weights for policy 1, policy_version 6510 (0.0007) +[2023-10-08 15:57:40,195][21194] Updated weights for policy 1, policy_version 6520 (0.0010) +[2023-10-08 15:57:41,208][21195] Updated weights for policy 0, policy_version 6570 (0.0009) +[2023-10-08 15:57:41,580][21195] Updated weights for policy 0, policy_version 6580 (0.0007) +[2023-10-08 15:57:41,942][21195] Updated weights for policy 0, policy_version 6590 (0.0007) +[2023-10-08 15:57:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13434880. Throughput: 0: 1703.8, 1: 1738.6. Samples: 3369452. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 15:57:43,803][19739] Avg episode reward: [(0, '70.860'), (1, '93.510')] +[2023-10-08 15:57:43,813][20836] Saving new best policy, reward=93.510! +[2023-10-08 15:57:44,095][21194] Updated weights for policy 1, policy_version 6530 (0.0009) +[2023-10-08 15:57:44,467][21194] Updated weights for policy 1, policy_version 6540 (0.0009) +[2023-10-08 15:57:44,830][21194] Updated weights for policy 1, policy_version 6550 (0.0007) +[2023-10-08 15:57:45,202][21194] Updated weights for policy 1, policy_version 6560 (0.0008) +[2023-10-08 15:57:45,722][21195] Updated weights for policy 0, policy_version 6600 (0.0007) +[2023-10-08 15:57:46,095][21195] Updated weights for policy 0, policy_version 6610 (0.0009) +[2023-10-08 15:57:46,461][21195] Updated weights for policy 0, policy_version 6620 (0.0008) +[2023-10-08 15:57:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 13500416. Throughput: 0: 1733.4, 1: 1711.2. Samples: 3385034. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 15:57:48,803][19739] Avg episode reward: [(0, '68.390'), (1, '93.510')] +[2023-10-08 15:57:49,142][21194] Updated weights for policy 1, policy_version 6570 (0.0010) +[2023-10-08 15:57:49,515][21194] Updated weights for policy 1, policy_version 6580 (0.0009) +[2023-10-08 15:57:49,874][21194] Updated weights for policy 1, policy_version 6590 (0.0008) +[2023-10-08 15:57:50,445][21195] Updated weights for policy 0, policy_version 6630 (0.0009) +[2023-10-08 15:57:50,815][21195] Updated weights for policy 0, policy_version 6640 (0.0012) +[2023-10-08 15:57:51,179][21195] Updated weights for policy 0, policy_version 6650 (0.0009) +[2023-10-08 15:57:53,743][21194] Updated weights for policy 1, policy_version 6600 (0.0008) +[2023-10-08 15:57:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 13565952. Throughput: 0: 1717.6, 1: 1735.8. Samples: 3400560. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 15:57:53,803][19739] Avg episode reward: [(0, '64.890'), (1, '93.510')] +[2023-10-08 15:57:54,113][21194] Updated weights for policy 1, policy_version 6610 (0.0010) +[2023-10-08 15:57:54,480][21194] Updated weights for policy 1, policy_version 6620 (0.0011) +[2023-10-08 15:57:55,026][21195] Updated weights for policy 0, policy_version 6660 (0.0008) +[2023-10-08 15:57:55,402][21195] Updated weights for policy 0, policy_version 6670 (0.0008) +[2023-10-08 15:57:55,761][21195] Updated weights for policy 0, policy_version 6680 (0.0008) +[2023-10-08 15:57:58,323][21194] Updated weights for policy 1, policy_version 6630 (0.0010) +[2023-10-08 15:57:58,693][21194] Updated weights for policy 1, policy_version 6640 (0.0011) +[2023-10-08 15:57:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13631488. Throughput: 0: 1726.4, 1: 1749.8. Samples: 3422162. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:57:58,803][19739] Avg episode reward: [(0, '63.740'), (1, '93.510')] +[2023-10-08 15:57:59,054][21194] Updated weights for policy 1, policy_version 6650 (0.0011) +[2023-10-08 15:57:59,637][21195] Updated weights for policy 0, policy_version 6690 (0.0007) +[2023-10-08 15:58:00,011][21195] Updated weights for policy 0, policy_version 6700 (0.0009) +[2023-10-08 15:58:00,378][21195] Updated weights for policy 0, policy_version 6710 (0.0009) +[2023-10-08 15:58:00,751][21195] Updated weights for policy 0, policy_version 6720 (0.0008) +[2023-10-08 15:58:03,030][21194] Updated weights for policy 1, policy_version 6660 (0.0009) +[2023-10-08 15:58:03,400][21194] Updated weights for policy 1, policy_version 6670 (0.0008) +[2023-10-08 15:58:03,769][21194] Updated weights for policy 1, policy_version 6680 (0.0009) +[2023-10-08 15:58:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13697024. Throughput: 0: 1747.2, 1: 1729.2. Samples: 3437524. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:58:03,803][19739] Avg episode reward: [(0, '70.850'), (1, '93.510')] +[2023-10-08 15:58:04,753][21195] Updated weights for policy 0, policy_version 6730 (0.0007) +[2023-10-08 15:58:05,117][21195] Updated weights for policy 0, policy_version 6740 (0.0007) +[2023-10-08 15:58:05,486][21195] Updated weights for policy 0, policy_version 6750 (0.0009) +[2023-10-08 15:58:07,800][21194] Updated weights for policy 1, policy_version 6690 (0.0007) +[2023-10-08 15:58:08,159][21194] Updated weights for policy 1, policy_version 6700 (0.0011) +[2023-10-08 15:58:08,536][21194] Updated weights for policy 1, policy_version 6710 (0.0011) +[2023-10-08 15:58:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13762560. Throughput: 0: 1715.6, 1: 1741.7. Samples: 3452962. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 15:58:08,803][19739] Avg episode reward: [(0, '70.070'), (1, '99.900')] +[2023-10-08 15:58:08,895][20836] Saving new best policy, reward=99.900! +[2023-10-08 15:58:08,896][21194] Updated weights for policy 1, policy_version 6720 (0.0010) +[2023-10-08 15:58:09,191][21195] Updated weights for policy 0, policy_version 6760 (0.0009) +[2023-10-08 15:58:09,565][21195] Updated weights for policy 0, policy_version 6770 (0.0008) +[2023-10-08 15:58:09,931][21195] Updated weights for policy 0, policy_version 6780 (0.0010) +[2023-10-08 15:58:12,918][21194] Updated weights for policy 1, policy_version 6730 (0.0008) +[2023-10-08 15:58:13,298][21194] Updated weights for policy 1, policy_version 6740 (0.0007) +[2023-10-08 15:58:13,666][21194] Updated weights for policy 1, policy_version 6750 (0.0008) +[2023-10-08 15:58:13,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 13860864. Throughput: 0: 1746.1, 1: 1718.3. Samples: 3473680. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 15:58:13,804][19739] Avg episode reward: [(0, '69.600'), (1, '99.900')] +[2023-10-08 15:58:13,925][21195] Updated weights for policy 0, policy_version 6790 (0.0010) +[2023-10-08 15:58:14,303][21195] Updated weights for policy 0, policy_version 6800 (0.0008) +[2023-10-08 15:58:14,680][21195] Updated weights for policy 0, policy_version 6810 (0.0007) +[2023-10-08 15:58:17,702][21194] Updated weights for policy 1, policy_version 6760 (0.0009) +[2023-10-08 15:58:18,078][21194] Updated weights for policy 1, policy_version 6770 (0.0007) +[2023-10-08 15:58:18,441][21194] Updated weights for policy 1, policy_version 6780 (0.0009) +[2023-10-08 15:58:18,579][21195] Updated weights for policy 0, policy_version 6820 (0.0007) +[2023-10-08 15:58:18,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13926400. Throughput: 0: 1743.0, 1: 1736.8. Samples: 3489172. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 15:58:18,803][19739] Avg episode reward: [(0, '63.210'), (1, '113.120')] +[2023-10-08 15:58:18,804][20836] Saving new best policy, reward=113.120! +[2023-10-08 15:58:18,951][21195] Updated weights for policy 0, policy_version 6830 (0.0009) +[2023-10-08 15:58:19,318][21195] Updated weights for policy 0, policy_version 6840 (0.0008) +[2023-10-08 15:58:22,348][21194] Updated weights for policy 1, policy_version 6790 (0.0007) +[2023-10-08 15:58:22,717][21194] Updated weights for policy 1, policy_version 6800 (0.0007) +[2023-10-08 15:58:23,082][21194] Updated weights for policy 1, policy_version 6810 (0.0007) +[2023-10-08 15:58:23,108][21195] Updated weights for policy 0, policy_version 6850 (0.0008) +[2023-10-08 15:58:23,488][21195] Updated weights for policy 0, policy_version 6860 (0.0008) +[2023-10-08 15:58:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 13991936. Throughput: 0: 1741.1, 1: 1731.5. Samples: 3505054. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 15:58:23,803][19739] Avg episode reward: [(0, '60.530'), (1, '113.120')] +[2023-10-08 15:58:23,861][21195] Updated weights for policy 0, policy_version 6870 (0.0008) +[2023-10-08 15:58:24,232][21195] Updated weights for policy 0, policy_version 6880 (0.0009) +[2023-10-08 15:58:26,859][21194] Updated weights for policy 1, policy_version 6820 (0.0008) +[2023-10-08 15:58:27,230][21194] Updated weights for policy 1, policy_version 6830 (0.0008) +[2023-10-08 15:58:27,593][21194] Updated weights for policy 1, policy_version 6840 (0.0008) +[2023-10-08 15:58:28,265][21195] Updated weights for policy 0, policy_version 6890 (0.0007) +[2023-10-08 15:58:28,632][21195] Updated weights for policy 0, policy_version 6900 (0.0009) +[2023-10-08 15:58:28,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 14057472. Throughput: 0: 1761.4, 1: 1706.7. Samples: 3525518. Policy #0 lag: (min: 8.0, avg: 26.4, max: 40.0) +[2023-10-08 15:58:28,804][19739] Avg episode reward: [(0, '59.740'), (1, '118.200')] +[2023-10-08 15:58:28,815][20836] Saving new best policy, reward=118.200! +[2023-10-08 15:58:29,000][21195] Updated weights for policy 0, policy_version 6910 (0.0008) +[2023-10-08 15:58:31,477][21194] Updated weights for policy 1, policy_version 6850 (0.0008) +[2023-10-08 15:58:31,852][21194] Updated weights for policy 1, policy_version 6860 (0.0007) +[2023-10-08 15:58:32,213][21194] Updated weights for policy 1, policy_version 6870 (0.0007) +[2023-10-08 15:58:32,576][21194] Updated weights for policy 1, policy_version 6880 (0.0007) +[2023-10-08 15:58:32,775][21195] Updated weights for policy 0, policy_version 6920 (0.0009) +[2023-10-08 15:58:33,157][21195] Updated weights for policy 0, policy_version 6930 (0.0009) +[2023-10-08 15:58:33,524][21195] Updated weights for policy 0, policy_version 6940 (0.0008) +[2023-10-08 15:58:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 14155776. Throughput: 0: 1729.6, 1: 1736.9. Samples: 3541028. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 15:58:33,803][19739] Avg episode reward: [(0, '63.690'), (1, '119.630')] +[2023-10-08 15:58:33,804][20836] Saving new best policy, reward=119.630! +[2023-10-08 15:58:36,589][21194] Updated weights for policy 1, policy_version 6890 (0.0009) +[2023-10-08 15:58:36,964][21194] Updated weights for policy 1, policy_version 6900 (0.0007) +[2023-10-08 15:58:37,334][21194] Updated weights for policy 1, policy_version 6910 (0.0009) +[2023-10-08 15:58:37,340][21195] Updated weights for policy 0, policy_version 6950 (0.0009) +[2023-10-08 15:58:37,708][21195] Updated weights for policy 0, policy_version 6960 (0.0008) +[2023-10-08 15:58:38,086][21195] Updated weights for policy 0, policy_version 6970 (0.0007) +[2023-10-08 15:58:38,803][19739] Fps is (10 sec: 16384.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 14221312. Throughput: 0: 1759.2, 1: 1714.6. Samples: 3556882. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 15:58:38,803][19739] Avg episode reward: [(0, '66.090'), (1, '126.450')] +[2023-10-08 15:58:38,804][20836] Saving new best policy, reward=126.450! +[2023-10-08 15:58:41,504][21194] Updated weights for policy 1, policy_version 6920 (0.0010) +[2023-10-08 15:58:41,869][21194] Updated weights for policy 1, policy_version 6930 (0.0007) +[2023-10-08 15:58:42,017][21195] Updated weights for policy 0, policy_version 6980 (0.0008) +[2023-10-08 15:58:42,237][21194] Updated weights for policy 1, policy_version 6940 (0.0007) +[2023-10-08 15:58:42,392][21195] Updated weights for policy 0, policy_version 6990 (0.0007) +[2023-10-08 15:58:42,760][21195] Updated weights for policy 0, policy_version 7000 (0.0010) +[2023-10-08 15:58:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 14286848. Throughput: 0: 1739.5, 1: 1697.2. Samples: 3576812. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:58:43,803][19739] Avg episode reward: [(0, '67.260'), (1, '125.290')] +[2023-10-08 15:58:46,320][21194] Updated weights for policy 1, policy_version 6950 (0.0007) +[2023-10-08 15:58:46,688][21194] Updated weights for policy 1, policy_version 6960 (0.0011) +[2023-10-08 15:58:46,827][21195] Updated weights for policy 0, policy_version 7010 (0.0009) +[2023-10-08 15:58:47,050][21194] Updated weights for policy 1, policy_version 6970 (0.0008) +[2023-10-08 15:58:47,190][21195] Updated weights for policy 0, policy_version 7020 (0.0008) +[2023-10-08 15:58:47,572][21195] Updated weights for policy 0, policy_version 7030 (0.0008) +[2023-10-08 15:58:47,935][21195] Updated weights for policy 0, policy_version 7040 (0.0008) +[2023-10-08 15:58:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 14352384. Throughput: 0: 1729.0, 1: 1724.8. Samples: 3592942. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:58:48,803][19739] Avg episode reward: [(0, '72.240'), (1, '136.860')] +[2023-10-08 15:58:48,805][20836] Saving new best policy, reward=136.860! +[2023-10-08 15:58:51,033][21194] Updated weights for policy 1, policy_version 6980 (0.0008) +[2023-10-08 15:58:51,404][21194] Updated weights for policy 1, policy_version 6990 (0.0007) +[2023-10-08 15:58:51,774][21194] Updated weights for policy 1, policy_version 7000 (0.0008) +[2023-10-08 15:58:51,890][21195] Updated weights for policy 0, policy_version 7050 (0.0008) +[2023-10-08 15:58:52,267][21195] Updated weights for policy 0, policy_version 7060 (0.0009) +[2023-10-08 15:58:52,631][21195] Updated weights for policy 0, policy_version 7070 (0.0009) +[2023-10-08 15:58:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 14417920. Throughput: 0: 1752.0, 1: 1697.9. Samples: 3608210. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 15:58:53,803][19739] Avg episode reward: [(0, '72.980'), (1, '148.570')] +[2023-10-08 15:58:53,804][20836] Saving new best policy, reward=148.570! +[2023-10-08 15:58:55,661][21194] Updated weights for policy 1, policy_version 7010 (0.0008) +[2023-10-08 15:58:56,029][21194] Updated weights for policy 1, policy_version 7020 (0.0007) +[2023-10-08 15:58:56,392][21194] Updated weights for policy 1, policy_version 7030 (0.0009) +[2023-10-08 15:58:56,641][21195] Updated weights for policy 0, policy_version 7080 (0.0009) +[2023-10-08 15:58:56,759][21194] Updated weights for policy 1, policy_version 7040 (0.0009) +[2023-10-08 15:58:57,013][21195] Updated weights for policy 0, policy_version 7090 (0.0007) +[2023-10-08 15:58:57,384][21195] Updated weights for policy 0, policy_version 7100 (0.0007) +[2023-10-08 15:58:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 14483456. Throughput: 0: 1728.2, 1: 1709.3. Samples: 3628368. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 15:58:58,803][19739] Avg episode reward: [(0, '67.110'), (1, '155.760')] +[2023-10-08 15:58:58,813][20836] Saving new best policy, reward=155.760! +[2023-10-08 15:59:00,729][21194] Updated weights for policy 1, policy_version 7050 (0.0008) +[2023-10-08 15:59:01,102][21194] Updated weights for policy 1, policy_version 7060 (0.0008) +[2023-10-08 15:59:01,133][21195] Updated weights for policy 0, policy_version 7110 (0.0008) +[2023-10-08 15:59:01,465][21194] Updated weights for policy 1, policy_version 7070 (0.0007) +[2023-10-08 15:59:01,493][21195] Updated weights for policy 0, policy_version 7120 (0.0009) +[2023-10-08 15:59:01,866][21195] Updated weights for policy 0, policy_version 7130 (0.0008) +[2023-10-08 15:59:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 14548992. Throughput: 0: 1739.6, 1: 1715.6. Samples: 3644654. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 15:59:03,803][19739] Avg episode reward: [(0, '67.300'), (1, '155.580')] +[2023-10-08 15:59:05,445][21194] Updated weights for policy 1, policy_version 7080 (0.0007) +[2023-10-08 15:59:05,759][21195] Updated weights for policy 0, policy_version 7140 (0.0009) +[2023-10-08 15:59:05,818][21194] Updated weights for policy 1, policy_version 7090 (0.0009) +[2023-10-08 15:59:06,124][21195] Updated weights for policy 0, policy_version 7150 (0.0007) +[2023-10-08 15:59:06,183][21194] Updated weights for policy 1, policy_version 7100 (0.0008) +[2023-10-08 15:59:06,491][21195] Updated weights for policy 0, policy_version 7160 (0.0009) +[2023-10-08 15:59:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 14614528. Throughput: 0: 1729.2, 1: 1702.2. Samples: 3659466. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 15:59:08,803][19739] Avg episode reward: [(0, '68.070'), (1, '157.010')] +[2023-10-08 15:59:08,804][20836] Saving new best policy, reward=157.010! +[2023-10-08 15:59:10,165][21194] Updated weights for policy 1, policy_version 7110 (0.0008) +[2023-10-08 15:59:10,541][21194] Updated weights for policy 1, policy_version 7120 (0.0008) +[2023-10-08 15:59:10,563][21195] Updated weights for policy 0, policy_version 7170 (0.0010) +[2023-10-08 15:59:10,913][21194] Updated weights for policy 1, policy_version 7130 (0.0008) +[2023-10-08 15:59:10,931][21195] Updated weights for policy 0, policy_version 7180 (0.0007) +[2023-10-08 15:59:11,302][21195] Updated weights for policy 0, policy_version 7190 (0.0009) +[2023-10-08 15:59:11,669][21195] Updated weights for policy 0, policy_version 7200 (0.0010) +[2023-10-08 15:59:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 14680064. Throughput: 0: 1719.8, 1: 1731.3. Samples: 3680818. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 15:59:13,804][19739] Avg episode reward: [(0, '68.380'), (1, '162.190')] +[2023-10-08 15:59:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000007200_7372800.pth... +[2023-10-08 15:59:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000007136_7307264.pth... +[2023-10-08 15:59:13,845][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000005600_5734400.pth +[2023-10-08 15:59:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000005536_5668864.pth +[2023-10-08 15:59:13,851][20836] Saving new best policy, reward=162.190! +[2023-10-08 15:59:14,741][21194] Updated weights for policy 1, policy_version 7140 (0.0009) +[2023-10-08 15:59:15,111][21194] Updated weights for policy 1, policy_version 7150 (0.0010) +[2023-10-08 15:59:15,468][21195] Updated weights for policy 0, policy_version 7210 (0.0009) +[2023-10-08 15:59:15,473][21194] Updated weights for policy 1, policy_version 7160 (0.0008) +[2023-10-08 15:59:15,847][21195] Updated weights for policy 0, policy_version 7220 (0.0010) +[2023-10-08 15:59:16,222][21195] Updated weights for policy 0, policy_version 7230 (0.0008) +[2023-10-08 15:59:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 14745600. Throughput: 0: 1749.0, 1: 1702.3. Samples: 3696336. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 15:59:18,803][19739] Avg episode reward: [(0, '69.710'), (1, '165.930')] +[2023-10-08 15:59:18,804][20836] Saving new best policy, reward=165.930! +[2023-10-08 15:59:19,382][21194] Updated weights for policy 1, policy_version 7170 (0.0007) +[2023-10-08 15:59:19,741][21194] Updated weights for policy 1, policy_version 7180 (0.0010) +[2023-10-08 15:59:20,114][21194] Updated weights for policy 1, policy_version 7190 (0.0008) +[2023-10-08 15:59:20,197][21195] Updated weights for policy 0, policy_version 7240 (0.0009) +[2023-10-08 15:59:20,473][21194] Updated weights for policy 1, policy_version 7200 (0.0008) +[2023-10-08 15:59:20,564][21195] Updated weights for policy 0, policy_version 7250 (0.0007) +[2023-10-08 15:59:20,932][21195] Updated weights for policy 0, policy_version 7260 (0.0011) +[2023-10-08 15:59:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 14811136. Throughput: 0: 1720.2, 1: 1720.4. Samples: 3711712. Policy #0 lag: (min: 9.0, avg: 28.2, max: 41.0) +[2023-10-08 15:59:23,803][19739] Avg episode reward: [(0, '71.380'), (1, '165.470')] +[2023-10-08 15:59:24,508][21194] Updated weights for policy 1, policy_version 7210 (0.0009) +[2023-10-08 15:59:24,694][21195] Updated weights for policy 0, policy_version 7270 (0.0008) +[2023-10-08 15:59:24,872][21194] Updated weights for policy 1, policy_version 7220 (0.0008) +[2023-10-08 15:59:25,065][21195] Updated weights for policy 0, policy_version 7280 (0.0009) +[2023-10-08 15:59:25,243][21194] Updated weights for policy 1, policy_version 7230 (0.0008) +[2023-10-08 15:59:25,443][21195] Updated weights for policy 0, policy_version 7290 (0.0010) +[2023-10-08 15:59:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 14876672. Throughput: 0: 1742.8, 1: 1736.1. Samples: 3733362. Policy #0 lag: (min: 9.0, avg: 28.2, max: 41.0) +[2023-10-08 15:59:28,803][19739] Avg episode reward: [(0, '75.340'), (1, '165.070')] +[2023-10-08 15:59:28,934][21194] Updated weights for policy 1, policy_version 7240 (0.0009) +[2023-10-08 15:59:29,267][21195] Updated weights for policy 0, policy_version 7300 (0.0009) +[2023-10-08 15:59:29,297][21194] Updated weights for policy 1, policy_version 7250 (0.0009) +[2023-10-08 15:59:29,634][21195] Updated weights for policy 0, policy_version 7310 (0.0009) +[2023-10-08 15:59:29,665][21194] Updated weights for policy 1, policy_version 7260 (0.0010) +[2023-10-08 15:59:29,998][21195] Updated weights for policy 0, policy_version 7320 (0.0007) +[2023-10-08 15:59:33,524][21194] Updated weights for policy 1, policy_version 7270 (0.0009) +[2023-10-08 15:59:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 14942208. Throughput: 0: 1752.3, 1: 1708.4. Samples: 3748670. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 15:59:33,803][19739] Avg episode reward: [(0, '76.210'), (1, '165.070')] +[2023-10-08 15:59:33,890][21194] Updated weights for policy 1, policy_version 7280 (0.0008) +[2023-10-08 15:59:33,991][21195] Updated weights for policy 0, policy_version 7330 (0.0009) +[2023-10-08 15:59:34,262][21194] Updated weights for policy 1, policy_version 7290 (0.0009) +[2023-10-08 15:59:34,358][21195] Updated weights for policy 0, policy_version 7340 (0.0007) +[2023-10-08 15:59:34,725][21195] Updated weights for policy 0, policy_version 7350 (0.0007) +[2023-10-08 15:59:35,084][21195] Updated weights for policy 0, policy_version 7360 (0.0009) +[2023-10-08 15:59:38,238][21194] Updated weights for policy 1, policy_version 7300 (0.0007) +[2023-10-08 15:59:38,605][21194] Updated weights for policy 1, policy_version 7310 (0.0008) +[2023-10-08 15:59:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 15007744. Throughput: 0: 1724.8, 1: 1739.5. Samples: 3764104. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 15:59:38,803][19739] Avg episode reward: [(0, '76.150'), (1, '174.040')] +[2023-10-08 15:59:38,973][21194] Updated weights for policy 1, policy_version 7320 (0.0009) +[2023-10-08 15:59:39,073][21195] Updated weights for policy 0, policy_version 7370 (0.0010) +[2023-10-08 15:59:39,270][20836] Saving new best policy, reward=174.040! +[2023-10-08 15:59:39,443][21195] Updated weights for policy 0, policy_version 7380 (0.0007) +[2023-10-08 15:59:39,823][21195] Updated weights for policy 0, policy_version 7390 (0.0007) +[2023-10-08 15:59:42,863][21194] Updated weights for policy 1, policy_version 7330 (0.0008) +[2023-10-08 15:59:43,229][21194] Updated weights for policy 1, policy_version 7340 (0.0008) +[2023-10-08 15:59:43,595][21194] Updated weights for policy 1, policy_version 7350 (0.0008) +[2023-10-08 15:59:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 15073280. Throughput: 0: 1743.3, 1: 1742.3. Samples: 3785220. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 15:59:43,803][19739] Avg episode reward: [(0, '72.870'), (1, '176.880')] +[2023-10-08 15:59:43,850][21195] Updated weights for policy 0, policy_version 7400 (0.0008) +[2023-10-08 15:59:43,961][20836] Saving new best policy, reward=176.880! +[2023-10-08 15:59:43,963][21194] Updated weights for policy 1, policy_version 7360 (0.0008) +[2023-10-08 15:59:44,227][21195] Updated weights for policy 0, policy_version 7410 (0.0007) +[2023-10-08 15:59:44,601][21195] Updated weights for policy 0, policy_version 7420 (0.0007) +[2023-10-08 15:59:47,841][21194] Updated weights for policy 1, policy_version 7370 (0.0009) +[2023-10-08 15:59:48,213][21194] Updated weights for policy 1, policy_version 7380 (0.0007) +[2023-10-08 15:59:48,584][21194] Updated weights for policy 1, policy_version 7390 (0.0007) +[2023-10-08 15:59:48,653][21195] Updated weights for policy 0, policy_version 7430 (0.0007) +[2023-10-08 15:59:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 15171584. Throughput: 0: 1723.8, 1: 1732.7. Samples: 3800196. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 15:59:48,803][19739] Avg episode reward: [(0, '76.110'), (1, '176.880')] +[2023-10-08 15:59:49,015][21195] Updated weights for policy 0, policy_version 7440 (0.0009) +[2023-10-08 15:59:49,395][21195] Updated weights for policy 0, policy_version 7450 (0.0010) +[2023-10-08 15:59:52,754][21194] Updated weights for policy 1, policy_version 7400 (0.0007) +[2023-10-08 15:59:53,132][21194] Updated weights for policy 1, policy_version 7410 (0.0007) +[2023-10-08 15:59:53,469][21195] Updated weights for policy 0, policy_version 7460 (0.0008) +[2023-10-08 15:59:53,500][21194] Updated weights for policy 1, policy_version 7420 (0.0007) +[2023-10-08 15:59:53,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 15237120. Throughput: 0: 1728.3, 1: 1741.8. Samples: 3815622. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:59:53,803][19739] Avg episode reward: [(0, '77.240'), (1, '174.880')] +[2023-10-08 15:59:53,841][21195] Updated weights for policy 0, policy_version 7470 (0.0008) +[2023-10-08 15:59:54,215][21195] Updated weights for policy 0, policy_version 7480 (0.0009) +[2023-10-08 15:59:54,505][20740] Saving new best policy, reward=77.240! +[2023-10-08 15:59:57,488][21194] Updated weights for policy 1, policy_version 7430 (0.0010) +[2023-10-08 15:59:57,869][21194] Updated weights for policy 1, policy_version 7440 (0.0008) +[2023-10-08 15:59:57,886][21195] Updated weights for policy 0, policy_version 7490 (0.0010) +[2023-10-08 15:59:58,230][21194] Updated weights for policy 1, policy_version 7450 (0.0009) +[2023-10-08 15:59:58,252][21195] Updated weights for policy 0, policy_version 7500 (0.0008) +[2023-10-08 15:59:58,621][21195] Updated weights for policy 0, policy_version 7510 (0.0008) +[2023-10-08 15:59:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 15302656. Throughput: 0: 1737.3, 1: 1716.8. Samples: 3836248. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:59:58,803][19739] Avg episode reward: [(0, '74.540'), (1, '173.100')] +[2023-10-08 15:59:58,996][21195] Updated weights for policy 0, policy_version 7520 (0.0008) +[2023-10-08 16:00:02,360][21194] Updated weights for policy 1, policy_version 7460 (0.0009) +[2023-10-08 16:00:02,723][21194] Updated weights for policy 1, policy_version 7470 (0.0008) +[2023-10-08 16:00:03,086][21194] Updated weights for policy 1, policy_version 7480 (0.0010) +[2023-10-08 16:00:03,172][21195] Updated weights for policy 0, policy_version 7530 (0.0007) +[2023-10-08 16:00:03,538][21195] Updated weights for policy 0, policy_version 7540 (0.0008) +[2023-10-08 16:00:03,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 15368192. Throughput: 0: 1707.0, 1: 1729.5. Samples: 3850978. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 16:00:03,804][19739] Avg episode reward: [(0, '75.420'), (1, '182.060')] +[2023-10-08 16:00:03,805][20836] Saving new best policy, reward=182.060! +[2023-10-08 16:00:03,904][21195] Updated weights for policy 0, policy_version 7550 (0.0010) +[2023-10-08 16:00:07,182][21194] Updated weights for policy 1, policy_version 7490 (0.0007) +[2023-10-08 16:00:07,552][21194] Updated weights for policy 1, policy_version 7500 (0.0010) +[2023-10-08 16:00:07,845][21195] Updated weights for policy 0, policy_version 7560 (0.0009) +[2023-10-08 16:00:07,916][21194] Updated weights for policy 1, policy_version 7510 (0.0007) +[2023-10-08 16:00:08,203][21195] Updated weights for policy 0, policy_version 7570 (0.0009) +[2023-10-08 16:00:08,281][21194] Updated weights for policy 1, policy_version 7520 (0.0007) +[2023-10-08 16:00:08,581][21195] Updated weights for policy 0, policy_version 7580 (0.0008) +[2023-10-08 16:00:08,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 15466496. Throughput: 0: 1732.4, 1: 1729.2. Samples: 3867482. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:00:08,803][19739] Avg episode reward: [(0, '73.680'), (1, '190.460')] +[2023-10-08 16:00:08,805][20836] Saving new best policy, reward=190.460! +[2023-10-08 16:00:12,175][21194] Updated weights for policy 1, policy_version 7530 (0.0009) +[2023-10-08 16:00:12,552][21194] Updated weights for policy 1, policy_version 7540 (0.0008) +[2023-10-08 16:00:12,648][21195] Updated weights for policy 0, policy_version 7590 (0.0007) +[2023-10-08 16:00:12,918][21194] Updated weights for policy 1, policy_version 7550 (0.0007) +[2023-10-08 16:00:13,011][21195] Updated weights for policy 0, policy_version 7600 (0.0007) +[2023-10-08 16:00:13,387][21195] Updated weights for policy 0, policy_version 7610 (0.0008) +[2023-10-08 16:00:13,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 15532032. Throughput: 0: 1721.3, 1: 1694.4. Samples: 3887072. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:00:13,804][19739] Avg episode reward: [(0, '74.660'), (1, '194.600')] +[2023-10-08 16:00:13,813][20836] Saving new best policy, reward=194.600! +[2023-10-08 16:00:16,868][21194] Updated weights for policy 1, policy_version 7560 (0.0009) +[2023-10-08 16:00:17,221][21195] Updated weights for policy 0, policy_version 7620 (0.0008) +[2023-10-08 16:00:17,249][21194] Updated weights for policy 1, policy_version 7570 (0.0009) +[2023-10-08 16:00:17,595][21195] Updated weights for policy 0, policy_version 7630 (0.0007) +[2023-10-08 16:00:17,611][21194] Updated weights for policy 1, policy_version 7580 (0.0007) +[2023-10-08 16:00:17,971][21195] Updated weights for policy 0, policy_version 7640 (0.0007) +[2023-10-08 16:00:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 15597568. Throughput: 0: 1697.6, 1: 1721.4. Samples: 3902526. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:00:18,803][19739] Avg episode reward: [(0, '74.660'), (1, '194.600')] +[2023-10-08 16:00:21,664][21194] Updated weights for policy 1, policy_version 7590 (0.0008) +[2023-10-08 16:00:21,914][21195] Updated weights for policy 0, policy_version 7650 (0.0011) +[2023-10-08 16:00:22,030][21194] Updated weights for policy 1, policy_version 7600 (0.0008) +[2023-10-08 16:00:22,287][21195] Updated weights for policy 0, policy_version 7660 (0.0009) +[2023-10-08 16:00:22,409][21194] Updated weights for policy 1, policy_version 7610 (0.0008) +[2023-10-08 16:00:22,658][21195] Updated weights for policy 0, policy_version 7670 (0.0009) +[2023-10-08 16:00:23,039][21195] Updated weights for policy 0, policy_version 7680 (0.0007) +[2023-10-08 16:00:23,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 15663104. Throughput: 0: 1730.9, 1: 1703.3. Samples: 3918644. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:00:23,803][19739] Avg episode reward: [(0, '74.660'), (1, '194.600')] +[2023-10-08 16:00:26,406][21194] Updated weights for policy 1, policy_version 7620 (0.0008) +[2023-10-08 16:00:26,774][21194] Updated weights for policy 1, policy_version 7630 (0.0007) +[2023-10-08 16:00:27,027][21195] Updated weights for policy 0, policy_version 7690 (0.0007) +[2023-10-08 16:00:27,140][21194] Updated weights for policy 1, policy_version 7640 (0.0009) +[2023-10-08 16:00:27,401][21195] Updated weights for policy 0, policy_version 7700 (0.0009) +[2023-10-08 16:00:27,775][21195] Updated weights for policy 0, policy_version 7710 (0.0011) +[2023-10-08 16:00:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 15728640. Throughput: 0: 1701.6, 1: 1686.7. Samples: 3937692. Policy #0 lag: (min: 14.0, avg: 16.9, max: 46.0) +[2023-10-08 16:00:28,803][19739] Avg episode reward: [(0, '79.950'), (1, '201.270')] +[2023-10-08 16:00:28,811][20740] Saving new best policy, reward=79.950! +[2023-10-08 16:00:28,811][20836] Saving new best policy, reward=201.270! +[2023-10-08 16:00:31,054][21194] Updated weights for policy 1, policy_version 7650 (0.0008) +[2023-10-08 16:00:31,428][21194] Updated weights for policy 1, policy_version 7660 (0.0009) +[2023-10-08 16:00:31,686][21195] Updated weights for policy 0, policy_version 7720 (0.0008) +[2023-10-08 16:00:31,803][21194] Updated weights for policy 1, policy_version 7670 (0.0010) +[2023-10-08 16:00:32,051][21195] Updated weights for policy 0, policy_version 7730 (0.0007) +[2023-10-08 16:00:32,161][21194] Updated weights for policy 1, policy_version 7680 (0.0008) +[2023-10-08 16:00:32,430][21195] Updated weights for policy 0, policy_version 7740 (0.0007) +[2023-10-08 16:00:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 15794176. Throughput: 0: 1714.4, 1: 1709.4. Samples: 3954266. Policy #0 lag: (min: 14.0, avg: 16.9, max: 46.0) +[2023-10-08 16:00:33,803][19739] Avg episode reward: [(0, '83.080'), (1, '201.270')] +[2023-10-08 16:00:33,804][20740] Saving new best policy, reward=83.080! +[2023-10-08 16:00:36,189][21194] Updated weights for policy 1, policy_version 7690 (0.0007) +[2023-10-08 16:00:36,416][21195] Updated weights for policy 0, policy_version 7750 (0.0009) +[2023-10-08 16:00:36,557][21194] Updated weights for policy 1, policy_version 7700 (0.0007) +[2023-10-08 16:00:36,790][21195] Updated weights for policy 0, policy_version 7760 (0.0009) +[2023-10-08 16:00:36,924][21194] Updated weights for policy 1, policy_version 7710 (0.0007) +[2023-10-08 16:00:37,159][21195] Updated weights for policy 0, policy_version 7770 (0.0008) +[2023-10-08 16:00:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 15859712. Throughput: 0: 1717.5, 1: 1686.1. Samples: 3968786. Policy #0 lag: (min: 31.0, avg: 33.2, max: 63.0) +[2023-10-08 16:00:38,803][19739] Avg episode reward: [(0, '85.720'), (1, '201.270')] +[2023-10-08 16:00:38,804][20740] Saving new best policy, reward=85.720! +[2023-10-08 16:00:40,831][21194] Updated weights for policy 1, policy_version 7720 (0.0009) +[2023-10-08 16:00:41,112][21195] Updated weights for policy 0, policy_version 7780 (0.0008) +[2023-10-08 16:00:41,189][21194] Updated weights for policy 1, policy_version 7730 (0.0010) +[2023-10-08 16:00:41,481][21195] Updated weights for policy 0, policy_version 7790 (0.0009) +[2023-10-08 16:00:41,555][21194] Updated weights for policy 1, policy_version 7740 (0.0008) +[2023-10-08 16:00:41,853][21195] Updated weights for policy 0, policy_version 7800 (0.0007) +[2023-10-08 16:00:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 15925248. Throughput: 0: 1694.5, 1: 1709.4. Samples: 3989426. Policy #0 lag: (min: 31.0, avg: 33.2, max: 63.0) +[2023-10-08 16:00:43,803][19739] Avg episode reward: [(0, '85.720'), (1, '199.360')] +[2023-10-08 16:00:45,335][21194] Updated weights for policy 1, policy_version 7750 (0.0007) +[2023-10-08 16:00:45,702][21194] Updated weights for policy 1, policy_version 7760 (0.0007) +[2023-10-08 16:00:45,804][21195] Updated weights for policy 0, policy_version 7810 (0.0008) +[2023-10-08 16:00:46,065][21194] Updated weights for policy 1, policy_version 7770 (0.0007) +[2023-10-08 16:00:46,168][21195] Updated weights for policy 0, policy_version 7820 (0.0008) +[2023-10-08 16:00:46,538][21195] Updated weights for policy 0, policy_version 7830 (0.0009) +[2023-10-08 16:00:46,914][21195] Updated weights for policy 0, policy_version 7840 (0.0009) +[2023-10-08 16:00:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 15990784. Throughput: 0: 1718.7, 1: 1705.3. Samples: 4005058. Policy #0 lag: (min: 23.0, avg: 28.6, max: 55.0) +[2023-10-08 16:00:48,803][19739] Avg episode reward: [(0, '93.660'), (1, '199.360')] +[2023-10-08 16:00:48,804][20740] Saving new best policy, reward=93.660! +[2023-10-08 16:00:50,226][21194] Updated weights for policy 1, policy_version 7780 (0.0007) +[2023-10-08 16:00:50,593][21194] Updated weights for policy 1, policy_version 7790 (0.0007) +[2023-10-08 16:00:50,893][21195] Updated weights for policy 0, policy_version 7850 (0.0008) +[2023-10-08 16:00:50,959][21194] Updated weights for policy 1, policy_version 7800 (0.0008) +[2023-10-08 16:00:51,270][21195] Updated weights for policy 0, policy_version 7860 (0.0009) +[2023-10-08 16:00:51,645][21195] Updated weights for policy 0, policy_version 7870 (0.0010) +[2023-10-08 16:00:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 16056320. Throughput: 0: 1692.3, 1: 1694.3. Samples: 4019878. Policy #0 lag: (min: 23.0, avg: 28.6, max: 55.0) +[2023-10-08 16:00:53,804][19739] Avg episode reward: [(0, '95.170'), (1, '200.320')] +[2023-10-08 16:00:53,805][20740] Saving new best policy, reward=95.170! +[2023-10-08 16:00:54,985][21194] Updated weights for policy 1, policy_version 7810 (0.0008) +[2023-10-08 16:00:55,353][21194] Updated weights for policy 1, policy_version 7820 (0.0010) +[2023-10-08 16:00:55,660][21195] Updated weights for policy 0, policy_version 7880 (0.0008) +[2023-10-08 16:00:55,716][21194] Updated weights for policy 1, policy_version 7830 (0.0008) +[2023-10-08 16:00:56,021][21195] Updated weights for policy 0, policy_version 7890 (0.0007) +[2023-10-08 16:00:56,083][21194] Updated weights for policy 1, policy_version 7840 (0.0008) +[2023-10-08 16:00:56,396][21195] Updated weights for policy 0, policy_version 7900 (0.0007) +[2023-10-08 16:00:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 16121856. Throughput: 0: 1699.7, 1: 1722.2. Samples: 4041058. Policy #0 lag: (min: 31.0, avg: 32.2, max: 55.0) +[2023-10-08 16:00:58,803][19739] Avg episode reward: [(0, '111.820'), (1, '202.010')] +[2023-10-08 16:00:58,810][20740] Saving new best policy, reward=111.820! +[2023-10-08 16:00:58,810][20836] Saving new best policy, reward=202.010! +[2023-10-08 16:01:00,105][21194] Updated weights for policy 1, policy_version 7850 (0.0007) +[2023-10-08 16:01:00,312][21195] Updated weights for policy 0, policy_version 7910 (0.0007) +[2023-10-08 16:01:00,471][21194] Updated weights for policy 1, policy_version 7860 (0.0008) +[2023-10-08 16:01:00,694][21195] Updated weights for policy 0, policy_version 7920 (0.0008) +[2023-10-08 16:01:00,840][21194] Updated weights for policy 1, policy_version 7870 (0.0009) +[2023-10-08 16:01:01,061][21195] Updated weights for policy 0, policy_version 7930 (0.0009) +[2023-10-08 16:01:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 16187392. Throughput: 0: 1727.5, 1: 1696.0. Samples: 4056584. Policy #0 lag: (min: 31.0, avg: 32.2, max: 55.0) +[2023-10-08 16:01:03,804][19739] Avg episode reward: [(0, '107.870'), (1, '202.010')] +[2023-10-08 16:01:04,903][21194] Updated weights for policy 1, policy_version 7880 (0.0009) +[2023-10-08 16:01:05,004][21195] Updated weights for policy 0, policy_version 7940 (0.0007) +[2023-10-08 16:01:05,272][21194] Updated weights for policy 1, policy_version 7890 (0.0007) +[2023-10-08 16:01:05,372][21195] Updated weights for policy 0, policy_version 7950 (0.0008) +[2023-10-08 16:01:05,642][21194] Updated weights for policy 1, policy_version 7900 (0.0008) +[2023-10-08 16:01:05,737][21195] Updated weights for policy 0, policy_version 7960 (0.0007) +[2023-10-08 16:01:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 16252928. Throughput: 0: 1699.6, 1: 1708.4. Samples: 4072000. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 16:01:08,803][19739] Avg episode reward: [(0, '107.870'), (1, '202.010')] +[2023-10-08 16:01:09,552][21195] Updated weights for policy 0, policy_version 7970 (0.0009) +[2023-10-08 16:01:09,603][21194] Updated weights for policy 1, policy_version 7910 (0.0007) +[2023-10-08 16:01:09,918][21195] Updated weights for policy 0, policy_version 7980 (0.0007) +[2023-10-08 16:01:09,970][21194] Updated weights for policy 1, policy_version 7920 (0.0007) +[2023-10-08 16:01:10,288][21195] Updated weights for policy 0, policy_version 7990 (0.0007) +[2023-10-08 16:01:10,334][21194] Updated weights for policy 1, policy_version 7930 (0.0008) +[2023-10-08 16:01:10,659][21195] Updated weights for policy 0, policy_version 8000 (0.0007) +[2023-10-08 16:01:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 16318464. Throughput: 0: 1731.3, 1: 1724.3. Samples: 4093192. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 16:01:13,804][19739] Avg episode reward: [(0, '108.670'), (1, '206.680')] +[2023-10-08 16:01:13,815][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000007936_8126464.pth... +[2023-10-08 16:01:13,816][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000008000_8192000.pth... +[2023-10-08 16:01:13,848][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000006400_6553600.pth +[2023-10-08 16:01:13,852][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000008000_8192000.pth +[2023-10-08 16:01:13,856][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000006336_6488064.pth +[2023-10-08 16:01:13,860][20836] Saving new best policy, reward=206.680! +[2023-10-08 16:01:13,893][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000007936_8126464.pth +[2023-10-08 16:01:14,286][21194] Updated weights for policy 1, policy_version 7940 (0.0008) +[2023-10-08 16:01:14,648][21195] Updated weights for policy 0, policy_version 8010 (0.0007) +[2023-10-08 16:01:14,654][21194] Updated weights for policy 1, policy_version 7950 (0.0008) +[2023-10-08 16:01:15,018][21195] Updated weights for policy 0, policy_version 8020 (0.0007) +[2023-10-08 16:01:15,030][21194] Updated weights for policy 1, policy_version 7960 (0.0007) +[2023-10-08 16:01:15,397][21195] Updated weights for policy 0, policy_version 8030 (0.0009) +[2023-10-08 16:01:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 16384000. Throughput: 0: 1739.2, 1: 1695.7. Samples: 4108836. Policy #0 lag: (min: 27.0, avg: 40.6, max: 59.0) +[2023-10-08 16:01:18,803][19739] Avg episode reward: [(0, '119.920'), (1, '208.710')] +[2023-10-08 16:01:18,804][20740] Saving new best policy, reward=119.920! +[2023-10-08 16:01:18,804][20836] Saving new best policy, reward=208.710! +[2023-10-08 16:01:19,057][21194] Updated weights for policy 1, policy_version 7970 (0.0007) +[2023-10-08 16:01:19,269][21195] Updated weights for policy 0, policy_version 8040 (0.0008) +[2023-10-08 16:01:19,427][21194] Updated weights for policy 1, policy_version 7980 (0.0008) +[2023-10-08 16:01:19,636][21195] Updated weights for policy 0, policy_version 8050 (0.0007) +[2023-10-08 16:01:19,797][21194] Updated weights for policy 1, policy_version 7990 (0.0008) +[2023-10-08 16:01:20,014][21195] Updated weights for policy 0, policy_version 8060 (0.0007) +[2023-10-08 16:01:20,163][21194] Updated weights for policy 1, policy_version 8000 (0.0008) +[2023-10-08 16:01:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 16449536. Throughput: 0: 1726.4, 1: 1721.0. Samples: 4123918. Policy #0 lag: (min: 27.0, avg: 40.6, max: 59.0) +[2023-10-08 16:01:23,803][19739] Avg episode reward: [(0, '127.210'), (1, '208.710')] +[2023-10-08 16:01:23,911][21195] Updated weights for policy 0, policy_version 8070 (0.0007) +[2023-10-08 16:01:23,996][21194] Updated weights for policy 1, policy_version 8010 (0.0008) +[2023-10-08 16:01:24,294][21195] Updated weights for policy 0, policy_version 8080 (0.0008) +[2023-10-08 16:01:24,368][21194] Updated weights for policy 1, policy_version 8020 (0.0008) +[2023-10-08 16:01:24,676][21195] Updated weights for policy 0, policy_version 8090 (0.0007) +[2023-10-08 16:01:24,736][21194] Updated weights for policy 1, policy_version 8030 (0.0008) +[2023-10-08 16:01:24,896][20740] Saving new best policy, reward=127.210! +[2023-10-08 16:01:28,386][21195] Updated weights for policy 0, policy_version 8100 (0.0008) +[2023-10-08 16:01:28,699][21194] Updated weights for policy 1, policy_version 8040 (0.0010) +[2023-10-08 16:01:28,758][21195] Updated weights for policy 0, policy_version 8110 (0.0007) +[2023-10-08 16:01:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 16515072. Throughput: 0: 1744.7, 1: 1721.6. Samples: 4145412. Policy #0 lag: (min: 31.0, avg: 40.0, max: 63.0) +[2023-10-08 16:01:28,803][19739] Avg episode reward: [(0, '124.570'), (1, '211.080')] +[2023-10-08 16:01:29,067][21194] Updated weights for policy 1, policy_version 8050 (0.0008) +[2023-10-08 16:01:29,123][21195] Updated weights for policy 0, policy_version 8120 (0.0009) +[2023-10-08 16:01:29,433][21194] Updated weights for policy 1, policy_version 8060 (0.0007) +[2023-10-08 16:01:29,574][20836] Saving new best policy, reward=211.080! +[2023-10-08 16:01:33,029][21195] Updated weights for policy 0, policy_version 8130 (0.0007) +[2023-10-08 16:01:33,403][21195] Updated weights for policy 0, policy_version 8140 (0.0007) +[2023-10-08 16:01:33,407][21194] Updated weights for policy 1, policy_version 8070 (0.0008) +[2023-10-08 16:01:33,771][21195] Updated weights for policy 0, policy_version 8150 (0.0009) +[2023-10-08 16:01:33,780][21194] Updated weights for policy 1, policy_version 8080 (0.0009) +[2023-10-08 16:01:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 16580608. Throughput: 0: 1727.3, 1: 1708.4. Samples: 4159668. Policy #0 lag: (min: 31.0, avg: 40.0, max: 63.0) +[2023-10-08 16:01:33,803][19739] Avg episode reward: [(0, '137.660'), (1, '212.110')] +[2023-10-08 16:01:34,135][21194] Updated weights for policy 1, policy_version 8090 (0.0009) +[2023-10-08 16:01:34,146][21195] Updated weights for policy 0, policy_version 8160 (0.0008) +[2023-10-08 16:01:34,146][20740] Saving new best policy, reward=137.660! +[2023-10-08 16:01:34,357][20836] Saving new best policy, reward=212.110! +[2023-10-08 16:01:38,124][21195] Updated weights for policy 0, policy_version 8170 (0.0010) +[2023-10-08 16:01:38,318][21194] Updated weights for policy 1, policy_version 8100 (0.0008) +[2023-10-08 16:01:38,487][21195] Updated weights for policy 0, policy_version 8180 (0.0008) +[2023-10-08 16:01:38,678][21194] Updated weights for policy 1, policy_version 8110 (0.0007) +[2023-10-08 16:01:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 16646144. Throughput: 0: 1744.4, 1: 1716.7. Samples: 4175626. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:01:38,803][19739] Avg episode reward: [(0, '134.360'), (1, '212.110')] +[2023-10-08 16:01:38,862][21195] Updated weights for policy 0, policy_version 8190 (0.0009) +[2023-10-08 16:01:39,039][21194] Updated weights for policy 1, policy_version 8120 (0.0007) +[2023-10-08 16:01:42,868][21195] Updated weights for policy 0, policy_version 8200 (0.0008) +[2023-10-08 16:01:43,062][21194] Updated weights for policy 1, policy_version 8130 (0.0007) +[2023-10-08 16:01:43,247][21195] Updated weights for policy 0, policy_version 8210 (0.0010) +[2023-10-08 16:01:43,434][21194] Updated weights for policy 1, policy_version 8140 (0.0007) +[2023-10-08 16:01:43,617][21195] Updated weights for policy 0, policy_version 8220 (0.0009) +[2023-10-08 16:01:43,798][21194] Updated weights for policy 1, policy_version 8150 (0.0007) +[2023-10-08 16:01:43,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 16744448. Throughput: 0: 1742.1, 1: 1713.3. Samples: 4196550. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:01:43,803][19739] Avg episode reward: [(0, '135.190'), (1, '211.830')] +[2023-10-08 16:01:44,170][21194] Updated weights for policy 1, policy_version 8160 (0.0012) +[2023-10-08 16:01:47,661][21195] Updated weights for policy 0, policy_version 8230 (0.0010) +[2023-10-08 16:01:48,034][21195] Updated weights for policy 0, policy_version 8240 (0.0007) +[2023-10-08 16:01:48,147][21194] Updated weights for policy 1, policy_version 8170 (0.0009) +[2023-10-08 16:01:48,397][21195] Updated weights for policy 0, policy_version 8250 (0.0008) +[2023-10-08 16:01:48,520][21194] Updated weights for policy 1, policy_version 8180 (0.0007) +[2023-10-08 16:01:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 16809984. Throughput: 0: 1713.5, 1: 1712.5. Samples: 4210754. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:01:48,803][19739] Avg episode reward: [(0, '135.610'), (1, '212.060')] +[2023-10-08 16:01:48,886][21194] Updated weights for policy 1, policy_version 8190 (0.0008) +[2023-10-08 16:01:52,403][21195] Updated weights for policy 0, policy_version 8260 (0.0009) +[2023-10-08 16:01:52,698][21194] Updated weights for policy 1, policy_version 8200 (0.0008) +[2023-10-08 16:01:52,780][21195] Updated weights for policy 0, policy_version 8270 (0.0008) +[2023-10-08 16:01:53,062][21194] Updated weights for policy 1, policy_version 8210 (0.0007) +[2023-10-08 16:01:53,141][21195] Updated weights for policy 0, policy_version 8280 (0.0007) +[2023-10-08 16:01:53,423][21194] Updated weights for policy 1, policy_version 8220 (0.0007) +[2023-10-08 16:01:53,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 16908288. Throughput: 0: 1741.0, 1: 1714.7. Samples: 4227506. Policy #0 lag: (min: 9.0, avg: 37.2, max: 40.0) +[2023-10-08 16:01:53,804][19739] Avg episode reward: [(0, '138.260'), (1, '209.030')] +[2023-10-08 16:01:53,805][20740] Saving new best policy, reward=138.260! +[2023-10-08 16:01:57,082][21195] Updated weights for policy 0, policy_version 8290 (0.0007) +[2023-10-08 16:01:57,461][21195] Updated weights for policy 0, policy_version 8300 (0.0008) +[2023-10-08 16:01:57,514][21194] Updated weights for policy 1, policy_version 8230 (0.0010) +[2023-10-08 16:01:57,839][21195] Updated weights for policy 0, policy_version 8310 (0.0008) +[2023-10-08 16:01:57,880][21194] Updated weights for policy 1, policy_version 8240 (0.0008) +[2023-10-08 16:01:58,214][21195] Updated weights for policy 0, policy_version 8320 (0.0008) +[2023-10-08 16:01:58,242][21194] Updated weights for policy 1, policy_version 8250 (0.0009) +[2023-10-08 16:01:58,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 16973824. Throughput: 0: 1719.7, 1: 1699.7. Samples: 4247066. Policy #0 lag: (min: 9.0, avg: 37.2, max: 40.0) +[2023-10-08 16:01:58,803][19739] Avg episode reward: [(0, '141.070'), (1, '215.430')] +[2023-10-08 16:01:58,810][20740] Saving new best policy, reward=141.070! +[2023-10-08 16:01:58,810][20836] Saving new best policy, reward=215.430! +[2023-10-08 16:02:01,911][21195] Updated weights for policy 0, policy_version 8330 (0.0010) +[2023-10-08 16:02:02,229][21194] Updated weights for policy 1, policy_version 8260 (0.0011) +[2023-10-08 16:02:02,280][21195] Updated weights for policy 0, policy_version 8340 (0.0010) +[2023-10-08 16:02:02,605][21194] Updated weights for policy 1, policy_version 8270 (0.0007) +[2023-10-08 16:02:02,648][21195] Updated weights for policy 0, policy_version 8350 (0.0009) +[2023-10-08 16:02:02,973][21194] Updated weights for policy 1, policy_version 8280 (0.0008) +[2023-10-08 16:02:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 17039360. Throughput: 0: 1708.5, 1: 1711.9. Samples: 4262754. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:02:03,804][19739] Avg episode reward: [(0, '139.940'), (1, '214.310')] +[2023-10-08 16:02:06,675][21195] Updated weights for policy 0, policy_version 8360 (0.0009) +[2023-10-08 16:02:06,863][21194] Updated weights for policy 1, policy_version 8290 (0.0008) +[2023-10-08 16:02:07,038][21195] Updated weights for policy 0, policy_version 8370 (0.0007) +[2023-10-08 16:02:07,233][21194] Updated weights for policy 1, policy_version 8300 (0.0008) +[2023-10-08 16:02:07,407][21195] Updated weights for policy 0, policy_version 8380 (0.0007) +[2023-10-08 16:02:07,602][21194] Updated weights for policy 1, policy_version 8310 (0.0008) +[2023-10-08 16:02:07,965][21194] Updated weights for policy 1, policy_version 8320 (0.0009) +[2023-10-08 16:02:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17104896. Throughput: 0: 1727.6, 1: 1709.2. Samples: 4278574. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:02:08,803][19739] Avg episode reward: [(0, '144.480'), (1, '220.050')] +[2023-10-08 16:02:08,804][20740] Saving new best policy, reward=144.480! +[2023-10-08 16:02:08,804][20836] Saving new best policy, reward=220.050! +[2023-10-08 16:02:11,333][21195] Updated weights for policy 0, policy_version 8390 (0.0010) +[2023-10-08 16:02:11,704][21195] Updated weights for policy 0, policy_version 8400 (0.0009) +[2023-10-08 16:02:12,020][21194] Updated weights for policy 1, policy_version 8330 (0.0008) +[2023-10-08 16:02:12,071][21195] Updated weights for policy 0, policy_version 8410 (0.0007) +[2023-10-08 16:02:12,384][21194] Updated weights for policy 1, policy_version 8340 (0.0009) +[2023-10-08 16:02:12,743][21194] Updated weights for policy 1, policy_version 8350 (0.0009) +[2023-10-08 16:02:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17170432. Throughput: 0: 1710.8, 1: 1680.4. Samples: 4298016. Policy #0 lag: (min: 0.0, avg: 29.7, max: 32.0) +[2023-10-08 16:02:13,804][19739] Avg episode reward: [(0, '151.640'), (1, '219.710')] +[2023-10-08 16:02:13,811][20740] Saving new best policy, reward=151.640! +[2023-10-08 16:02:15,854][21195] Updated weights for policy 0, policy_version 8420 (0.0008) +[2023-10-08 16:02:16,232][21195] Updated weights for policy 0, policy_version 8430 (0.0007) +[2023-10-08 16:02:16,597][21195] Updated weights for policy 0, policy_version 8440 (0.0008) +[2023-10-08 16:02:16,928][21194] Updated weights for policy 1, policy_version 8360 (0.0008) +[2023-10-08 16:02:17,299][21194] Updated weights for policy 1, policy_version 8370 (0.0010) +[2023-10-08 16:02:17,667][21194] Updated weights for policy 1, policy_version 8380 (0.0009) +[2023-10-08 16:02:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17235968. Throughput: 0: 1739.1, 1: 1712.4. Samples: 4314986. Policy #0 lag: (min: 0.0, avg: 29.7, max: 32.0) +[2023-10-08 16:02:18,803][19739] Avg episode reward: [(0, '152.950'), (1, '219.710')] +[2023-10-08 16:02:18,804][20740] Saving new best policy, reward=152.950! +[2023-10-08 16:02:20,537][21195] Updated weights for policy 0, policy_version 8450 (0.0007) +[2023-10-08 16:02:20,910][21195] Updated weights for policy 0, policy_version 8460 (0.0008) +[2023-10-08 16:02:21,287][21195] Updated weights for policy 0, policy_version 8470 (0.0009) +[2023-10-08 16:02:21,379][21194] Updated weights for policy 1, policy_version 8390 (0.0008) +[2023-10-08 16:02:21,650][21195] Updated weights for policy 0, policy_version 8480 (0.0008) +[2023-10-08 16:02:21,745][21194] Updated weights for policy 1, policy_version 8400 (0.0008) +[2023-10-08 16:02:22,112][21194] Updated weights for policy 1, policy_version 8410 (0.0008) +[2023-10-08 16:02:23,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17301504. Throughput: 0: 1720.8, 1: 1697.4. Samples: 4329442. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:02:23,803][19739] Avg episode reward: [(0, '153.450'), (1, '219.710')] +[2023-10-08 16:02:23,804][20740] Saving new best policy, reward=153.450! +[2023-10-08 16:02:25,581][21195] Updated weights for policy 0, policy_version 8490 (0.0010) +[2023-10-08 16:02:25,955][21195] Updated weights for policy 0, policy_version 8500 (0.0010) +[2023-10-08 16:02:26,154][21194] Updated weights for policy 1, policy_version 8420 (0.0008) +[2023-10-08 16:02:26,327][21195] Updated weights for policy 0, policy_version 8510 (0.0008) +[2023-10-08 16:02:26,522][21194] Updated weights for policy 1, policy_version 8430 (0.0008) +[2023-10-08 16:02:26,897][21194] Updated weights for policy 1, policy_version 8440 (0.0009) +[2023-10-08 16:02:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17367040. Throughput: 0: 1723.8, 1: 1690.6. Samples: 4350200. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:02:28,803][19739] Avg episode reward: [(0, '152.370'), (1, '222.060')] +[2023-10-08 16:02:28,813][20836] Saving new best policy, reward=222.060! +[2023-10-08 16:02:30,128][21195] Updated weights for policy 0, policy_version 8520 (0.0008) +[2023-10-08 16:02:30,496][21195] Updated weights for policy 0, policy_version 8530 (0.0008) +[2023-10-08 16:02:30,860][21195] Updated weights for policy 0, policy_version 8540 (0.0007) +[2023-10-08 16:02:31,005][21194] Updated weights for policy 1, policy_version 8450 (0.0008) +[2023-10-08 16:02:31,368][21194] Updated weights for policy 1, policy_version 8460 (0.0009) +[2023-10-08 16:02:31,742][21194] Updated weights for policy 1, policy_version 8470 (0.0010) +[2023-10-08 16:02:32,107][21194] Updated weights for policy 1, policy_version 8480 (0.0009) +[2023-10-08 16:02:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17432576. Throughput: 0: 1752.6, 1: 1714.6. Samples: 4366780. Policy #0 lag: (min: 6.0, avg: 6.6, max: 22.0) +[2023-10-08 16:02:33,803][19739] Avg episode reward: [(0, '152.370'), (1, '222.060')] +[2023-10-08 16:02:34,680][21195] Updated weights for policy 0, policy_version 8550 (0.0009) +[2023-10-08 16:02:35,051][21195] Updated weights for policy 0, policy_version 8560 (0.0008) +[2023-10-08 16:02:35,430][21195] Updated weights for policy 0, policy_version 8570 (0.0008) +[2023-10-08 16:02:36,085][21194] Updated weights for policy 1, policy_version 8490 (0.0008) +[2023-10-08 16:02:36,457][21194] Updated weights for policy 1, policy_version 8500 (0.0008) +[2023-10-08 16:02:36,835][21194] Updated weights for policy 1, policy_version 8510 (0.0009) +[2023-10-08 16:02:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 17498112. Throughput: 0: 1725.3, 1: 1685.4. Samples: 4380986. Policy #0 lag: (min: 6.0, avg: 6.6, max: 22.0) +[2023-10-08 16:02:38,803][19739] Avg episode reward: [(0, '152.090'), (1, '233.550')] +[2023-10-08 16:02:38,804][20836] Saving new best policy, reward=233.550! +[2023-10-08 16:02:39,363][21195] Updated weights for policy 0, policy_version 8580 (0.0008) +[2023-10-08 16:02:39,741][21195] Updated weights for policy 0, policy_version 8590 (0.0009) +[2023-10-08 16:02:40,121][21195] Updated weights for policy 0, policy_version 8600 (0.0008) +[2023-10-08 16:02:40,724][21194] Updated weights for policy 1, policy_version 8520 (0.0009) +[2023-10-08 16:02:41,099][21194] Updated weights for policy 1, policy_version 8530 (0.0010) +[2023-10-08 16:02:41,468][21194] Updated weights for policy 1, policy_version 8540 (0.0010) +[2023-10-08 16:02:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.2, 300 sec: 13773.6). Total num frames: 17563648. Throughput: 0: 1745.5, 1: 1704.5. Samples: 4402314. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:02:43,804][19739] Avg episode reward: [(0, '152.090'), (1, '233.550')] +[2023-10-08 16:02:43,855][21195] Updated weights for policy 0, policy_version 8610 (0.0007) +[2023-10-08 16:02:44,218][21195] Updated weights for policy 0, policy_version 8620 (0.0008) +[2023-10-08 16:02:44,594][21195] Updated weights for policy 0, policy_version 8630 (0.0008) +[2023-10-08 16:02:44,957][21195] Updated weights for policy 0, policy_version 8640 (0.0008) +[2023-10-08 16:02:45,395][21194] Updated weights for policy 1, policy_version 8550 (0.0012) +[2023-10-08 16:02:45,753][21194] Updated weights for policy 1, policy_version 8560 (0.0009) +[2023-10-08 16:02:46,119][21194] Updated weights for policy 1, policy_version 8570 (0.0007) +[2023-10-08 16:02:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 17629184. Throughput: 0: 1748.4, 1: 1700.9. Samples: 4417974. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:02:48,803][19739] Avg episode reward: [(0, '152.500'), (1, '237.780')] +[2023-10-08 16:02:48,804][20836] Saving new best policy, reward=237.780! +[2023-10-08 16:02:48,980][21195] Updated weights for policy 0, policy_version 8650 (0.0007) +[2023-10-08 16:02:49,355][21195] Updated weights for policy 0, policy_version 8660 (0.0007) +[2023-10-08 16:02:49,728][21195] Updated weights for policy 0, policy_version 8670 (0.0009) +[2023-10-08 16:02:50,194][21194] Updated weights for policy 1, policy_version 8580 (0.0009) +[2023-10-08 16:02:50,567][21194] Updated weights for policy 1, policy_version 8590 (0.0009) +[2023-10-08 16:02:50,942][21194] Updated weights for policy 1, policy_version 8600 (0.0009) +[2023-10-08 16:02:53,704][21195] Updated weights for policy 0, policy_version 8680 (0.0009) +[2023-10-08 16:02:53,802][19739] Fps is (10 sec: 13107.7, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 17694720. Throughput: 0: 1734.7, 1: 1696.9. Samples: 4432996. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:02:53,803][19739] Avg episode reward: [(0, '152.500'), (1, '231.480')] +[2023-10-08 16:02:54,069][21195] Updated weights for policy 0, policy_version 8690 (0.0007) +[2023-10-08 16:02:54,444][21195] Updated weights for policy 0, policy_version 8700 (0.0008) +[2023-10-08 16:02:54,924][21194] Updated weights for policy 1, policy_version 8610 (0.0009) +[2023-10-08 16:02:55,292][21194] Updated weights for policy 1, policy_version 8620 (0.0009) +[2023-10-08 16:02:55,664][21194] Updated weights for policy 1, policy_version 8630 (0.0007) +[2023-10-08 16:02:56,025][21194] Updated weights for policy 1, policy_version 8640 (0.0007) +[2023-10-08 16:02:58,566][21195] Updated weights for policy 0, policy_version 8710 (0.0009) +[2023-10-08 16:02:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 17760256. Throughput: 0: 1753.7, 1: 1726.8. Samples: 4454638. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:02:58,804][19739] Avg episode reward: [(0, '155.870'), (1, '230.730')] +[2023-10-08 16:02:58,951][21195] Updated weights for policy 0, policy_version 8720 (0.0008) +[2023-10-08 16:02:59,335][21195] Updated weights for policy 0, policy_version 8730 (0.0009) +[2023-10-08 16:02:59,556][20740] Saving new best policy, reward=155.870! +[2023-10-08 16:02:59,945][21194] Updated weights for policy 1, policy_version 8650 (0.0010) +[2023-10-08 16:03:00,311][21194] Updated weights for policy 1, policy_version 8660 (0.0011) +[2023-10-08 16:03:00,688][21194] Updated weights for policy 1, policy_version 8670 (0.0011) +[2023-10-08 16:03:03,211][21195] Updated weights for policy 0, policy_version 8740 (0.0007) +[2023-10-08 16:03:03,569][21195] Updated weights for policy 0, policy_version 8750 (0.0008) +[2023-10-08 16:03:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 17825792. Throughput: 0: 1727.1, 1: 1700.3. Samples: 4469218. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:03:03,803][19739] Avg episode reward: [(0, '155.870'), (1, '221.650')] +[2023-10-08 16:03:03,939][21195] Updated weights for policy 0, policy_version 8760 (0.0008) +[2023-10-08 16:03:04,664][21194] Updated weights for policy 1, policy_version 8680 (0.0010) +[2023-10-08 16:03:05,042][21194] Updated weights for policy 1, policy_version 8690 (0.0009) +[2023-10-08 16:03:05,408][21194] Updated weights for policy 1, policy_version 8700 (0.0009) +[2023-10-08 16:03:07,898][21195] Updated weights for policy 0, policy_version 8770 (0.0007) +[2023-10-08 16:03:08,266][21195] Updated weights for policy 0, policy_version 8780 (0.0011) +[2023-10-08 16:03:08,646][21195] Updated weights for policy 0, policy_version 8790 (0.0007) +[2023-10-08 16:03:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 17891328. Throughput: 0: 1746.1, 1: 1715.5. Samples: 4485214. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:03:08,803][19739] Avg episode reward: [(0, '155.620'), (1, '231.520')] +[2023-10-08 16:03:09,012][21195] Updated weights for policy 0, policy_version 8800 (0.0009) +[2023-10-08 16:03:09,308][21194] Updated weights for policy 1, policy_version 8710 (0.0011) +[2023-10-08 16:03:09,671][21194] Updated weights for policy 1, policy_version 8720 (0.0009) +[2023-10-08 16:03:10,036][21194] Updated weights for policy 1, policy_version 8730 (0.0007) +[2023-10-08 16:03:12,902][21195] Updated weights for policy 0, policy_version 8810 (0.0008) +[2023-10-08 16:03:13,266][21195] Updated weights for policy 0, policy_version 8820 (0.0007) +[2023-10-08 16:03:13,633][21195] Updated weights for policy 0, policy_version 8830 (0.0008) +[2023-10-08 16:03:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 17989632. Throughput: 0: 1744.3, 1: 1731.1. Samples: 4506592. Policy #0 lag: (min: 10.0, avg: 17.9, max: 42.0) +[2023-10-08 16:03:13,804][19739] Avg episode reward: [(0, '155.620'), (1, '219.790')] +[2023-10-08 16:03:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000008832_9043968.pth... +[2023-10-08 16:03:13,857][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000007200_7372800.pth +[2023-10-08 16:03:13,877][21194] Updated weights for policy 1, policy_version 8740 (0.0008) +[2023-10-08 16:03:14,240][21194] Updated weights for policy 1, policy_version 8750 (0.0010) +[2023-10-08 16:03:14,606][21194] Updated weights for policy 1, policy_version 8760 (0.0010) +[2023-10-08 16:03:14,897][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000008768_8978432.pth... +[2023-10-08 16:03:14,934][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000007136_7307264.pth +[2023-10-08 16:03:17,570][21195] Updated weights for policy 0, policy_version 8840 (0.0008) +[2023-10-08 16:03:17,948][21195] Updated weights for policy 0, policy_version 8850 (0.0009) +[2023-10-08 16:03:18,315][21195] Updated weights for policy 0, policy_version 8860 (0.0008) +[2023-10-08 16:03:18,616][21194] Updated weights for policy 1, policy_version 8770 (0.0009) +[2023-10-08 16:03:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 18055168. Throughput: 0: 1719.7, 1: 1708.5. Samples: 4521050. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 16:03:18,803][19739] Avg episode reward: [(0, '158.590'), (1, '222.300')] +[2023-10-08 16:03:18,804][20740] Saving new best policy, reward=158.590! +[2023-10-08 16:03:18,979][21194] Updated weights for policy 1, policy_version 8780 (0.0008) +[2023-10-08 16:03:19,347][21194] Updated weights for policy 1, policy_version 8790 (0.0007) +[2023-10-08 16:03:19,709][21194] Updated weights for policy 1, policy_version 8800 (0.0009) +[2023-10-08 16:03:22,157][21195] Updated weights for policy 0, policy_version 8870 (0.0008) +[2023-10-08 16:03:22,530][21195] Updated weights for policy 0, policy_version 8880 (0.0010) +[2023-10-08 16:03:22,897][21195] Updated weights for policy 0, policy_version 8890 (0.0009) +[2023-10-08 16:03:23,530][21194] Updated weights for policy 1, policy_version 8810 (0.0009) +[2023-10-08 16:03:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 18120704. Throughput: 0: 1745.2, 1: 1738.0. Samples: 4537734. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 16:03:23,803][19739] Avg episode reward: [(0, '158.240'), (1, '232.360')] +[2023-10-08 16:03:23,897][21194] Updated weights for policy 1, policy_version 8820 (0.0007) +[2023-10-08 16:03:24,272][21194] Updated weights for policy 1, policy_version 8830 (0.0008) +[2023-10-08 16:03:26,594][21195] Updated weights for policy 0, policy_version 8900 (0.0009) +[2023-10-08 16:03:26,961][21195] Updated weights for policy 0, policy_version 8910 (0.0009) +[2023-10-08 16:03:27,335][21195] Updated weights for policy 0, policy_version 8920 (0.0011) +[2023-10-08 16:03:28,240][21194] Updated weights for policy 1, policy_version 8840 (0.0008) +[2023-10-08 16:03:28,609][21194] Updated weights for policy 1, policy_version 8850 (0.0007) +[2023-10-08 16:03:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 18186240. Throughput: 0: 1717.6, 1: 1736.2. Samples: 4557736. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:03:28,804][19739] Avg episode reward: [(0, '159.440'), (1, '233.480')] +[2023-10-08 16:03:28,811][20740] Saving new best policy, reward=159.440! +[2023-10-08 16:03:28,986][21194] Updated weights for policy 1, policy_version 8860 (0.0009) +[2023-10-08 16:03:31,249][21195] Updated weights for policy 0, policy_version 8930 (0.0009) +[2023-10-08 16:03:31,620][21195] Updated weights for policy 0, policy_version 8940 (0.0010) +[2023-10-08 16:03:31,993][21195] Updated weights for policy 0, policy_version 8950 (0.0008) +[2023-10-08 16:03:32,363][21195] Updated weights for policy 0, policy_version 8960 (0.0009) +[2023-10-08 16:03:32,893][21194] Updated weights for policy 1, policy_version 8870 (0.0008) +[2023-10-08 16:03:33,263][21194] Updated weights for policy 1, policy_version 8880 (0.0009) +[2023-10-08 16:03:33,633][21194] Updated weights for policy 1, policy_version 8890 (0.0007) +[2023-10-08 16:03:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 18251776. Throughput: 0: 1724.9, 1: 1727.9. Samples: 4573350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:03:33,803][19739] Avg episode reward: [(0, '163.030'), (1, '233.480')] +[2023-10-08 16:03:33,804][20740] Saving new best policy, reward=163.030! +[2023-10-08 16:03:36,330][21195] Updated weights for policy 0, policy_version 8970 (0.0007) +[2023-10-08 16:03:36,715][21195] Updated weights for policy 0, policy_version 8980 (0.0007) +[2023-10-08 16:03:37,083][21195] Updated weights for policy 0, policy_version 8990 (0.0007) +[2023-10-08 16:03:37,560][21194] Updated weights for policy 1, policy_version 8900 (0.0009) +[2023-10-08 16:03:37,928][21194] Updated weights for policy 1, policy_version 8910 (0.0009) +[2023-10-08 16:03:38,287][21194] Updated weights for policy 1, policy_version 8920 (0.0008) +[2023-10-08 16:03:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18350080. Throughput: 0: 1730.1, 1: 1747.2. Samples: 4589476. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 16:03:38,803][19739] Avg episode reward: [(0, '156.860'), (1, '238.970')] +[2023-10-08 16:03:38,804][20836] Saving new best policy, reward=238.970! +[2023-10-08 16:03:41,005][21195] Updated weights for policy 0, policy_version 9000 (0.0008) +[2023-10-08 16:03:41,375][21195] Updated weights for policy 0, policy_version 9010 (0.0011) +[2023-10-08 16:03:41,753][21195] Updated weights for policy 0, policy_version 9020 (0.0011) +[2023-10-08 16:03:42,371][21194] Updated weights for policy 1, policy_version 8930 (0.0009) +[2023-10-08 16:03:42,737][21194] Updated weights for policy 1, policy_version 8940 (0.0007) +[2023-10-08 16:03:43,113][21194] Updated weights for policy 1, policy_version 8950 (0.0008) +[2023-10-08 16:03:43,488][21194] Updated weights for policy 1, policy_version 8960 (0.0008) +[2023-10-08 16:03:43,803][19739] Fps is (10 sec: 16383.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18415616. Throughput: 0: 1717.2, 1: 1725.2. Samples: 4609546. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 16:03:43,804][19739] Avg episode reward: [(0, '153.780'), (1, '238.970')] +[2023-10-08 16:03:45,755][21195] Updated weights for policy 0, policy_version 9030 (0.0007) +[2023-10-08 16:03:46,126][21195] Updated weights for policy 0, policy_version 9040 (0.0008) +[2023-10-08 16:03:46,497][21195] Updated weights for policy 0, policy_version 9050 (0.0011) +[2023-10-08 16:03:47,410][21194] Updated weights for policy 1, policy_version 8970 (0.0008) +[2023-10-08 16:03:47,783][21194] Updated weights for policy 1, policy_version 8980 (0.0009) +[2023-10-08 16:03:48,145][21194] Updated weights for policy 1, policy_version 8990 (0.0010) +[2023-10-08 16:03:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18481152. Throughput: 0: 1734.8, 1: 1741.5. Samples: 4625652. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 16:03:48,803][19739] Avg episode reward: [(0, '153.780'), (1, '246.140')] +[2023-10-08 16:03:48,804][20836] Saving new best policy, reward=246.140! +[2023-10-08 16:03:50,454][21195] Updated weights for policy 0, policy_version 9060 (0.0008) +[2023-10-08 16:03:50,834][21195] Updated weights for policy 0, policy_version 9070 (0.0008) +[2023-10-08 16:03:51,212][21195] Updated weights for policy 0, policy_version 9080 (0.0008) +[2023-10-08 16:03:52,024][21194] Updated weights for policy 1, policy_version 9000 (0.0007) +[2023-10-08 16:03:52,391][21194] Updated weights for policy 1, policy_version 9010 (0.0007) +[2023-10-08 16:03:52,762][21194] Updated weights for policy 1, policy_version 9020 (0.0008) +[2023-10-08 16:03:53,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18546688. Throughput: 0: 1712.3, 1: 1738.7. Samples: 4640508. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 16:03:53,803][19739] Avg episode reward: [(0, '144.510'), (1, '246.140')] +[2023-10-08 16:03:55,257][21195] Updated weights for policy 0, policy_version 9090 (0.0009) +[2023-10-08 16:03:55,632][21195] Updated weights for policy 0, policy_version 9100 (0.0008) +[2023-10-08 16:03:56,001][21195] Updated weights for policy 0, policy_version 9110 (0.0007) +[2023-10-08 16:03:56,369][21195] Updated weights for policy 0, policy_version 9120 (0.0007) +[2023-10-08 16:03:56,696][21194] Updated weights for policy 1, policy_version 9030 (0.0007) +[2023-10-08 16:03:57,063][21194] Updated weights for policy 1, policy_version 9040 (0.0008) +[2023-10-08 16:03:57,432][21194] Updated weights for policy 1, policy_version 9050 (0.0008) +[2023-10-08 16:03:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18612224. Throughput: 0: 1721.1, 1: 1713.9. Samples: 4661166. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:03:58,803][19739] Avg episode reward: [(0, '145.560'), (1, '246.140')] +[2023-10-08 16:04:00,155][21195] Updated weights for policy 0, policy_version 9130 (0.0010) +[2023-10-08 16:04:00,538][21195] Updated weights for policy 0, policy_version 9140 (0.0010) +[2023-10-08 16:04:00,912][21195] Updated weights for policy 0, policy_version 9150 (0.0009) +[2023-10-08 16:04:01,502][21194] Updated weights for policy 1, policy_version 9060 (0.0009) +[2023-10-08 16:04:01,859][21194] Updated weights for policy 1, policy_version 9070 (0.0008) +[2023-10-08 16:04:02,225][21194] Updated weights for policy 1, policy_version 9080 (0.0010) +[2023-10-08 16:04:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18677760. Throughput: 0: 1741.2, 1: 1744.5. Samples: 4677910. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:04:03,803][19739] Avg episode reward: [(0, '146.390'), (1, '246.140')] +[2023-10-08 16:04:04,917][21195] Updated weights for policy 0, policy_version 9160 (0.0010) +[2023-10-08 16:04:05,295][21195] Updated weights for policy 0, policy_version 9170 (0.0010) +[2023-10-08 16:04:05,658][21195] Updated weights for policy 0, policy_version 9180 (0.0009) +[2023-10-08 16:04:06,103][21194] Updated weights for policy 1, policy_version 9090 (0.0009) +[2023-10-08 16:04:06,475][21194] Updated weights for policy 1, policy_version 9100 (0.0010) +[2023-10-08 16:04:06,852][21194] Updated weights for policy 1, policy_version 9110 (0.0007) +[2023-10-08 16:04:07,211][21194] Updated weights for policy 1, policy_version 9120 (0.0008) +[2023-10-08 16:04:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 18743296. Throughput: 0: 1708.1, 1: 1718.1. Samples: 4691916. Policy #0 lag: (min: 17.0, avg: 26.2, max: 49.0) +[2023-10-08 16:04:08,803][19739] Avg episode reward: [(0, '146.390'), (1, '246.140')] +[2023-10-08 16:04:09,662][21195] Updated weights for policy 0, policy_version 9190 (0.0009) +[2023-10-08 16:04:10,038][21195] Updated weights for policy 0, policy_version 9200 (0.0008) +[2023-10-08 16:04:10,400][21195] Updated weights for policy 0, policy_version 9210 (0.0008) +[2023-10-08 16:04:11,075][21194] Updated weights for policy 1, policy_version 9130 (0.0011) +[2023-10-08 16:04:11,446][21194] Updated weights for policy 1, policy_version 9140 (0.0008) +[2023-10-08 16:04:11,808][21194] Updated weights for policy 1, policy_version 9150 (0.0008) +[2023-10-08 16:04:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 18808832. Throughput: 0: 1738.4, 1: 1713.0. Samples: 4713046. Policy #0 lag: (min: 17.0, avg: 26.2, max: 49.0) +[2023-10-08 16:04:13,803][19739] Avg episode reward: [(0, '155.030'), (1, '239.740')] +[2023-10-08 16:04:14,411][21195] Updated weights for policy 0, policy_version 9220 (0.0009) +[2023-10-08 16:04:14,789][21195] Updated weights for policy 0, policy_version 9230 (0.0008) +[2023-10-08 16:04:15,169][21195] Updated weights for policy 0, policy_version 9240 (0.0007) +[2023-10-08 16:04:15,655][21194] Updated weights for policy 1, policy_version 9160 (0.0009) +[2023-10-08 16:04:16,022][21194] Updated weights for policy 1, policy_version 9170 (0.0009) +[2023-10-08 16:04:16,385][21194] Updated weights for policy 1, policy_version 9180 (0.0009) +[2023-10-08 16:04:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 18874368. Throughput: 0: 1734.4, 1: 1727.0. Samples: 4729112. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:04:18,803][19739] Avg episode reward: [(0, '155.030'), (1, '252.770')] +[2023-10-08 16:04:18,804][20836] Saving new best policy, reward=252.770! +[2023-10-08 16:04:18,977][21195] Updated weights for policy 0, policy_version 9250 (0.0008) +[2023-10-08 16:04:19,350][21195] Updated weights for policy 0, policy_version 9260 (0.0007) +[2023-10-08 16:04:19,727][21195] Updated weights for policy 0, policy_version 9270 (0.0007) +[2023-10-08 16:04:20,101][21195] Updated weights for policy 0, policy_version 9280 (0.0008) +[2023-10-08 16:04:20,366][21194] Updated weights for policy 1, policy_version 9190 (0.0009) +[2023-10-08 16:04:20,727][21194] Updated weights for policy 1, policy_version 9200 (0.0008) +[2023-10-08 16:04:21,106][21194] Updated weights for policy 1, policy_version 9210 (0.0007) +[2023-10-08 16:04:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 18939904. Throughput: 0: 1727.8, 1: 1705.9. Samples: 4743992. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:04:23,804][19739] Avg episode reward: [(0, '142.510'), (1, '252.770')] +[2023-10-08 16:04:24,108][21195] Updated weights for policy 0, policy_version 9290 (0.0011) +[2023-10-08 16:04:24,489][21195] Updated weights for policy 0, policy_version 9300 (0.0009) +[2023-10-08 16:04:24,857][21195] Updated weights for policy 0, policy_version 9310 (0.0009) +[2023-10-08 16:04:24,929][21194] Updated weights for policy 1, policy_version 9220 (0.0007) +[2023-10-08 16:04:25,300][21194] Updated weights for policy 1, policy_version 9230 (0.0011) +[2023-10-08 16:04:25,669][21194] Updated weights for policy 1, policy_version 9240 (0.0009) +[2023-10-08 16:04:28,800][21195] Updated weights for policy 0, policy_version 9320 (0.0011) +[2023-10-08 16:04:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 19005440. Throughput: 0: 1734.6, 1: 1729.6. Samples: 4765434. Policy #0 lag: (min: 11.0, avg: 11.3, max: 22.0) +[2023-10-08 16:04:28,803][19739] Avg episode reward: [(0, '142.510'), (1, '252.770')] +[2023-10-08 16:04:29,170][21195] Updated weights for policy 0, policy_version 9330 (0.0009) +[2023-10-08 16:04:29,540][21195] Updated weights for policy 0, policy_version 9340 (0.0007) +[2023-10-08 16:04:29,652][21194] Updated weights for policy 1, policy_version 9250 (0.0009) +[2023-10-08 16:04:30,012][21194] Updated weights for policy 1, policy_version 9260 (0.0007) +[2023-10-08 16:04:30,383][21194] Updated weights for policy 1, policy_version 9270 (0.0007) +[2023-10-08 16:04:30,746][21194] Updated weights for policy 1, policy_version 9280 (0.0010) +[2023-10-08 16:04:33,502][21195] Updated weights for policy 0, policy_version 9350 (0.0008) +[2023-10-08 16:04:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 19070976. Throughput: 0: 1724.8, 1: 1711.9. Samples: 4780306. Policy #0 lag: (min: 11.0, avg: 11.3, max: 22.0) +[2023-10-08 16:04:33,804][19739] Avg episode reward: [(0, '142.510'), (1, '255.090')] +[2023-10-08 16:04:33,805][20836] Saving new best policy, reward=255.090! +[2023-10-08 16:04:33,885][21195] Updated weights for policy 0, policy_version 9360 (0.0010) +[2023-10-08 16:04:34,253][21195] Updated weights for policy 0, policy_version 9370 (0.0008) +[2023-10-08 16:04:34,735][21194] Updated weights for policy 1, policy_version 9290 (0.0009) +[2023-10-08 16:04:35,097][21194] Updated weights for policy 1, policy_version 9300 (0.0009) +[2023-10-08 16:04:35,472][21194] Updated weights for policy 1, policy_version 9310 (0.0008) +[2023-10-08 16:04:38,001][21195] Updated weights for policy 0, policy_version 9380 (0.0008) +[2023-10-08 16:04:38,376][21195] Updated weights for policy 0, policy_version 9390 (0.0009) +[2023-10-08 16:04:38,757][21195] Updated weights for policy 0, policy_version 9400 (0.0010) +[2023-10-08 16:04:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 19136512. Throughput: 0: 1744.4, 1: 1723.0. Samples: 4796544. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:04:38,803][19739] Avg episode reward: [(0, '142.770'), (1, '266.000')] +[2023-10-08 16:04:38,805][20836] Saving new best policy, reward=266.000! +[2023-10-08 16:04:39,501][21194] Updated weights for policy 1, policy_version 9320 (0.0008) +[2023-10-08 16:04:39,878][21194] Updated weights for policy 1, policy_version 9330 (0.0007) +[2023-10-08 16:04:40,250][21194] Updated weights for policy 1, policy_version 9340 (0.0007) +[2023-10-08 16:04:42,436][21195] Updated weights for policy 0, policy_version 9410 (0.0007) +[2023-10-08 16:04:42,804][21195] Updated weights for policy 0, policy_version 9420 (0.0008) +[2023-10-08 16:04:43,175][21195] Updated weights for policy 0, policy_version 9430 (0.0010) +[2023-10-08 16:04:43,546][21195] Updated weights for policy 0, policy_version 9440 (0.0008) +[2023-10-08 16:04:43,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 19234816. Throughput: 0: 1736.0, 1: 1744.4. Samples: 4817786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:04:43,803][19739] Avg episode reward: [(0, '150.520'), (1, '266.000')] +[2023-10-08 16:04:43,969][21194] Updated weights for policy 1, policy_version 9350 (0.0007) +[2023-10-08 16:04:44,335][21194] Updated weights for policy 1, policy_version 9360 (0.0007) +[2023-10-08 16:04:44,708][21194] Updated weights for policy 1, policy_version 9370 (0.0007) +[2023-10-08 16:04:47,424][21195] Updated weights for policy 0, policy_version 9450 (0.0009) +[2023-10-08 16:04:47,796][21195] Updated weights for policy 0, policy_version 9460 (0.0007) +[2023-10-08 16:04:48,162][21195] Updated weights for policy 0, policy_version 9470 (0.0008) +[2023-10-08 16:04:48,762][21194] Updated weights for policy 1, policy_version 9380 (0.0007) +[2023-10-08 16:04:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 19300352. Throughput: 0: 1719.5, 1: 1712.8. Samples: 4832360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:04:48,803][19739] Avg episode reward: [(0, '160.770'), (1, '266.000')] +[2023-10-08 16:04:49,125][21194] Updated weights for policy 1, policy_version 9390 (0.0008) +[2023-10-08 16:04:49,495][21194] Updated weights for policy 1, policy_version 9400 (0.0007) +[2023-10-08 16:04:52,031][21195] Updated weights for policy 0, policy_version 9480 (0.0007) +[2023-10-08 16:04:52,401][21195] Updated weights for policy 0, policy_version 9490 (0.0008) +[2023-10-08 16:04:52,772][21195] Updated weights for policy 0, policy_version 9500 (0.0009) +[2023-10-08 16:04:53,570][21194] Updated weights for policy 1, policy_version 9410 (0.0010) +[2023-10-08 16:04:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 19365888. Throughput: 0: 1754.7, 1: 1735.6. Samples: 4848978. Policy #0 lag: (min: 21.0, avg: 24.7, max: 53.0) +[2023-10-08 16:04:53,803][19739] Avg episode reward: [(0, '160.770'), (1, '266.000')] +[2023-10-08 16:04:53,942][21194] Updated weights for policy 1, policy_version 9420 (0.0009) +[2023-10-08 16:04:54,312][21194] Updated weights for policy 1, policy_version 9430 (0.0007) +[2023-10-08 16:04:54,676][21194] Updated weights for policy 1, policy_version 9440 (0.0007) +[2023-10-08 16:04:56,688][21195] Updated weights for policy 0, policy_version 9510 (0.0008) +[2023-10-08 16:04:57,058][21195] Updated weights for policy 0, policy_version 9520 (0.0007) +[2023-10-08 16:04:57,433][21195] Updated weights for policy 0, policy_version 9530 (0.0010) +[2023-10-08 16:04:58,632][21194] Updated weights for policy 1, policy_version 9450 (0.0007) +[2023-10-08 16:04:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 19431424. Throughput: 0: 1723.7, 1: 1740.5. Samples: 4868934. Policy #0 lag: (min: 21.0, avg: 24.7, max: 53.0) +[2023-10-08 16:04:58,803][19739] Avg episode reward: [(0, '160.770'), (1, '266.000')] +[2023-10-08 16:04:59,001][21194] Updated weights for policy 1, policy_version 9460 (0.0010) +[2023-10-08 16:04:59,361][21194] Updated weights for policy 1, policy_version 9470 (0.0009) +[2023-10-08 16:05:01,417][21195] Updated weights for policy 0, policy_version 9540 (0.0010) +[2023-10-08 16:05:01,793][21195] Updated weights for policy 0, policy_version 9550 (0.0010) +[2023-10-08 16:05:02,160][21195] Updated weights for policy 0, policy_version 9560 (0.0010) +[2023-10-08 16:05:03,224][21194] Updated weights for policy 1, policy_version 9480 (0.0008) +[2023-10-08 16:05:03,592][21194] Updated weights for policy 1, policy_version 9490 (0.0007) +[2023-10-08 16:05:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 19496960. Throughput: 0: 1725.5, 1: 1722.9. Samples: 4884290. Policy #0 lag: (min: 18.0, avg: 26.0, max: 50.0) +[2023-10-08 16:05:03,803][19739] Avg episode reward: [(0, '169.130'), (1, '282.050')] +[2023-10-08 16:05:03,804][20740] Saving new best policy, reward=169.130! +[2023-10-08 16:05:03,955][21194] Updated weights for policy 1, policy_version 9500 (0.0009) +[2023-10-08 16:05:04,097][20836] Saving new best policy, reward=282.050! +[2023-10-08 16:05:06,008][21195] Updated weights for policy 0, policy_version 9570 (0.0011) +[2023-10-08 16:05:06,377][21195] Updated weights for policy 0, policy_version 9580 (0.0007) +[2023-10-08 16:05:06,757][21195] Updated weights for policy 0, policy_version 9590 (0.0007) +[2023-10-08 16:05:07,133][21195] Updated weights for policy 0, policy_version 9600 (0.0010) +[2023-10-08 16:05:07,991][21194] Updated weights for policy 1, policy_version 9510 (0.0009) +[2023-10-08 16:05:08,367][21194] Updated weights for policy 1, policy_version 9520 (0.0007) +[2023-10-08 16:05:08,730][21194] Updated weights for policy 1, policy_version 9530 (0.0007) +[2023-10-08 16:05:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 19562496. Throughput: 0: 1730.3, 1: 1739.2. Samples: 4900116. Policy #0 lag: (min: 18.0, avg: 26.0, max: 50.0) +[2023-10-08 16:05:08,803][19739] Avg episode reward: [(0, '170.810'), (1, '282.050')] +[2023-10-08 16:05:08,804][20740] Saving new best policy, reward=170.810! +[2023-10-08 16:05:10,763][21195] Updated weights for policy 0, policy_version 9610 (0.0008) +[2023-10-08 16:05:11,142][21195] Updated weights for policy 0, policy_version 9620 (0.0010) +[2023-10-08 16:05:11,505][21195] Updated weights for policy 0, policy_version 9630 (0.0011) +[2023-10-08 16:05:12,681][21194] Updated weights for policy 1, policy_version 9540 (0.0010) +[2023-10-08 16:05:13,045][21194] Updated weights for policy 1, policy_version 9550 (0.0009) +[2023-10-08 16:05:13,404][21194] Updated weights for policy 1, policy_version 9560 (0.0008) +[2023-10-08 16:05:13,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 19660800. Throughput: 0: 1727.5, 1: 1719.2. Samples: 4920536. Policy #0 lag: (min: 14.0, avg: 22.0, max: 46.0) +[2023-10-08 16:05:13,803][19739] Avg episode reward: [(0, '170.810'), (1, '285.460')] +[2023-10-08 16:05:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000009568_9797632.pth... +[2023-10-08 16:05:13,815][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000009632_9863168.pth... +[2023-10-08 16:05:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000008000_8192000.pth +[2023-10-08 16:05:13,854][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000007936_8126464.pth +[2023-10-08 16:05:13,859][20836] Saving new best policy, reward=285.460! +[2023-10-08 16:05:15,741][21195] Updated weights for policy 0, policy_version 9640 (0.0010) +[2023-10-08 16:05:16,109][21195] Updated weights for policy 0, policy_version 9650 (0.0010) +[2023-10-08 16:05:16,487][21195] Updated weights for policy 0, policy_version 9660 (0.0010) +[2023-10-08 16:05:17,258][21194] Updated weights for policy 1, policy_version 9570 (0.0007) +[2023-10-08 16:05:17,622][21194] Updated weights for policy 1, policy_version 9580 (0.0007) +[2023-10-08 16:05:18,003][21194] Updated weights for policy 1, policy_version 9590 (0.0009) +[2023-10-08 16:05:18,365][21194] Updated weights for policy 1, policy_version 9600 (0.0009) +[2023-10-08 16:05:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 19726336. Throughput: 0: 1735.0, 1: 1731.6. Samples: 4936306. Policy #0 lag: (min: 14.0, avg: 22.0, max: 46.0) +[2023-10-08 16:05:18,803][19739] Avg episode reward: [(0, '174.430'), (1, '282.720')] +[2023-10-08 16:05:18,804][20740] Saving new best policy, reward=174.430! +[2023-10-08 16:05:20,597][21195] Updated weights for policy 0, policy_version 9670 (0.0008) +[2023-10-08 16:05:20,978][21195] Updated weights for policy 0, policy_version 9680 (0.0009) +[2023-10-08 16:05:21,345][21195] Updated weights for policy 0, policy_version 9690 (0.0010) +[2023-10-08 16:05:22,498][21194] Updated weights for policy 1, policy_version 9610 (0.0008) +[2023-10-08 16:05:22,869][21194] Updated weights for policy 1, policy_version 9620 (0.0008) +[2023-10-08 16:05:23,238][21194] Updated weights for policy 1, policy_version 9630 (0.0008) +[2023-10-08 16:05:23,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 19791872. Throughput: 0: 1716.3, 1: 1727.4. Samples: 4951512. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 16:05:23,803][19739] Avg episode reward: [(0, '173.050'), (1, '282.720')] +[2023-10-08 16:05:25,372][21195] Updated weights for policy 0, policy_version 9700 (0.0008) +[2023-10-08 16:05:25,752][21195] Updated weights for policy 0, policy_version 9710 (0.0008) +[2023-10-08 16:05:26,123][21195] Updated weights for policy 0, policy_version 9720 (0.0009) +[2023-10-08 16:05:27,123][21194] Updated weights for policy 1, policy_version 9640 (0.0007) +[2023-10-08 16:05:27,499][21194] Updated weights for policy 1, policy_version 9650 (0.0007) +[2023-10-08 16:05:27,876][21194] Updated weights for policy 1, policy_version 9660 (0.0009) +[2023-10-08 16:05:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 19857408. Throughput: 0: 1720.8, 1: 1699.0. Samples: 4971676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 16:05:28,803][19739] Avg episode reward: [(0, '186.380'), (1, '282.720')] +[2023-10-08 16:05:28,812][20740] Saving new best policy, reward=186.380! +[2023-10-08 16:05:30,034][21195] Updated weights for policy 0, policy_version 9730 (0.0009) +[2023-10-08 16:05:30,403][21195] Updated weights for policy 0, policy_version 9740 (0.0010) +[2023-10-08 16:05:30,772][21195] Updated weights for policy 0, policy_version 9750 (0.0009) +[2023-10-08 16:05:31,143][21195] Updated weights for policy 0, policy_version 9760 (0.0007) +[2023-10-08 16:05:31,799][21194] Updated weights for policy 1, policy_version 9670 (0.0007) +[2023-10-08 16:05:32,167][21194] Updated weights for policy 1, policy_version 9680 (0.0008) +[2023-10-08 16:05:32,537][21194] Updated weights for policy 1, policy_version 9690 (0.0008) +[2023-10-08 16:05:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 19922944. Throughput: 0: 1738.1, 1: 1725.3. Samples: 4988212. Policy #0 lag: (min: 31.0, avg: 32.2, max: 55.0) +[2023-10-08 16:05:33,803][19739] Avg episode reward: [(0, '186.380'), (1, '282.720')] +[2023-10-08 16:05:35,128][21195] Updated weights for policy 0, policy_version 9770 (0.0009) +[2023-10-08 16:05:35,499][21195] Updated weights for policy 0, policy_version 9780 (0.0008) +[2023-10-08 16:05:35,866][21195] Updated weights for policy 0, policy_version 9790 (0.0008) +[2023-10-08 16:05:36,568][21194] Updated weights for policy 1, policy_version 9700 (0.0008) +[2023-10-08 16:05:36,945][21194] Updated weights for policy 1, policy_version 9710 (0.0007) +[2023-10-08 16:05:37,310][21194] Updated weights for policy 1, policy_version 9720 (0.0007) +[2023-10-08 16:05:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 19988480. Throughput: 0: 1706.3, 1: 1714.9. Samples: 5002930. Policy #0 lag: (min: 31.0, avg: 32.2, max: 55.0) +[2023-10-08 16:05:38,803][19739] Avg episode reward: [(0, '182.690'), (1, '284.930')] +[2023-10-08 16:05:39,818][21195] Updated weights for policy 0, policy_version 9800 (0.0007) +[2023-10-08 16:05:40,185][21195] Updated weights for policy 0, policy_version 9810 (0.0008) +[2023-10-08 16:05:40,556][21195] Updated weights for policy 0, policy_version 9820 (0.0008) +[2023-10-08 16:05:41,251][21194] Updated weights for policy 1, policy_version 9730 (0.0008) +[2023-10-08 16:05:41,626][21194] Updated weights for policy 1, policy_version 9740 (0.0010) +[2023-10-08 16:05:41,991][21194] Updated weights for policy 1, policy_version 9750 (0.0007) +[2023-10-08 16:05:42,355][21194] Updated weights for policy 1, policy_version 9760 (0.0007) +[2023-10-08 16:05:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20054016. Throughput: 0: 1737.0, 1: 1704.4. Samples: 5023794. Policy #0 lag: (min: 27.0, avg: 27.5, max: 43.0) +[2023-10-08 16:05:43,803][19739] Avg episode reward: [(0, '182.240'), (1, '284.930')] +[2023-10-08 16:05:44,344][21195] Updated weights for policy 0, policy_version 9830 (0.0008) +[2023-10-08 16:05:44,716][21195] Updated weights for policy 0, policy_version 9840 (0.0007) +[2023-10-08 16:05:45,096][21195] Updated weights for policy 0, policy_version 9850 (0.0008) +[2023-10-08 16:05:46,305][21194] Updated weights for policy 1, policy_version 9770 (0.0009) +[2023-10-08 16:05:46,675][21194] Updated weights for policy 1, policy_version 9780 (0.0010) +[2023-10-08 16:05:47,037][21194] Updated weights for policy 1, policy_version 9790 (0.0009) +[2023-10-08 16:05:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 20119552. Throughput: 0: 1735.0, 1: 1735.9. Samples: 5040482. Policy #0 lag: (min: 27.0, avg: 27.5, max: 43.0) +[2023-10-08 16:05:48,803][19739] Avg episode reward: [(0, '186.640'), (1, '273.210')] +[2023-10-08 16:05:48,804][20740] Saving new best policy, reward=186.640! +[2023-10-08 16:05:49,137][21195] Updated weights for policy 0, policy_version 9860 (0.0009) +[2023-10-08 16:05:49,514][21195] Updated weights for policy 0, policy_version 9870 (0.0008) +[2023-10-08 16:05:49,882][21195] Updated weights for policy 0, policy_version 9880 (0.0009) +[2023-10-08 16:05:50,911][21194] Updated weights for policy 1, policy_version 9800 (0.0008) +[2023-10-08 16:05:51,275][21194] Updated weights for policy 1, policy_version 9810 (0.0010) +[2023-10-08 16:05:51,649][21194] Updated weights for policy 1, policy_version 9820 (0.0007) +[2023-10-08 16:05:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20185088. Throughput: 0: 1728.1, 1: 1705.7. Samples: 5054638. Policy #0 lag: (min: 26.0, avg: 26.5, max: 41.0) +[2023-10-08 16:05:53,803][19739] Avg episode reward: [(0, '193.330'), (1, '281.600')] +[2023-10-08 16:05:53,850][21195] Updated weights for policy 0, policy_version 9890 (0.0008) +[2023-10-08 16:05:54,211][21195] Updated weights for policy 0, policy_version 9900 (0.0010) +[2023-10-08 16:05:54,582][21195] Updated weights for policy 0, policy_version 9910 (0.0009) +[2023-10-08 16:05:54,950][20740] Saving new best policy, reward=193.330! +[2023-10-08 16:05:54,956][21195] Updated weights for policy 0, policy_version 9920 (0.0009) +[2023-10-08 16:05:55,537][21194] Updated weights for policy 1, policy_version 9830 (0.0009) +[2023-10-08 16:05:55,910][21194] Updated weights for policy 1, policy_version 9840 (0.0010) +[2023-10-08 16:05:56,283][21194] Updated weights for policy 1, policy_version 9850 (0.0010) +[2023-10-08 16:05:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20250624. Throughput: 0: 1735.9, 1: 1723.9. Samples: 5076228. Policy #0 lag: (min: 26.0, avg: 26.5, max: 41.0) +[2023-10-08 16:05:58,803][19739] Avg episode reward: [(0, '193.330'), (1, '281.600')] +[2023-10-08 16:05:58,879][21195] Updated weights for policy 0, policy_version 9930 (0.0009) +[2023-10-08 16:05:59,258][21195] Updated weights for policy 0, policy_version 9940 (0.0007) +[2023-10-08 16:05:59,629][21195] Updated weights for policy 0, policy_version 9950 (0.0008) +[2023-10-08 16:06:00,230][21194] Updated weights for policy 1, policy_version 9860 (0.0012) +[2023-10-08 16:06:00,606][21194] Updated weights for policy 1, policy_version 9870 (0.0010) +[2023-10-08 16:06:00,975][21194] Updated weights for policy 1, policy_version 9880 (0.0011) +[2023-10-08 16:06:03,460][21195] Updated weights for policy 0, policy_version 9960 (0.0008) +[2023-10-08 16:06:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20316160. Throughput: 0: 1724.2, 1: 1714.4. Samples: 5091042. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:06:03,803][19739] Avg episode reward: [(0, '198.410'), (1, '281.600')] +[2023-10-08 16:06:03,823][21195] Updated weights for policy 0, policy_version 9970 (0.0007) +[2023-10-08 16:06:04,192][21195] Updated weights for policy 0, policy_version 9980 (0.0008) +[2023-10-08 16:06:04,339][20740] Saving new best policy, reward=198.410! +[2023-10-08 16:06:04,792][21194] Updated weights for policy 1, policy_version 9890 (0.0008) +[2023-10-08 16:06:05,157][21194] Updated weights for policy 1, policy_version 9900 (0.0007) +[2023-10-08 16:06:05,517][21194] Updated weights for policy 1, policy_version 9910 (0.0009) +[2023-10-08 16:06:05,892][21194] Updated weights for policy 1, policy_version 9920 (0.0008) +[2023-10-08 16:06:08,186][21195] Updated weights for policy 0, policy_version 9990 (0.0010) +[2023-10-08 16:06:08,561][21195] Updated weights for policy 0, policy_version 10000 (0.0010) +[2023-10-08 16:06:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20381696. Throughput: 0: 1740.4, 1: 1710.0. Samples: 5106780. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:06:08,804][19739] Avg episode reward: [(0, '199.440'), (1, '282.970')] +[2023-10-08 16:06:08,935][21195] Updated weights for policy 0, policy_version 10010 (0.0010) +[2023-10-08 16:06:09,158][20740] Saving new best policy, reward=199.440! +[2023-10-08 16:06:09,864][21194] Updated weights for policy 1, policy_version 9930 (0.0008) +[2023-10-08 16:06:10,233][21194] Updated weights for policy 1, policy_version 9940 (0.0009) +[2023-10-08 16:06:10,602][21194] Updated weights for policy 1, policy_version 9950 (0.0010) +[2023-10-08 16:06:12,897][21195] Updated weights for policy 0, policy_version 10020 (0.0009) +[2023-10-08 16:06:13,289][21195] Updated weights for policy 0, policy_version 10030 (0.0009) +[2023-10-08 16:06:13,666][21195] Updated weights for policy 0, policy_version 10040 (0.0009) +[2023-10-08 16:06:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 20447232. Throughput: 0: 1736.9, 1: 1739.3. Samples: 5128108. Policy #0 lag: (min: 31.0, avg: 46.9, max: 63.0) +[2023-10-08 16:06:13,803][19739] Avg episode reward: [(0, '199.440'), (1, '273.420')] +[2023-10-08 16:06:14,659][21194] Updated weights for policy 1, policy_version 9960 (0.0009) +[2023-10-08 16:06:15,026][21194] Updated weights for policy 1, policy_version 9970 (0.0007) +[2023-10-08 16:06:15,401][21194] Updated weights for policy 1, policy_version 9980 (0.0008) +[2023-10-08 16:06:17,388][21195] Updated weights for policy 0, policy_version 10050 (0.0008) +[2023-10-08 16:06:17,748][21195] Updated weights for policy 0, policy_version 10060 (0.0008) +[2023-10-08 16:06:18,115][21195] Updated weights for policy 0, policy_version 10070 (0.0008) +[2023-10-08 16:06:18,493][21195] Updated weights for policy 0, policy_version 10080 (0.0008) +[2023-10-08 16:06:18,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 20545536. Throughput: 0: 1711.0, 1: 1711.7. Samples: 5142232. Policy #0 lag: (min: 4.0, avg: 12.0, max: 36.0) +[2023-10-08 16:06:18,803][19739] Avg episode reward: [(0, '209.270'), (1, '273.420')] +[2023-10-08 16:06:18,804][20740] Saving new best policy, reward=209.270! +[2023-10-08 16:06:19,271][21194] Updated weights for policy 1, policy_version 9990 (0.0009) +[2023-10-08 16:06:19,640][21194] Updated weights for policy 1, policy_version 10000 (0.0010) +[2023-10-08 16:06:20,015][21194] Updated weights for policy 1, policy_version 10010 (0.0008) +[2023-10-08 16:06:22,348][21195] Updated weights for policy 0, policy_version 10090 (0.0007) +[2023-10-08 16:06:22,720][21195] Updated weights for policy 0, policy_version 10100 (0.0008) +[2023-10-08 16:06:23,102][21195] Updated weights for policy 0, policy_version 10110 (0.0008) +[2023-10-08 16:06:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 20611072. Throughput: 0: 1739.3, 1: 1727.1. Samples: 5158918. Policy #0 lag: (min: 4.0, avg: 12.0, max: 36.0) +[2023-10-08 16:06:23,803][19739] Avg episode reward: [(0, '202.430'), (1, '273.420')] +[2023-10-08 16:06:24,009][21194] Updated weights for policy 1, policy_version 10020 (0.0007) +[2023-10-08 16:06:24,377][21194] Updated weights for policy 1, policy_version 10030 (0.0008) +[2023-10-08 16:06:24,735][21194] Updated weights for policy 1, policy_version 10040 (0.0008) +[2023-10-08 16:06:27,143][21195] Updated weights for policy 0, policy_version 10120 (0.0008) +[2023-10-08 16:06:27,511][21195] Updated weights for policy 0, policy_version 10130 (0.0007) +[2023-10-08 16:06:27,884][21195] Updated weights for policy 0, policy_version 10140 (0.0007) +[2023-10-08 16:06:28,722][21194] Updated weights for policy 1, policy_version 10050 (0.0007) +[2023-10-08 16:06:28,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 20676608. Throughput: 0: 1715.8, 1: 1737.4. Samples: 5179188. Policy #0 lag: (min: 9.0, avg: 9.7, max: 26.0) +[2023-10-08 16:06:28,804][19739] Avg episode reward: [(0, '216.320'), (1, '273.790')] +[2023-10-08 16:06:28,815][20740] Saving new best policy, reward=216.320! +[2023-10-08 16:06:29,088][21194] Updated weights for policy 1, policy_version 10060 (0.0008) +[2023-10-08 16:06:29,471][21194] Updated weights for policy 1, policy_version 10070 (0.0009) +[2023-10-08 16:06:29,851][21194] Updated weights for policy 1, policy_version 10080 (0.0010) +[2023-10-08 16:06:31,865][21195] Updated weights for policy 0, policy_version 10150 (0.0010) +[2023-10-08 16:06:32,241][21195] Updated weights for policy 0, policy_version 10160 (0.0010) +[2023-10-08 16:06:32,609][21195] Updated weights for policy 0, policy_version 10170 (0.0010) +[2023-10-08 16:06:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 20742144. Throughput: 0: 1708.8, 1: 1705.8. Samples: 5194136. Policy #0 lag: (min: 9.0, avg: 9.7, max: 26.0) +[2023-10-08 16:06:33,803][19739] Avg episode reward: [(0, '210.840'), (1, '273.790')] +[2023-10-08 16:06:33,909][21194] Updated weights for policy 1, policy_version 10090 (0.0011) +[2023-10-08 16:06:34,278][21194] Updated weights for policy 1, policy_version 10100 (0.0010) +[2023-10-08 16:06:34,644][21194] Updated weights for policy 1, policy_version 10110 (0.0011) +[2023-10-08 16:06:36,564][21195] Updated weights for policy 0, policy_version 10180 (0.0009) +[2023-10-08 16:06:36,945][21195] Updated weights for policy 0, policy_version 10190 (0.0009) +[2023-10-08 16:06:37,314][21195] Updated weights for policy 0, policy_version 10200 (0.0010) +[2023-10-08 16:06:38,485][21194] Updated weights for policy 1, policy_version 10120 (0.0008) +[2023-10-08 16:06:38,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20807680. Throughput: 0: 1730.0, 1: 1736.6. Samples: 5210638. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:06:38,803][19739] Avg episode reward: [(0, '210.360'), (1, '273.790')] +[2023-10-08 16:06:38,847][21194] Updated weights for policy 1, policy_version 10130 (0.0008) +[2023-10-08 16:06:39,225][21194] Updated weights for policy 1, policy_version 10140 (0.0007) +[2023-10-08 16:06:41,197][21195] Updated weights for policy 0, policy_version 10210 (0.0009) +[2023-10-08 16:06:41,568][21195] Updated weights for policy 0, policy_version 10220 (0.0008) +[2023-10-08 16:06:41,947][21195] Updated weights for policy 0, policy_version 10230 (0.0009) +[2023-10-08 16:06:42,329][21195] Updated weights for policy 0, policy_version 10240 (0.0007) +[2023-10-08 16:06:43,204][21194] Updated weights for policy 1, policy_version 10150 (0.0009) +[2023-10-08 16:06:43,570][21194] Updated weights for policy 1, policy_version 10160 (0.0011) +[2023-10-08 16:06:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 20873216. Throughput: 0: 1706.7, 1: 1728.9. Samples: 5230830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:06:43,803][19739] Avg episode reward: [(0, '207.970'), (1, '273.790')] +[2023-10-08 16:06:43,930][21194] Updated weights for policy 1, policy_version 10170 (0.0010) +[2023-10-08 16:06:46,132][21195] Updated weights for policy 0, policy_version 10250 (0.0007) +[2023-10-08 16:06:46,507][21195] Updated weights for policy 0, policy_version 10260 (0.0009) +[2023-10-08 16:06:46,870][21195] Updated weights for policy 0, policy_version 10270 (0.0010) +[2023-10-08 16:06:48,038][21194] Updated weights for policy 1, policy_version 10180 (0.0010) +[2023-10-08 16:06:48,408][21194] Updated weights for policy 1, policy_version 10190 (0.0007) +[2023-10-08 16:06:48,779][21194] Updated weights for policy 1, policy_version 10200 (0.0011) +[2023-10-08 16:06:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 20938752. Throughput: 0: 1730.2, 1: 1723.0. Samples: 5246434. Policy #0 lag: (min: 10.0, avg: 17.5, max: 42.0) +[2023-10-08 16:06:48,803][19739] Avg episode reward: [(0, '210.140'), (1, '287.760')] +[2023-10-08 16:06:49,067][20836] Saving new best policy, reward=287.760! +[2023-10-08 16:06:50,704][21195] Updated weights for policy 0, policy_version 10280 (0.0008) +[2023-10-08 16:06:51,082][21195] Updated weights for policy 0, policy_version 10290 (0.0007) +[2023-10-08 16:06:51,455][21195] Updated weights for policy 0, policy_version 10300 (0.0008) +[2023-10-08 16:06:52,663][21194] Updated weights for policy 1, policy_version 10210 (0.0009) +[2023-10-08 16:06:53,038][21194] Updated weights for policy 1, policy_version 10220 (0.0009) +[2023-10-08 16:06:53,398][21194] Updated weights for policy 1, policy_version 10230 (0.0007) +[2023-10-08 16:06:53,773][21194] Updated weights for policy 1, policy_version 10240 (0.0009) +[2023-10-08 16:06:53,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 21037056. Throughput: 0: 1719.2, 1: 1725.6. Samples: 5261796. Policy #0 lag: (min: 10.0, avg: 17.5, max: 42.0) +[2023-10-08 16:06:53,804][19739] Avg episode reward: [(0, '210.140'), (1, '295.650')] +[2023-10-08 16:06:53,805][20836] Saving new best policy, reward=295.650! +[2023-10-08 16:06:55,260][21195] Updated weights for policy 0, policy_version 10310 (0.0008) +[2023-10-08 16:06:55,624][21195] Updated weights for policy 0, policy_version 10320 (0.0008) +[2023-10-08 16:06:55,988][21195] Updated weights for policy 0, policy_version 10330 (0.0009) +[2023-10-08 16:06:57,749][21194] Updated weights for policy 1, policy_version 10250 (0.0008) +[2023-10-08 16:06:58,114][21194] Updated weights for policy 1, policy_version 10260 (0.0007) +[2023-10-08 16:06:58,482][21194] Updated weights for policy 1, policy_version 10270 (0.0008) +[2023-10-08 16:06:58,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 21102592. Throughput: 0: 1728.1, 1: 1706.5. Samples: 5282666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:06:58,804][19739] Avg episode reward: [(0, '211.000'), (1, '299.930')] +[2023-10-08 16:06:58,815][20836] Saving new best policy, reward=299.930! +[2023-10-08 16:06:59,861][21195] Updated weights for policy 0, policy_version 10340 (0.0009) +[2023-10-08 16:07:00,249][21195] Updated weights for policy 0, policy_version 10350 (0.0008) +[2023-10-08 16:07:00,630][21195] Updated weights for policy 0, policy_version 10360 (0.0011) +[2023-10-08 16:07:02,565][21194] Updated weights for policy 1, policy_version 10280 (0.0007) +[2023-10-08 16:07:02,936][21194] Updated weights for policy 1, policy_version 10290 (0.0009) +[2023-10-08 16:07:03,305][21194] Updated weights for policy 1, policy_version 10300 (0.0008) +[2023-10-08 16:07:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 21168128. Throughput: 0: 1758.1, 1: 1724.3. Samples: 5298940. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:07:03,804][19739] Avg episode reward: [(0, '210.930'), (1, '306.100')] +[2023-10-08 16:07:03,806][20836] Saving new best policy, reward=306.100! +[2023-10-08 16:07:04,479][21195] Updated weights for policy 0, policy_version 10370 (0.0009) +[2023-10-08 16:07:04,855][21195] Updated weights for policy 0, policy_version 10380 (0.0011) +[2023-10-08 16:07:05,229][21195] Updated weights for policy 0, policy_version 10390 (0.0008) +[2023-10-08 16:07:05,593][21195] Updated weights for policy 0, policy_version 10400 (0.0008) +[2023-10-08 16:07:07,163][21194] Updated weights for policy 1, policy_version 10310 (0.0008) +[2023-10-08 16:07:07,538][21194] Updated weights for policy 1, policy_version 10320 (0.0010) +[2023-10-08 16:07:07,902][21194] Updated weights for policy 1, policy_version 10330 (0.0008) +[2023-10-08 16:07:08,803][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 21233664. Throughput: 0: 1730.4, 1: 1722.2. Samples: 5314288. Policy #0 lag: (min: 26.0, avg: 34.0, max: 58.0) +[2023-10-08 16:07:08,803][19739] Avg episode reward: [(0, '210.930'), (1, '305.590')] +[2023-10-08 16:07:09,440][21195] Updated weights for policy 0, policy_version 10410 (0.0010) +[2023-10-08 16:07:09,810][21195] Updated weights for policy 0, policy_version 10420 (0.0007) +[2023-10-08 16:07:10,193][21195] Updated weights for policy 0, policy_version 10430 (0.0010) +[2023-10-08 16:07:11,821][21194] Updated weights for policy 1, policy_version 10340 (0.0010) +[2023-10-08 16:07:12,193][21194] Updated weights for policy 1, policy_version 10350 (0.0011) +[2023-10-08 16:07:12,572][21194] Updated weights for policy 1, policy_version 10360 (0.0009) +[2023-10-08 16:07:13,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 21299200. Throughput: 0: 1758.3, 1: 1694.0. Samples: 5334540. Policy #0 lag: (min: 26.0, avg: 34.0, max: 58.0) +[2023-10-08 16:07:13,803][19739] Avg episode reward: [(0, '223.670'), (1, '308.460')] +[2023-10-08 16:07:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000010368_10616832.pth... +[2023-10-08 16:07:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000008768_8978432.pth +[2023-10-08 16:07:13,858][20836] Saving new best policy, reward=308.460! +[2023-10-08 16:07:14,011][21195] Updated weights for policy 0, policy_version 10440 (0.0009) +[2023-10-08 16:07:14,376][21195] Updated weights for policy 0, policy_version 10450 (0.0008) +[2023-10-08 16:07:14,756][21195] Updated weights for policy 0, policy_version 10460 (0.0009) +[2023-10-08 16:07:14,898][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000010464_10715136.pth... +[2023-10-08 16:07:14,937][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000008832_9043968.pth +[2023-10-08 16:07:14,941][20740] Saving new best policy, reward=223.670! +[2023-10-08 16:07:16,426][21194] Updated weights for policy 1, policy_version 10370 (0.0009) +[2023-10-08 16:07:16,799][21194] Updated weights for policy 1, policy_version 10380 (0.0008) +[2023-10-08 16:07:17,163][21194] Updated weights for policy 1, policy_version 10390 (0.0008) +[2023-10-08 16:07:17,535][21194] Updated weights for policy 1, policy_version 10400 (0.0008) +[2023-10-08 16:07:18,603][21195] Updated weights for policy 0, policy_version 10470 (0.0007) +[2023-10-08 16:07:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 21364736. Throughput: 0: 1756.1, 1: 1727.1. Samples: 5350880. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:07:18,803][19739] Avg episode reward: [(0, '225.370'), (1, '308.460')] +[2023-10-08 16:07:18,969][21195] Updated weights for policy 0, policy_version 10480 (0.0008) +[2023-10-08 16:07:19,344][21195] Updated weights for policy 0, policy_version 10490 (0.0008) +[2023-10-08 16:07:19,561][20740] Saving new best policy, reward=225.370! +[2023-10-08 16:07:21,631][21194] Updated weights for policy 1, policy_version 10410 (0.0009) +[2023-10-08 16:07:21,993][21194] Updated weights for policy 1, policy_version 10420 (0.0007) +[2023-10-08 16:07:22,361][21194] Updated weights for policy 1, policy_version 10430 (0.0010) +[2023-10-08 16:07:23,317][21195] Updated weights for policy 0, policy_version 10500 (0.0009) +[2023-10-08 16:07:23,698][21195] Updated weights for policy 0, policy_version 10510 (0.0007) +[2023-10-08 16:07:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 21430272. Throughput: 0: 1743.6, 1: 1699.7. Samples: 5365584. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:07:23,803][19739] Avg episode reward: [(0, '232.000'), (1, '321.540')] +[2023-10-08 16:07:23,804][20836] Saving new best policy, reward=321.540! +[2023-10-08 16:07:24,066][21195] Updated weights for policy 0, policy_version 10520 (0.0008) +[2023-10-08 16:07:24,357][20740] Saving new best policy, reward=232.000! +[2023-10-08 16:07:26,287][21194] Updated weights for policy 1, policy_version 10440 (0.0008) +[2023-10-08 16:07:26,652][21194] Updated weights for policy 1, policy_version 10450 (0.0008) +[2023-10-08 16:07:27,020][21194] Updated weights for policy 1, policy_version 10460 (0.0009) +[2023-10-08 16:07:28,027][21195] Updated weights for policy 0, policy_version 10530 (0.0008) +[2023-10-08 16:07:28,398][21195] Updated weights for policy 0, policy_version 10540 (0.0009) +[2023-10-08 16:07:28,764][21195] Updated weights for policy 0, policy_version 10550 (0.0007) +[2023-10-08 16:07:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 21495808. Throughput: 0: 1767.0, 1: 1691.6. Samples: 5386466. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 16:07:28,803][19739] Avg episode reward: [(0, '233.080'), (1, '337.880')] +[2023-10-08 16:07:28,810][20836] Saving new best policy, reward=337.880! +[2023-10-08 16:07:29,128][20740] Saving new best policy, reward=233.080! +[2023-10-08 16:07:29,129][21195] Updated weights for policy 0, policy_version 10560 (0.0011) +[2023-10-08 16:07:31,099][21194] Updated weights for policy 1, policy_version 10470 (0.0010) +[2023-10-08 16:07:31,461][21194] Updated weights for policy 1, policy_version 10480 (0.0010) +[2023-10-08 16:07:31,823][21194] Updated weights for policy 1, policy_version 10490 (0.0010) +[2023-10-08 16:07:33,090][21195] Updated weights for policy 0, policy_version 10570 (0.0008) +[2023-10-08 16:07:33,467][21195] Updated weights for policy 0, policy_version 10580 (0.0008) +[2023-10-08 16:07:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 21561344. Throughput: 0: 1730.6, 1: 1718.2. Samples: 5401630. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 16:07:33,803][19739] Avg episode reward: [(0, '248.700'), (1, '346.490')] +[2023-10-08 16:07:33,804][20836] Saving new best policy, reward=346.490! +[2023-10-08 16:07:33,838][21195] Updated weights for policy 0, policy_version 10590 (0.0007) +[2023-10-08 16:07:33,906][20740] Saving new best policy, reward=248.700! +[2023-10-08 16:07:35,673][21194] Updated weights for policy 1, policy_version 10500 (0.0010) +[2023-10-08 16:07:36,033][21194] Updated weights for policy 1, policy_version 10510 (0.0008) +[2023-10-08 16:07:36,397][21194] Updated weights for policy 1, policy_version 10520 (0.0010) +[2023-10-08 16:07:37,824][21195] Updated weights for policy 0, policy_version 10600 (0.0008) +[2023-10-08 16:07:38,204][21195] Updated weights for policy 0, policy_version 10610 (0.0007) +[2023-10-08 16:07:38,579][21195] Updated weights for policy 0, policy_version 10620 (0.0007) +[2023-10-08 16:07:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 21659648. Throughput: 0: 1753.3, 1: 1704.9. Samples: 5417416. Policy #0 lag: (min: 25.0, avg: 32.9, max: 57.0) +[2023-10-08 16:07:38,803][19739] Avg episode reward: [(0, '253.180'), (1, '346.490')] +[2023-10-08 16:07:38,804][20740] Saving new best policy, reward=253.180! +[2023-10-08 16:07:40,169][21194] Updated weights for policy 1, policy_version 10530 (0.0007) +[2023-10-08 16:07:40,527][21194] Updated weights for policy 1, policy_version 10540 (0.0009) +[2023-10-08 16:07:40,901][21194] Updated weights for policy 1, policy_version 10550 (0.0008) +[2023-10-08 16:07:41,267][21194] Updated weights for policy 1, policy_version 10560 (0.0009) +[2023-10-08 16:07:42,658][21195] Updated weights for policy 0, policy_version 10630 (0.0008) +[2023-10-08 16:07:43,028][21195] Updated weights for policy 0, policy_version 10640 (0.0007) +[2023-10-08 16:07:43,398][21195] Updated weights for policy 0, policy_version 10650 (0.0008) +[2023-10-08 16:07:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 21725184. Throughput: 0: 1733.1, 1: 1727.7. Samples: 5438404. Policy #0 lag: (min: 19.0, avg: 27.4, max: 51.0) +[2023-10-08 16:07:43,803][19739] Avg episode reward: [(0, '252.680'), (1, '346.490')] +[2023-10-08 16:07:45,295][21194] Updated weights for policy 1, policy_version 10570 (0.0008) +[2023-10-08 16:07:45,667][21194] Updated weights for policy 1, policy_version 10580 (0.0008) +[2023-10-08 16:07:46,031][21194] Updated weights for policy 1, policy_version 10590 (0.0007) +[2023-10-08 16:07:47,331][21195] Updated weights for policy 0, policy_version 10660 (0.0009) +[2023-10-08 16:07:47,725][21195] Updated weights for policy 0, policy_version 10670 (0.0009) +[2023-10-08 16:07:48,098][21195] Updated weights for policy 0, policy_version 10680 (0.0007) +[2023-10-08 16:07:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 21790720. Throughput: 0: 1705.8, 1: 1714.9. Samples: 5452870. Policy #0 lag: (min: 19.0, avg: 27.4, max: 51.0) +[2023-10-08 16:07:48,803][19739] Avg episode reward: [(0, '251.020'), (1, '345.020')] +[2023-10-08 16:07:49,874][21194] Updated weights for policy 1, policy_version 10600 (0.0007) +[2023-10-08 16:07:50,237][21194] Updated weights for policy 1, policy_version 10610 (0.0008) +[2023-10-08 16:07:50,609][21194] Updated weights for policy 1, policy_version 10620 (0.0009) +[2023-10-08 16:07:51,985][21195] Updated weights for policy 0, policy_version 10690 (0.0008) +[2023-10-08 16:07:52,362][21195] Updated weights for policy 0, policy_version 10700 (0.0010) +[2023-10-08 16:07:52,725][21195] Updated weights for policy 0, policy_version 10710 (0.0010) +[2023-10-08 16:07:53,096][21195] Updated weights for policy 0, policy_version 10720 (0.0008) +[2023-10-08 16:07:53,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 21856256. Throughput: 0: 1735.7, 1: 1713.7. Samples: 5469512. Policy #0 lag: (min: 16.0, avg: 42.4, max: 48.0) +[2023-10-08 16:07:53,803][19739] Avg episode reward: [(0, '250.020'), (1, '378.110')] +[2023-10-08 16:07:53,804][20836] Saving new best policy, reward=378.110! +[2023-10-08 16:07:54,478][21194] Updated weights for policy 1, policy_version 10630 (0.0008) +[2023-10-08 16:07:54,844][21194] Updated weights for policy 1, policy_version 10640 (0.0007) +[2023-10-08 16:07:55,223][21194] Updated weights for policy 1, policy_version 10650 (0.0008) +[2023-10-08 16:07:57,124][21195] Updated weights for policy 0, policy_version 10730 (0.0009) +[2023-10-08 16:07:57,500][21195] Updated weights for policy 0, policy_version 10740 (0.0008) +[2023-10-08 16:07:57,864][21195] Updated weights for policy 0, policy_version 10750 (0.0008) +[2023-10-08 16:07:58,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 21921792. Throughput: 0: 1703.4, 1: 1746.1. Samples: 5489766. Policy #0 lag: (min: 16.0, avg: 42.4, max: 48.0) +[2023-10-08 16:07:58,804][19739] Avg episode reward: [(0, '244.500'), (1, '384.970')] +[2023-10-08 16:07:58,815][20836] Saving new best policy, reward=384.970! +[2023-10-08 16:07:59,125][21194] Updated weights for policy 1, policy_version 10660 (0.0010) +[2023-10-08 16:07:59,504][21194] Updated weights for policy 1, policy_version 10670 (0.0008) +[2023-10-08 16:07:59,873][21194] Updated weights for policy 1, policy_version 10680 (0.0008) +[2023-10-08 16:08:01,668][21195] Updated weights for policy 0, policy_version 10760 (0.0009) +[2023-10-08 16:08:02,038][21195] Updated weights for policy 0, policy_version 10770 (0.0011) +[2023-10-08 16:08:02,403][21195] Updated weights for policy 0, policy_version 10780 (0.0010) +[2023-10-08 16:08:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 21987328. Throughput: 0: 1711.4, 1: 1713.6. Samples: 5505004. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 16:08:03,803][19739] Avg episode reward: [(0, '244.500'), (1, '384.860')] +[2023-10-08 16:08:03,812][21194] Updated weights for policy 1, policy_version 10690 (0.0008) +[2023-10-08 16:08:04,185][21194] Updated weights for policy 1, policy_version 10700 (0.0007) +[2023-10-08 16:08:04,556][21194] Updated weights for policy 1, policy_version 10710 (0.0007) +[2023-10-08 16:08:04,936][21194] Updated weights for policy 1, policy_version 10720 (0.0007) +[2023-10-08 16:08:06,378][21195] Updated weights for policy 0, policy_version 10790 (0.0007) +[2023-10-08 16:08:06,746][21195] Updated weights for policy 0, policy_version 10800 (0.0007) +[2023-10-08 16:08:07,117][21195] Updated weights for policy 0, policy_version 10810 (0.0007) +[2023-10-08 16:08:08,802][19739] Fps is (10 sec: 13107.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22052864. Throughput: 0: 1718.3, 1: 1739.1. Samples: 5521166. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 16:08:08,803][19739] Avg episode reward: [(0, '251.960'), (1, '384.860')] +[2023-10-08 16:08:08,821][21194] Updated weights for policy 1, policy_version 10730 (0.0009) +[2023-10-08 16:08:09,192][21194] Updated weights for policy 1, policy_version 10740 (0.0009) +[2023-10-08 16:08:09,553][21194] Updated weights for policy 1, policy_version 10750 (0.0009) +[2023-10-08 16:08:11,144][21195] Updated weights for policy 0, policy_version 10820 (0.0007) +[2023-10-08 16:08:11,521][21195] Updated weights for policy 0, policy_version 10830 (0.0009) +[2023-10-08 16:08:11,880][21195] Updated weights for policy 0, policy_version 10840 (0.0010) +[2023-10-08 16:08:13,422][21194] Updated weights for policy 1, policy_version 10760 (0.0007) +[2023-10-08 16:08:13,790][21194] Updated weights for policy 1, policy_version 10770 (0.0008) +[2023-10-08 16:08:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22118400. Throughput: 0: 1699.6, 1: 1752.7. Samples: 5541822. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 16:08:13,804][19739] Avg episode reward: [(0, '254.800'), (1, '396.600')] +[2023-10-08 16:08:13,817][20740] Saving new best policy, reward=254.800! +[2023-10-08 16:08:14,156][21194] Updated weights for policy 1, policy_version 10780 (0.0007) +[2023-10-08 16:08:14,299][20836] Saving new best policy, reward=396.600! +[2023-10-08 16:08:15,782][21195] Updated weights for policy 0, policy_version 10850 (0.0010) +[2023-10-08 16:08:16,152][21195] Updated weights for policy 0, policy_version 10860 (0.0008) +[2023-10-08 16:08:16,524][21195] Updated weights for policy 0, policy_version 10870 (0.0008) +[2023-10-08 16:08:16,900][21195] Updated weights for policy 0, policy_version 10880 (0.0008) +[2023-10-08 16:08:18,076][21194] Updated weights for policy 1, policy_version 10790 (0.0009) +[2023-10-08 16:08:18,442][21194] Updated weights for policy 1, policy_version 10800 (0.0010) +[2023-10-08 16:08:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 22183936. Throughput: 0: 1725.5, 1: 1729.7. Samples: 5557114. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 16:08:18,803][19739] Avg episode reward: [(0, '254.800'), (1, '390.230')] +[2023-10-08 16:08:18,805][21194] Updated weights for policy 1, policy_version 10810 (0.0007) +[2023-10-08 16:08:20,794][21195] Updated weights for policy 0, policy_version 10890 (0.0009) +[2023-10-08 16:08:21,157][21195] Updated weights for policy 0, policy_version 10900 (0.0009) +[2023-10-08 16:08:21,534][21195] Updated weights for policy 0, policy_version 10910 (0.0007) +[2023-10-08 16:08:22,841][21194] Updated weights for policy 1, policy_version 10820 (0.0009) +[2023-10-08 16:08:23,203][21194] Updated weights for policy 1, policy_version 10830 (0.0010) +[2023-10-08 16:08:23,569][21194] Updated weights for policy 1, policy_version 10840 (0.0007) +[2023-10-08 16:08:23,802][19739] Fps is (10 sec: 13107.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22249472. Throughput: 0: 1699.6, 1: 1744.8. Samples: 5572414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 16:08:23,803][19739] Avg episode reward: [(0, '264.370'), (1, '390.230')] +[2023-10-08 16:08:23,804][20740] Saving new best policy, reward=264.370! +[2023-10-08 16:08:25,404][21195] Updated weights for policy 0, policy_version 10920 (0.0008) +[2023-10-08 16:08:25,767][21195] Updated weights for policy 0, policy_version 10930 (0.0010) +[2023-10-08 16:08:26,139][21195] Updated weights for policy 0, policy_version 10940 (0.0010) +[2023-10-08 16:08:27,541][21194] Updated weights for policy 1, policy_version 10850 (0.0008) +[2023-10-08 16:08:27,908][21194] Updated weights for policy 1, policy_version 10860 (0.0007) +[2023-10-08 16:08:28,277][21194] Updated weights for policy 1, policy_version 10870 (0.0008) +[2023-10-08 16:08:28,643][21194] Updated weights for policy 1, policy_version 10880 (0.0008) +[2023-10-08 16:08:28,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 22347776. Throughput: 0: 1716.4, 1: 1730.8. Samples: 5593526. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 16:08:28,803][19739] Avg episode reward: [(0, '266.200'), (1, '395.200')] +[2023-10-08 16:08:28,814][20740] Saving new best policy, reward=266.200! +[2023-10-08 16:08:30,143][21195] Updated weights for policy 0, policy_version 10950 (0.0008) +[2023-10-08 16:08:30,506][21195] Updated weights for policy 0, policy_version 10960 (0.0008) +[2023-10-08 16:08:30,871][21195] Updated weights for policy 0, policy_version 10970 (0.0010) +[2023-10-08 16:08:32,629][21194] Updated weights for policy 1, policy_version 10890 (0.0010) +[2023-10-08 16:08:32,998][21194] Updated weights for policy 1, policy_version 10900 (0.0010) +[2023-10-08 16:08:33,376][21194] Updated weights for policy 1, policy_version 10910 (0.0010) +[2023-10-08 16:08:33,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 22413312. Throughput: 0: 1744.4, 1: 1738.9. Samples: 5609620. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 16:08:33,804][19739] Avg episode reward: [(0, '263.560'), (1, '411.590')] +[2023-10-08 16:08:33,806][20836] Saving new best policy, reward=411.590! +[2023-10-08 16:08:34,702][21195] Updated weights for policy 0, policy_version 10980 (0.0008) +[2023-10-08 16:08:35,087][21195] Updated weights for policy 0, policy_version 10990 (0.0007) +[2023-10-08 16:08:35,461][21195] Updated weights for policy 0, policy_version 11000 (0.0008) +[2023-10-08 16:08:37,517][21194] Updated weights for policy 1, policy_version 10920 (0.0008) +[2023-10-08 16:08:37,885][21194] Updated weights for policy 1, policy_version 10930 (0.0009) +[2023-10-08 16:08:38,259][21194] Updated weights for policy 1, policy_version 10940 (0.0009) +[2023-10-08 16:08:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22478848. Throughput: 0: 1711.9, 1: 1740.1. Samples: 5624852. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 16:08:38,803][19739] Avg episode reward: [(0, '263.560'), (1, '411.590')] +[2023-10-08 16:08:39,451][21195] Updated weights for policy 0, policy_version 11010 (0.0008) +[2023-10-08 16:08:39,810][21195] Updated weights for policy 0, policy_version 11020 (0.0007) +[2023-10-08 16:08:40,177][21195] Updated weights for policy 0, policy_version 11030 (0.0009) +[2023-10-08 16:08:40,546][21195] Updated weights for policy 0, policy_version 11040 (0.0007) +[2023-10-08 16:08:42,007][21194] Updated weights for policy 1, policy_version 10950 (0.0008) +[2023-10-08 16:08:42,374][21194] Updated weights for policy 1, policy_version 10960 (0.0009) +[2023-10-08 16:08:42,739][21194] Updated weights for policy 1, policy_version 10970 (0.0007) +[2023-10-08 16:08:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22544384. Throughput: 0: 1741.9, 1: 1706.9. Samples: 5644960. Policy #0 lag: (min: 26.0, avg: 27.0, max: 42.0) +[2023-10-08 16:08:43,803][19739] Avg episode reward: [(0, '264.020'), (1, '411.590')] +[2023-10-08 16:08:44,505][21195] Updated weights for policy 0, policy_version 11050 (0.0012) +[2023-10-08 16:08:44,867][21195] Updated weights for policy 0, policy_version 11060 (0.0010) +[2023-10-08 16:08:45,246][21195] Updated weights for policy 0, policy_version 11070 (0.0010) +[2023-10-08 16:08:46,565][21194] Updated weights for policy 1, policy_version 10980 (0.0007) +[2023-10-08 16:08:46,938][21194] Updated weights for policy 1, policy_version 10990 (0.0007) +[2023-10-08 16:08:47,308][21194] Updated weights for policy 1, policy_version 11000 (0.0008) +[2023-10-08 16:08:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22609920. Throughput: 0: 1738.3, 1: 1746.3. Samples: 5661812. Policy #0 lag: (min: 26.0, avg: 27.0, max: 42.0) +[2023-10-08 16:08:48,803][19739] Avg episode reward: [(0, '263.990'), (1, '410.190')] +[2023-10-08 16:08:49,232][21195] Updated weights for policy 0, policy_version 11080 (0.0011) +[2023-10-08 16:08:49,600][21195] Updated weights for policy 0, policy_version 11090 (0.0010) +[2023-10-08 16:08:49,978][21195] Updated weights for policy 0, policy_version 11100 (0.0010) +[2023-10-08 16:08:51,257][21194] Updated weights for policy 1, policy_version 11010 (0.0007) +[2023-10-08 16:08:51,614][21194] Updated weights for policy 1, policy_version 11020 (0.0008) +[2023-10-08 16:08:51,976][21194] Updated weights for policy 1, policy_version 11030 (0.0008) +[2023-10-08 16:08:52,348][21194] Updated weights for policy 1, policy_version 11040 (0.0008) +[2023-10-08 16:08:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22675456. Throughput: 0: 1725.0, 1: 1724.1. Samples: 5676376. Policy #0 lag: (min: 0.0, avg: 20.5, max: 32.0) +[2023-10-08 16:08:53,804][19739] Avg episode reward: [(0, '267.200'), (1, '403.490')] +[2023-10-08 16:08:53,876][21195] Updated weights for policy 0, policy_version 11110 (0.0007) +[2023-10-08 16:08:54,244][21195] Updated weights for policy 0, policy_version 11120 (0.0009) +[2023-10-08 16:08:54,614][21195] Updated weights for policy 0, policy_version 11130 (0.0007) +[2023-10-08 16:08:54,829][20740] Saving new best policy, reward=267.200! +[2023-10-08 16:08:56,267][21194] Updated weights for policy 1, policy_version 11050 (0.0009) +[2023-10-08 16:08:56,632][21194] Updated weights for policy 1, policy_version 11060 (0.0007) +[2023-10-08 16:08:56,999][21194] Updated weights for policy 1, policy_version 11070 (0.0007) +[2023-10-08 16:08:58,541][21195] Updated weights for policy 0, policy_version 11140 (0.0008) +[2023-10-08 16:08:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 22740992. Throughput: 0: 1743.1, 1: 1711.2. Samples: 5697266. Policy #0 lag: (min: 0.0, avg: 20.5, max: 32.0) +[2023-10-08 16:08:58,803][19739] Avg episode reward: [(0, '274.200'), (1, '403.490')] +[2023-10-08 16:08:58,915][21195] Updated weights for policy 0, policy_version 11150 (0.0009) +[2023-10-08 16:08:59,286][21195] Updated weights for policy 0, policy_version 11160 (0.0007) +[2023-10-08 16:08:59,585][20740] Saving new best policy, reward=274.200! +[2023-10-08 16:09:00,990][21194] Updated weights for policy 1, policy_version 11080 (0.0008) +[2023-10-08 16:09:01,356][21194] Updated weights for policy 1, policy_version 11090 (0.0009) +[2023-10-08 16:09:01,721][21194] Updated weights for policy 1, policy_version 11100 (0.0009) +[2023-10-08 16:09:03,319][21195] Updated weights for policy 0, policy_version 11170 (0.0007) +[2023-10-08 16:09:03,689][21195] Updated weights for policy 0, policy_version 11180 (0.0008) +[2023-10-08 16:09:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 22806528. Throughput: 0: 1729.9, 1: 1737.0. Samples: 5713126. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:09:03,803][19739] Avg episode reward: [(0, '276.410'), (1, '403.490')] +[2023-10-08 16:09:04,054][21195] Updated weights for policy 0, policy_version 11190 (0.0007) +[2023-10-08 16:09:04,423][20740] Saving new best policy, reward=276.410! +[2023-10-08 16:09:04,429][21195] Updated weights for policy 0, policy_version 11200 (0.0007) +[2023-10-08 16:09:05,500][21194] Updated weights for policy 1, policy_version 11110 (0.0009) +[2023-10-08 16:09:05,863][21194] Updated weights for policy 1, policy_version 11120 (0.0009) +[2023-10-08 16:09:06,232][21194] Updated weights for policy 1, policy_version 11130 (0.0010) +[2023-10-08 16:09:08,224][21195] Updated weights for policy 0, policy_version 11210 (0.0007) +[2023-10-08 16:09:08,596][21195] Updated weights for policy 0, policy_version 11220 (0.0007) +[2023-10-08 16:09:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 22872064. Throughput: 0: 1746.4, 1: 1720.1. Samples: 5728408. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:09:08,803][19739] Avg episode reward: [(0, '276.410'), (1, '403.730')] +[2023-10-08 16:09:08,963][21195] Updated weights for policy 0, policy_version 11230 (0.0007) +[2023-10-08 16:09:10,068][21194] Updated weights for policy 1, policy_version 11140 (0.0008) +[2023-10-08 16:09:10,428][21194] Updated weights for policy 1, policy_version 11150 (0.0009) +[2023-10-08 16:09:10,791][21194] Updated weights for policy 1, policy_version 11160 (0.0011) +[2023-10-08 16:09:12,759][21195] Updated weights for policy 0, policy_version 11240 (0.0008) +[2023-10-08 16:09:13,131][21195] Updated weights for policy 0, policy_version 11250 (0.0008) +[2023-10-08 16:09:13,513][21195] Updated weights for policy 0, policy_version 11260 (0.0008) +[2023-10-08 16:09:13,803][19739] Fps is (10 sec: 16383.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 22970368. Throughput: 0: 1737.2, 1: 1728.7. Samples: 5749496. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:09:13,804][19739] Avg episode reward: [(0, '278.210'), (1, '403.730')] +[2023-10-08 16:09:13,817][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000011264_11534336.pth... +[2023-10-08 16:09:13,818][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000011168_11436032.pth... +[2023-10-08 16:09:13,848][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000009632_9863168.pth +[2023-10-08 16:09:13,851][20740] Saving new best policy, reward=278.210! +[2023-10-08 16:09:13,857][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000009568_9797632.pth +[2023-10-08 16:09:14,862][21194] Updated weights for policy 1, policy_version 11170 (0.0009) +[2023-10-08 16:09:15,230][21194] Updated weights for policy 1, policy_version 11180 (0.0010) +[2023-10-08 16:09:15,606][21194] Updated weights for policy 1, policy_version 11190 (0.0010) +[2023-10-08 16:09:15,973][21194] Updated weights for policy 1, policy_version 11200 (0.0009) +[2023-10-08 16:09:17,269][21195] Updated weights for policy 0, policy_version 11270 (0.0007) +[2023-10-08 16:09:17,649][21195] Updated weights for policy 0, policy_version 11280 (0.0009) +[2023-10-08 16:09:18,014][21195] Updated weights for policy 0, policy_version 11290 (0.0010) +[2023-10-08 16:09:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 23035904. Throughput: 0: 1711.5, 1: 1716.5. Samples: 5763876. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:09:18,803][19739] Avg episode reward: [(0, '277.830'), (1, '408.200')] +[2023-10-08 16:09:19,994][21194] Updated weights for policy 1, policy_version 11210 (0.0007) +[2023-10-08 16:09:20,355][21194] Updated weights for policy 1, policy_version 11220 (0.0007) +[2023-10-08 16:09:20,725][21194] Updated weights for policy 1, policy_version 11230 (0.0008) +[2023-10-08 16:09:22,111][21195] Updated weights for policy 0, policy_version 11300 (0.0008) +[2023-10-08 16:09:22,506][21195] Updated weights for policy 0, policy_version 11310 (0.0008) +[2023-10-08 16:09:22,868][21195] Updated weights for policy 0, policy_version 11320 (0.0008) +[2023-10-08 16:09:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 23101440. Throughput: 0: 1744.3, 1: 1713.7. Samples: 5780464. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:09:23,804][19739] Avg episode reward: [(0, '280.410'), (1, '408.200')] +[2023-10-08 16:09:23,805][20740] Saving new best policy, reward=280.410! +[2023-10-08 16:09:24,737][21194] Updated weights for policy 1, policy_version 11240 (0.0009) +[2023-10-08 16:09:25,108][21194] Updated weights for policy 1, policy_version 11250 (0.0009) +[2023-10-08 16:09:25,476][21194] Updated weights for policy 1, policy_version 11260 (0.0008) +[2023-10-08 16:09:26,766][21195] Updated weights for policy 0, policy_version 11330 (0.0009) +[2023-10-08 16:09:27,137][21195] Updated weights for policy 0, policy_version 11340 (0.0009) +[2023-10-08 16:09:27,508][21195] Updated weights for policy 0, policy_version 11350 (0.0007) +[2023-10-08 16:09:27,881][21195] Updated weights for policy 0, policy_version 11360 (0.0007) +[2023-10-08 16:09:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 23166976. Throughput: 0: 1712.3, 1: 1745.9. Samples: 5800580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:09:28,803][19739] Avg episode reward: [(0, '280.410'), (1, '400.740')] +[2023-10-08 16:09:29,366][21194] Updated weights for policy 1, policy_version 11270 (0.0009) +[2023-10-08 16:09:29,722][21194] Updated weights for policy 1, policy_version 11280 (0.0007) +[2023-10-08 16:09:30,092][21194] Updated weights for policy 1, policy_version 11290 (0.0007) +[2023-10-08 16:09:31,867][21195] Updated weights for policy 0, policy_version 11370 (0.0009) +[2023-10-08 16:09:32,233][21195] Updated weights for policy 0, policy_version 11380 (0.0008) +[2023-10-08 16:09:32,605][21195] Updated weights for policy 0, policy_version 11390 (0.0008) +[2023-10-08 16:09:33,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 23232512. Throughput: 0: 1716.5, 1: 1706.5. Samples: 5815848. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:09:33,803][19739] Avg episode reward: [(0, '281.830'), (1, '397.920')] +[2023-10-08 16:09:33,804][20740] Saving new best policy, reward=281.830! +[2023-10-08 16:09:34,220][21194] Updated weights for policy 1, policy_version 11300 (0.0009) +[2023-10-08 16:09:34,590][21194] Updated weights for policy 1, policy_version 11310 (0.0008) +[2023-10-08 16:09:34,956][21194] Updated weights for policy 1, policy_version 11320 (0.0008) +[2023-10-08 16:09:36,650][21195] Updated weights for policy 0, policy_version 11400 (0.0010) +[2023-10-08 16:09:37,023][21195] Updated weights for policy 0, policy_version 11410 (0.0010) +[2023-10-08 16:09:37,389][21195] Updated weights for policy 0, policy_version 11420 (0.0009) +[2023-10-08 16:09:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23298048. Throughput: 0: 1733.8, 1: 1723.7. Samples: 5831960. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:09:38,803][19739] Avg episode reward: [(0, '281.080'), (1, '397.920')] +[2023-10-08 16:09:38,835][21194] Updated weights for policy 1, policy_version 11330 (0.0009) +[2023-10-08 16:09:39,204][21194] Updated weights for policy 1, policy_version 11340 (0.0011) +[2023-10-08 16:09:39,578][21194] Updated weights for policy 1, policy_version 11350 (0.0009) +[2023-10-08 16:09:39,942][21194] Updated weights for policy 1, policy_version 11360 (0.0008) +[2023-10-08 16:09:41,359][21195] Updated weights for policy 0, policy_version 11430 (0.0008) +[2023-10-08 16:09:41,731][21195] Updated weights for policy 0, policy_version 11440 (0.0007) +[2023-10-08 16:09:42,090][21195] Updated weights for policy 0, policy_version 11450 (0.0007) +[2023-10-08 16:09:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23363584. Throughput: 0: 1712.1, 1: 1733.4. Samples: 5852314. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:09:43,804][19739] Avg episode reward: [(0, '273.690'), (1, '397.920')] +[2023-10-08 16:09:43,883][21194] Updated weights for policy 1, policy_version 11370 (0.0009) +[2023-10-08 16:09:44,244][21194] Updated weights for policy 1, policy_version 11380 (0.0010) +[2023-10-08 16:09:44,610][21194] Updated weights for policy 1, policy_version 11390 (0.0010) +[2023-10-08 16:09:46,163][21195] Updated weights for policy 0, policy_version 11460 (0.0007) +[2023-10-08 16:09:46,534][21195] Updated weights for policy 0, policy_version 11470 (0.0007) +[2023-10-08 16:09:46,913][21195] Updated weights for policy 0, policy_version 11480 (0.0007) +[2023-10-08 16:09:48,614][21194] Updated weights for policy 1, policy_version 11400 (0.0008) +[2023-10-08 16:09:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23429120. Throughput: 0: 1724.2, 1: 1707.8. Samples: 5867566. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:09:48,803][19739] Avg episode reward: [(0, '243.900'), (1, '397.920')] +[2023-10-08 16:09:48,981][21194] Updated weights for policy 1, policy_version 11410 (0.0009) +[2023-10-08 16:09:49,350][21194] Updated weights for policy 1, policy_version 11420 (0.0008) +[2023-10-08 16:09:50,829][21195] Updated weights for policy 0, policy_version 11490 (0.0007) +[2023-10-08 16:09:51,201][21195] Updated weights for policy 0, policy_version 11500 (0.0008) +[2023-10-08 16:09:51,577][21195] Updated weights for policy 0, policy_version 11510 (0.0007) +[2023-10-08 16:09:51,945][21195] Updated weights for policy 0, policy_version 11520 (0.0009) +[2023-10-08 16:09:53,291][21194] Updated weights for policy 1, policy_version 11430 (0.0009) +[2023-10-08 16:09:53,653][21194] Updated weights for policy 1, policy_version 11440 (0.0009) +[2023-10-08 16:09:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 23494656. Throughput: 0: 1715.9, 1: 1723.6. Samples: 5883184. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:09:53,803][19739] Avg episode reward: [(0, '243.900'), (1, '386.970')] +[2023-10-08 16:09:54,026][21194] Updated weights for policy 1, policy_version 11450 (0.0008) +[2023-10-08 16:09:55,823][21195] Updated weights for policy 0, policy_version 11530 (0.0009) +[2023-10-08 16:09:56,200][21195] Updated weights for policy 0, policy_version 11540 (0.0010) +[2023-10-08 16:09:56,568][21195] Updated weights for policy 0, policy_version 11550 (0.0010) +[2023-10-08 16:09:57,957][21194] Updated weights for policy 1, policy_version 11460 (0.0009) +[2023-10-08 16:09:58,322][21194] Updated weights for policy 1, policy_version 11470 (0.0008) +[2023-10-08 16:09:58,687][21194] Updated weights for policy 1, policy_version 11480 (0.0008) +[2023-10-08 16:09:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23560192. Throughput: 0: 1721.1, 1: 1719.7. Samples: 5904330. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 16:09:58,803][19739] Avg episode reward: [(0, '246.970'), (1, '387.190')] +[2023-10-08 16:10:00,356][21195] Updated weights for policy 0, policy_version 11560 (0.0009) +[2023-10-08 16:10:00,726][21195] Updated weights for policy 0, policy_version 11570 (0.0008) +[2023-10-08 16:10:01,100][21195] Updated weights for policy 0, policy_version 11580 (0.0010) +[2023-10-08 16:10:02,794][21194] Updated weights for policy 1, policy_version 11490 (0.0008) +[2023-10-08 16:10:03,161][21194] Updated weights for policy 1, policy_version 11500 (0.0009) +[2023-10-08 16:10:03,535][21194] Updated weights for policy 1, policy_version 11510 (0.0007) +[2023-10-08 16:10:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23625728. Throughput: 0: 1743.2, 1: 1722.8. Samples: 5919844. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 16:10:03,803][19739] Avg episode reward: [(0, '246.970'), (1, '387.190')] +[2023-10-08 16:10:03,900][21194] Updated weights for policy 1, policy_version 11520 (0.0009) +[2023-10-08 16:10:04,969][21195] Updated weights for policy 0, policy_version 11590 (0.0009) +[2023-10-08 16:10:05,348][21195] Updated weights for policy 0, policy_version 11600 (0.0009) +[2023-10-08 16:10:05,711][21195] Updated weights for policy 0, policy_version 11610 (0.0010) +[2023-10-08 16:10:07,827][21194] Updated weights for policy 1, policy_version 11530 (0.0009) +[2023-10-08 16:10:08,186][21194] Updated weights for policy 1, policy_version 11540 (0.0010) +[2023-10-08 16:10:08,550][21194] Updated weights for policy 1, policy_version 11550 (0.0011) +[2023-10-08 16:10:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 23724032. Throughput: 0: 1710.1, 1: 1728.7. Samples: 5935210. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 16:10:08,803][19739] Avg episode reward: [(0, '246.970'), (1, '387.190')] +[2023-10-08 16:10:09,591][21195] Updated weights for policy 0, policy_version 11620 (0.0010) +[2023-10-08 16:10:09,975][21195] Updated weights for policy 0, policy_version 11630 (0.0007) +[2023-10-08 16:10:10,339][21195] Updated weights for policy 0, policy_version 11640 (0.0009) +[2023-10-08 16:10:12,748][21194] Updated weights for policy 1, policy_version 11560 (0.0011) +[2023-10-08 16:10:13,113][21194] Updated weights for policy 1, policy_version 11570 (0.0009) +[2023-10-08 16:10:13,476][21194] Updated weights for policy 1, policy_version 11580 (0.0008) +[2023-10-08 16:10:13,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 23789568. Throughput: 0: 1741.9, 1: 1711.0. Samples: 5955962. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:10:13,804][19739] Avg episode reward: [(0, '245.830'), (1, '389.050')] +[2023-10-08 16:10:14,193][21195] Updated weights for policy 0, policy_version 11650 (0.0008) +[2023-10-08 16:10:14,553][21195] Updated weights for policy 0, policy_version 11660 (0.0008) +[2023-10-08 16:10:14,923][21195] Updated weights for policy 0, policy_version 11670 (0.0007) +[2023-10-08 16:10:15,292][21195] Updated weights for policy 0, policy_version 11680 (0.0009) +[2023-10-08 16:10:17,083][21194] Updated weights for policy 1, policy_version 11590 (0.0010) +[2023-10-08 16:10:17,453][21194] Updated weights for policy 1, policy_version 11600 (0.0009) +[2023-10-08 16:10:17,819][21194] Updated weights for policy 1, policy_version 11610 (0.0010) +[2023-10-08 16:10:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23855104. Throughput: 0: 1745.9, 1: 1728.2. Samples: 5972184. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:10:18,803][19739] Avg episode reward: [(0, '237.410'), (1, '389.050')] +[2023-10-08 16:10:19,079][21195] Updated weights for policy 0, policy_version 11690 (0.0010) +[2023-10-08 16:10:19,450][21195] Updated weights for policy 0, policy_version 11700 (0.0009) +[2023-10-08 16:10:19,818][21195] Updated weights for policy 0, policy_version 11710 (0.0007) +[2023-10-08 16:10:21,943][21194] Updated weights for policy 1, policy_version 11620 (0.0009) +[2023-10-08 16:10:22,313][21194] Updated weights for policy 1, policy_version 11630 (0.0010) +[2023-10-08 16:10:22,673][21194] Updated weights for policy 1, policy_version 11640 (0.0008) +[2023-10-08 16:10:23,666][21195] Updated weights for policy 0, policy_version 11720 (0.0007) +[2023-10-08 16:10:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 23920640. Throughput: 0: 1729.7, 1: 1723.3. Samples: 5987346. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:10:23,803][19739] Avg episode reward: [(0, '241.290'), (1, '383.920')] +[2023-10-08 16:10:24,049][21195] Updated weights for policy 0, policy_version 11730 (0.0009) +[2023-10-08 16:10:24,431][21195] Updated weights for policy 0, policy_version 11740 (0.0008) +[2023-10-08 16:10:26,752][21194] Updated weights for policy 1, policy_version 11650 (0.0007) +[2023-10-08 16:10:27,117][21194] Updated weights for policy 1, policy_version 11660 (0.0008) +[2023-10-08 16:10:27,490][21194] Updated weights for policy 1, policy_version 11670 (0.0008) +[2023-10-08 16:10:27,852][21194] Updated weights for policy 1, policy_version 11680 (0.0008) +[2023-10-08 16:10:28,399][21195] Updated weights for policy 0, policy_version 11750 (0.0009) +[2023-10-08 16:10:28,767][21195] Updated weights for policy 0, policy_version 11760 (0.0008) +[2023-10-08 16:10:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 23986176. Throughput: 0: 1751.1, 1: 1696.9. Samples: 6007472. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:10:28,803][19739] Avg episode reward: [(0, '242.210'), (1, '383.920')] +[2023-10-08 16:10:29,141][21195] Updated weights for policy 0, policy_version 11770 (0.0008) +[2023-10-08 16:10:31,774][21194] Updated weights for policy 1, policy_version 11690 (0.0008) +[2023-10-08 16:10:32,128][21194] Updated weights for policy 1, policy_version 11700 (0.0009) +[2023-10-08 16:10:32,501][21194] Updated weights for policy 1, policy_version 11710 (0.0008) +[2023-10-08 16:10:33,130][21195] Updated weights for policy 0, policy_version 11780 (0.0008) +[2023-10-08 16:10:33,494][21195] Updated weights for policy 0, policy_version 11790 (0.0008) +[2023-10-08 16:10:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24051712. Throughput: 0: 1735.9, 1: 1725.4. Samples: 6023324. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:10:33,803][19739] Avg episode reward: [(0, '242.210'), (1, '383.920')] +[2023-10-08 16:10:33,866][21195] Updated weights for policy 0, policy_version 11800 (0.0008) +[2023-10-08 16:10:36,332][21194] Updated weights for policy 1, policy_version 11720 (0.0009) +[2023-10-08 16:10:36,712][21194] Updated weights for policy 1, policy_version 11730 (0.0008) +[2023-10-08 16:10:37,081][21194] Updated weights for policy 1, policy_version 11740 (0.0008) +[2023-10-08 16:10:37,710][21195] Updated weights for policy 0, policy_version 11810 (0.0009) +[2023-10-08 16:10:38,078][21195] Updated weights for policy 0, policy_version 11820 (0.0010) +[2023-10-08 16:10:38,444][21195] Updated weights for policy 0, policy_version 11830 (0.0009) +[2023-10-08 16:10:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24117248. Throughput: 0: 1750.3, 1: 1705.7. Samples: 6038704. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:10:38,803][19739] Avg episode reward: [(0, '239.580'), (1, '383.420')] +[2023-10-08 16:10:38,812][21195] Updated weights for policy 0, policy_version 11840 (0.0008) +[2023-10-08 16:10:40,996][21194] Updated weights for policy 1, policy_version 11750 (0.0007) +[2023-10-08 16:10:41,360][21194] Updated weights for policy 1, policy_version 11760 (0.0008) +[2023-10-08 16:10:41,729][21194] Updated weights for policy 1, policy_version 11770 (0.0009) +[2023-10-08 16:10:42,729][21195] Updated weights for policy 0, policy_version 11850 (0.0007) +[2023-10-08 16:10:43,097][21195] Updated weights for policy 0, policy_version 11860 (0.0008) +[2023-10-08 16:10:43,471][21195] Updated weights for policy 0, policy_version 11870 (0.0010) +[2023-10-08 16:10:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 24215552. Throughput: 0: 1738.9, 1: 1705.5. Samples: 6059328. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:10:43,803][19739] Avg episode reward: [(0, '229.990'), (1, '383.420')] +[2023-10-08 16:10:45,567][21194] Updated weights for policy 1, policy_version 11780 (0.0010) +[2023-10-08 16:10:45,941][21194] Updated weights for policy 1, policy_version 11790 (0.0009) +[2023-10-08 16:10:46,306][21194] Updated weights for policy 1, policy_version 11800 (0.0011) +[2023-10-08 16:10:47,534][21195] Updated weights for policy 0, policy_version 11880 (0.0010) +[2023-10-08 16:10:47,894][21195] Updated weights for policy 0, policy_version 11890 (0.0008) +[2023-10-08 16:10:48,267][21195] Updated weights for policy 0, policy_version 11900 (0.0009) +[2023-10-08 16:10:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 24281088. Throughput: 0: 1718.3, 1: 1721.6. Samples: 6074638. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:10:48,803][19739] Avg episode reward: [(0, '230.840'), (1, '383.420')] +[2023-10-08 16:10:50,301][21194] Updated weights for policy 1, policy_version 11810 (0.0011) +[2023-10-08 16:10:50,663][21194] Updated weights for policy 1, policy_version 11820 (0.0008) +[2023-10-08 16:10:51,030][21194] Updated weights for policy 1, policy_version 11830 (0.0008) +[2023-10-08 16:10:51,401][21194] Updated weights for policy 1, policy_version 11840 (0.0008) +[2023-10-08 16:10:52,122][21195] Updated weights for policy 0, policy_version 11910 (0.0010) +[2023-10-08 16:10:52,491][21195] Updated weights for policy 0, policy_version 11920 (0.0010) +[2023-10-08 16:10:52,869][21195] Updated weights for policy 0, policy_version 11930 (0.0010) +[2023-10-08 16:10:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 24346624. Throughput: 0: 1754.8, 1: 1701.7. Samples: 6090752. Policy #0 lag: (min: 1.0, avg: 14.1, max: 33.0) +[2023-10-08 16:10:53,803][19739] Avg episode reward: [(0, '219.920'), (1, '389.970')] +[2023-10-08 16:10:55,259][21194] Updated weights for policy 1, policy_version 11850 (0.0009) +[2023-10-08 16:10:55,633][21194] Updated weights for policy 1, policy_version 11860 (0.0010) +[2023-10-08 16:10:55,996][21194] Updated weights for policy 1, policy_version 11870 (0.0009) +[2023-10-08 16:10:56,945][21195] Updated weights for policy 0, policy_version 11940 (0.0009) +[2023-10-08 16:10:57,334][21195] Updated weights for policy 0, policy_version 11950 (0.0009) +[2023-10-08 16:10:57,710][21195] Updated weights for policy 0, policy_version 11960 (0.0009) +[2023-10-08 16:10:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 24412160. Throughput: 0: 1727.1, 1: 1720.9. Samples: 6111122. Policy #0 lag: (min: 1.0, avg: 14.1, max: 33.0) +[2023-10-08 16:10:58,804][19739] Avg episode reward: [(0, '220.050'), (1, '389.210')] +[2023-10-08 16:11:00,191][21194] Updated weights for policy 1, policy_version 11880 (0.0008) +[2023-10-08 16:11:00,558][21194] Updated weights for policy 1, policy_version 11890 (0.0008) +[2023-10-08 16:11:00,937][21194] Updated weights for policy 1, policy_version 11900 (0.0009) +[2023-10-08 16:11:01,524][21195] Updated weights for policy 0, policy_version 11970 (0.0010) +[2023-10-08 16:11:01,886][21195] Updated weights for policy 0, policy_version 11980 (0.0008) +[2023-10-08 16:11:02,257][21195] Updated weights for policy 0, policy_version 11990 (0.0011) +[2023-10-08 16:11:02,624][21195] Updated weights for policy 0, policy_version 12000 (0.0007) +[2023-10-08 16:11:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 24477696. Throughput: 0: 1725.1, 1: 1704.4. Samples: 6126510. Policy #0 lag: (min: 31.0, avg: 31.7, max: 49.0) +[2023-10-08 16:11:03,803][19739] Avg episode reward: [(0, '228.840'), (1, '389.210')] +[2023-10-08 16:11:04,959][21194] Updated weights for policy 1, policy_version 11910 (0.0010) +[2023-10-08 16:11:05,329][21194] Updated weights for policy 1, policy_version 11920 (0.0010) +[2023-10-08 16:11:05,691][21194] Updated weights for policy 1, policy_version 11930 (0.0010) +[2023-10-08 16:11:06,461][21195] Updated weights for policy 0, policy_version 12010 (0.0010) +[2023-10-08 16:11:06,837][21195] Updated weights for policy 0, policy_version 12020 (0.0007) +[2023-10-08 16:11:07,217][21195] Updated weights for policy 0, policy_version 12030 (0.0007) +[2023-10-08 16:11:08,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 24543232. Throughput: 0: 1739.2, 1: 1706.3. Samples: 6142394. Policy #0 lag: (min: 31.0, avg: 31.7, max: 49.0) +[2023-10-08 16:11:08,803][19739] Avg episode reward: [(0, '239.570'), (1, '396.740')] +[2023-10-08 16:11:09,705][21194] Updated weights for policy 1, policy_version 11940 (0.0008) +[2023-10-08 16:11:10,072][21194] Updated weights for policy 1, policy_version 11950 (0.0007) +[2023-10-08 16:11:10,449][21194] Updated weights for policy 1, policy_version 11960 (0.0009) +[2023-10-08 16:11:11,038][21195] Updated weights for policy 0, policy_version 12040 (0.0008) +[2023-10-08 16:11:11,410][21195] Updated weights for policy 0, policy_version 12050 (0.0007) +[2023-10-08 16:11:11,779][21195] Updated weights for policy 0, policy_version 12060 (0.0009) +[2023-10-08 16:11:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 24608768. Throughput: 0: 1730.6, 1: 1735.0. Samples: 6163424. Policy #0 lag: (min: 31.0, avg: 31.7, max: 49.0) +[2023-10-08 16:11:13,803][19739] Avg episode reward: [(0, '249.150'), (1, '396.840')] +[2023-10-08 16:11:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000011968_12255232.pth... +[2023-10-08 16:11:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000012064_12353536.pth... +[2023-10-08 16:11:13,844][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000010368_10616832.pth +[2023-10-08 16:11:13,858][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000010464_10715136.pth +[2023-10-08 16:11:14,337][21194] Updated weights for policy 1, policy_version 11970 (0.0008) +[2023-10-08 16:11:14,695][21194] Updated weights for policy 1, policy_version 11980 (0.0007) +[2023-10-08 16:11:15,059][21194] Updated weights for policy 1, policy_version 11990 (0.0008) +[2023-10-08 16:11:15,428][21194] Updated weights for policy 1, policy_version 12000 (0.0009) +[2023-10-08 16:11:15,570][21195] Updated weights for policy 0, policy_version 12070 (0.0009) +[2023-10-08 16:11:15,930][21195] Updated weights for policy 0, policy_version 12080 (0.0008) +[2023-10-08 16:11:16,303][21195] Updated weights for policy 0, policy_version 12090 (0.0008) +[2023-10-08 16:11:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24674304. Throughput: 0: 1748.8, 1: 1703.9. Samples: 6178694. Policy #0 lag: (min: 22.0, avg: 23.8, max: 51.0) +[2023-10-08 16:11:18,804][19739] Avg episode reward: [(0, '249.150'), (1, '405.780')] +[2023-10-08 16:11:19,427][21194] Updated weights for policy 1, policy_version 12010 (0.0007) +[2023-10-08 16:11:19,786][21194] Updated weights for policy 1, policy_version 12020 (0.0007) +[2023-10-08 16:11:20,047][21195] Updated weights for policy 0, policy_version 12100 (0.0007) +[2023-10-08 16:11:20,149][21194] Updated weights for policy 1, policy_version 12030 (0.0008) +[2023-10-08 16:11:20,408][21195] Updated weights for policy 0, policy_version 12110 (0.0009) +[2023-10-08 16:11:20,783][21195] Updated weights for policy 0, policy_version 12120 (0.0007) +[2023-10-08 16:11:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24739840. Throughput: 0: 1728.6, 1: 1729.5. Samples: 6194318. Policy #0 lag: (min: 22.0, avg: 23.8, max: 51.0) +[2023-10-08 16:11:23,803][19739] Avg episode reward: [(0, '244.240'), (1, '405.610')] +[2023-10-08 16:11:24,033][21194] Updated weights for policy 1, policy_version 12040 (0.0008) +[2023-10-08 16:11:24,393][21194] Updated weights for policy 1, policy_version 12050 (0.0009) +[2023-10-08 16:11:24,612][21195] Updated weights for policy 0, policy_version 12130 (0.0009) +[2023-10-08 16:11:24,764][21194] Updated weights for policy 1, policy_version 12060 (0.0009) +[2023-10-08 16:11:24,974][21195] Updated weights for policy 0, policy_version 12140 (0.0009) +[2023-10-08 16:11:25,349][21195] Updated weights for policy 0, policy_version 12150 (0.0008) +[2023-10-08 16:11:25,721][21195] Updated weights for policy 0, policy_version 12160 (0.0009) +[2023-10-08 16:11:28,721][21194] Updated weights for policy 1, policy_version 12070 (0.0008) +[2023-10-08 16:11:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24805376. Throughput: 0: 1745.8, 1: 1735.8. Samples: 6216000. Policy #0 lag: (min: 22.0, avg: 23.8, max: 51.0) +[2023-10-08 16:11:28,803][19739] Avg episode reward: [(0, '258.120'), (1, '420.110')] +[2023-10-08 16:11:29,073][21194] Updated weights for policy 1, policy_version 12080 (0.0008) +[2023-10-08 16:11:29,440][21194] Updated weights for policy 1, policy_version 12090 (0.0007) +[2023-10-08 16:11:29,445][21195] Updated weights for policy 0, policy_version 12170 (0.0008) +[2023-10-08 16:11:29,658][20836] Saving new best policy, reward=420.110! +[2023-10-08 16:11:29,813][21195] Updated weights for policy 0, policy_version 12180 (0.0008) +[2023-10-08 16:11:30,174][21195] Updated weights for policy 0, policy_version 12190 (0.0008) +[2023-10-08 16:11:33,450][21194] Updated weights for policy 1, policy_version 12100 (0.0007) +[2023-10-08 16:11:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24870912. Throughput: 0: 1768.4, 1: 1715.2. Samples: 6231404. Policy #0 lag: (min: 31.0, avg: 31.3, max: 43.0) +[2023-10-08 16:11:33,803][19739] Avg episode reward: [(0, '258.120'), (1, '420.110')] +[2023-10-08 16:11:33,821][21194] Updated weights for policy 1, policy_version 12110 (0.0009) +[2023-10-08 16:11:34,185][21194] Updated weights for policy 1, policy_version 12120 (0.0007) +[2023-10-08 16:11:34,266][21195] Updated weights for policy 0, policy_version 12200 (0.0009) +[2023-10-08 16:11:34,641][21195] Updated weights for policy 0, policy_version 12210 (0.0010) +[2023-10-08 16:11:35,004][21195] Updated weights for policy 0, policy_version 12220 (0.0009) +[2023-10-08 16:11:38,022][21194] Updated weights for policy 1, policy_version 12130 (0.0009) +[2023-10-08 16:11:38,392][21194] Updated weights for policy 1, policy_version 12140 (0.0010) +[2023-10-08 16:11:38,769][21194] Updated weights for policy 1, policy_version 12150 (0.0008) +[2023-10-08 16:11:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 24936448. Throughput: 0: 1734.1, 1: 1728.8. Samples: 6246584. Policy #0 lag: (min: 31.0, avg: 31.3, max: 43.0) +[2023-10-08 16:11:38,803][19739] Avg episode reward: [(0, '257.510'), (1, '439.460')] +[2023-10-08 16:11:38,831][21195] Updated weights for policy 0, policy_version 12230 (0.0009) +[2023-10-08 16:11:39,133][20836] Saving new best policy, reward=439.460! +[2023-10-08 16:11:39,134][21194] Updated weights for policy 1, policy_version 12160 (0.0008) +[2023-10-08 16:11:39,205][21195] Updated weights for policy 0, policy_version 12240 (0.0009) +[2023-10-08 16:11:39,572][21195] Updated weights for policy 0, policy_version 12250 (0.0008) +[2023-10-08 16:11:43,093][21194] Updated weights for policy 1, policy_version 12170 (0.0009) +[2023-10-08 16:11:43,461][21194] Updated weights for policy 1, policy_version 12180 (0.0008) +[2023-10-08 16:11:43,594][21195] Updated weights for policy 0, policy_version 12260 (0.0009) +[2023-10-08 16:11:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 25001984. Throughput: 0: 1763.7, 1: 1717.1. Samples: 6267754. Policy #0 lag: (min: 31.0, avg: 31.3, max: 43.0) +[2023-10-08 16:11:43,803][19739] Avg episode reward: [(0, '259.270'), (1, '438.740')] +[2023-10-08 16:11:43,831][21194] Updated weights for policy 1, policy_version 12190 (0.0007) +[2023-10-08 16:11:43,997][21195] Updated weights for policy 0, policy_version 12270 (0.0009) +[2023-10-08 16:11:44,368][21195] Updated weights for policy 0, policy_version 12280 (0.0008) +[2023-10-08 16:11:47,827][21194] Updated weights for policy 1, policy_version 12200 (0.0009) +[2023-10-08 16:11:48,205][21194] Updated weights for policy 1, policy_version 12210 (0.0007) +[2023-10-08 16:11:48,423][21195] Updated weights for policy 0, policy_version 12290 (0.0007) +[2023-10-08 16:11:48,578][21194] Updated weights for policy 1, policy_version 12220 (0.0007) +[2023-10-08 16:11:48,791][21195] Updated weights for policy 0, policy_version 12300 (0.0009) +[2023-10-08 16:11:48,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 25100288. Throughput: 0: 1745.0, 1: 1727.9. Samples: 6282790. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:11:48,803][19739] Avg episode reward: [(0, '258.080'), (1, '438.740')] +[2023-10-08 16:11:49,167][21195] Updated weights for policy 0, policy_version 12310 (0.0008) +[2023-10-08 16:11:49,534][21195] Updated weights for policy 0, policy_version 12320 (0.0009) +[2023-10-08 16:11:52,466][21194] Updated weights for policy 1, policy_version 12230 (0.0007) +[2023-10-08 16:11:52,836][21194] Updated weights for policy 1, policy_version 12240 (0.0007) +[2023-10-08 16:11:53,209][21194] Updated weights for policy 1, policy_version 12250 (0.0010) +[2023-10-08 16:11:53,449][21195] Updated weights for policy 0, policy_version 12330 (0.0008) +[2023-10-08 16:11:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 25165824. Throughput: 0: 1735.7, 1: 1731.3. Samples: 6298410. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:11:53,803][19739] Avg episode reward: [(0, '261.760'), (1, '438.740')] +[2023-10-08 16:11:53,822][21195] Updated weights for policy 0, policy_version 12340 (0.0010) +[2023-10-08 16:11:54,186][21195] Updated weights for policy 0, policy_version 12350 (0.0010) +[2023-10-08 16:11:57,161][21194] Updated weights for policy 1, policy_version 12260 (0.0007) +[2023-10-08 16:11:57,531][21194] Updated weights for policy 1, policy_version 12270 (0.0009) +[2023-10-08 16:11:57,897][21194] Updated weights for policy 1, policy_version 12280 (0.0007) +[2023-10-08 16:11:58,014][21195] Updated weights for policy 0, policy_version 12360 (0.0007) +[2023-10-08 16:11:58,381][21195] Updated weights for policy 0, policy_version 12370 (0.0009) +[2023-10-08 16:11:58,751][21195] Updated weights for policy 0, policy_version 12380 (0.0009) +[2023-10-08 16:11:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 25231360. Throughput: 0: 1746.3, 1: 1709.3. Samples: 6318924. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:11:58,803][19739] Avg episode reward: [(0, '261.760'), (1, '430.680')] +[2023-10-08 16:12:01,780][21194] Updated weights for policy 1, policy_version 12290 (0.0008) +[2023-10-08 16:12:02,138][21194] Updated weights for policy 1, policy_version 12300 (0.0011) +[2023-10-08 16:12:02,505][21194] Updated weights for policy 1, policy_version 12310 (0.0008) +[2023-10-08 16:12:02,867][21194] Updated weights for policy 1, policy_version 12320 (0.0008) +[2023-10-08 16:12:02,890][21195] Updated weights for policy 0, policy_version 12390 (0.0008) +[2023-10-08 16:12:03,259][21195] Updated weights for policy 0, policy_version 12400 (0.0007) +[2023-10-08 16:12:03,628][21195] Updated weights for policy 0, policy_version 12410 (0.0007) +[2023-10-08 16:12:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 25296896. Throughput: 0: 1720.6, 1: 1732.6. Samples: 6334088. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 16:12:03,803][19739] Avg episode reward: [(0, '261.760'), (1, '454.550')] +[2023-10-08 16:12:03,804][20836] Saving new best policy, reward=454.550! +[2023-10-08 16:12:06,854][21194] Updated weights for policy 1, policy_version 12330 (0.0008) +[2023-10-08 16:12:07,218][21194] Updated weights for policy 1, policy_version 12340 (0.0008) +[2023-10-08 16:12:07,578][21194] Updated weights for policy 1, policy_version 12350 (0.0010) +[2023-10-08 16:12:07,586][21195] Updated weights for policy 0, policy_version 12420 (0.0008) +[2023-10-08 16:12:07,956][21195] Updated weights for policy 0, policy_version 12430 (0.0008) +[2023-10-08 16:12:08,325][21195] Updated weights for policy 0, policy_version 12440 (0.0009) +[2023-10-08 16:12:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 25395200. Throughput: 0: 1744.9, 1: 1716.7. Samples: 6350092. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 16:12:08,803][19739] Avg episode reward: [(0, '249.000'), (1, '452.710')] +[2023-10-08 16:12:11,527][21194] Updated weights for policy 1, policy_version 12360 (0.0008) +[2023-10-08 16:12:11,900][21194] Updated weights for policy 1, policy_version 12370 (0.0011) +[2023-10-08 16:12:12,272][21194] Updated weights for policy 1, policy_version 12380 (0.0010) +[2023-10-08 16:12:12,354][21195] Updated weights for policy 0, policy_version 12450 (0.0009) +[2023-10-08 16:12:12,740][21195] Updated weights for policy 0, policy_version 12460 (0.0009) +[2023-10-08 16:12:13,119][21195] Updated weights for policy 0, policy_version 12470 (0.0008) +[2023-10-08 16:12:13,494][21195] Updated weights for policy 0, policy_version 12480 (0.0007) +[2023-10-08 16:12:13,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 25460736. Throughput: 0: 1724.3, 1: 1701.2. Samples: 6370148. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:13,803][19739] Avg episode reward: [(0, '241.030'), (1, '452.710')] +[2023-10-08 16:12:16,238][21194] Updated weights for policy 1, policy_version 12390 (0.0008) +[2023-10-08 16:12:16,606][21194] Updated weights for policy 1, policy_version 12400 (0.0009) +[2023-10-08 16:12:16,973][21194] Updated weights for policy 1, policy_version 12410 (0.0010) +[2023-10-08 16:12:17,358][21195] Updated weights for policy 0, policy_version 12490 (0.0009) +[2023-10-08 16:12:17,731][21195] Updated weights for policy 0, policy_version 12500 (0.0008) +[2023-10-08 16:12:18,099][21195] Updated weights for policy 0, policy_version 12510 (0.0008) +[2023-10-08 16:12:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 25526272. Throughput: 0: 1703.1, 1: 1730.2. Samples: 6385902. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:18,803][19739] Avg episode reward: [(0, '241.030'), (1, '452.710')] +[2023-10-08 16:12:20,980][21194] Updated weights for policy 1, policy_version 12420 (0.0010) +[2023-10-08 16:12:21,350][21194] Updated weights for policy 1, policy_version 12430 (0.0009) +[2023-10-08 16:12:21,725][21194] Updated weights for policy 1, policy_version 12440 (0.0009) +[2023-10-08 16:12:21,924][21195] Updated weights for policy 0, policy_version 12520 (0.0009) +[2023-10-08 16:12:22,303][21195] Updated weights for policy 0, policy_version 12530 (0.0008) +[2023-10-08 16:12:22,675][21195] Updated weights for policy 0, policy_version 12540 (0.0007) +[2023-10-08 16:12:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 25591808. Throughput: 0: 1729.7, 1: 1704.9. Samples: 6401140. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:23,803][19739] Avg episode reward: [(0, '244.440'), (1, '452.710')] +[2023-10-08 16:12:25,770][21194] Updated weights for policy 1, policy_version 12450 (0.0009) +[2023-10-08 16:12:26,140][21194] Updated weights for policy 1, policy_version 12460 (0.0007) +[2023-10-08 16:12:26,508][21194] Updated weights for policy 1, policy_version 12470 (0.0011) +[2023-10-08 16:12:26,707][21195] Updated weights for policy 0, policy_version 12550 (0.0008) +[2023-10-08 16:12:26,879][21194] Updated weights for policy 1, policy_version 12480 (0.0008) +[2023-10-08 16:12:27,085][21195] Updated weights for policy 0, policy_version 12560 (0.0009) +[2023-10-08 16:12:27,445][21195] Updated weights for policy 0, policy_version 12570 (0.0009) +[2023-10-08 16:12:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 25657344. Throughput: 0: 1698.8, 1: 1710.3. Samples: 6421164. Policy #0 lag: (min: 12.0, avg: 13.3, max: 32.0) +[2023-10-08 16:12:28,803][19739] Avg episode reward: [(0, '248.090'), (1, '452.710')] +[2023-10-08 16:12:30,787][21194] Updated weights for policy 1, policy_version 12490 (0.0008) +[2023-10-08 16:12:31,157][21194] Updated weights for policy 1, policy_version 12500 (0.0010) +[2023-10-08 16:12:31,317][21195] Updated weights for policy 0, policy_version 12580 (0.0008) +[2023-10-08 16:12:31,522][21194] Updated weights for policy 1, policy_version 12510 (0.0009) +[2023-10-08 16:12:31,687][21195] Updated weights for policy 0, policy_version 12590 (0.0007) +[2023-10-08 16:12:32,064][21195] Updated weights for policy 0, policy_version 12600 (0.0007) +[2023-10-08 16:12:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 25722880. Throughput: 0: 1717.5, 1: 1716.8. Samples: 6437332. Policy #0 lag: (min: 12.0, avg: 13.3, max: 32.0) +[2023-10-08 16:12:33,803][19739] Avg episode reward: [(0, '248.090'), (1, '452.760')] +[2023-10-08 16:12:35,568][21194] Updated weights for policy 1, policy_version 12520 (0.0008) +[2023-10-08 16:12:35,870][21195] Updated weights for policy 0, policy_version 12610 (0.0008) +[2023-10-08 16:12:35,949][21194] Updated weights for policy 1, policy_version 12530 (0.0008) +[2023-10-08 16:12:36,230][21195] Updated weights for policy 0, policy_version 12620 (0.0009) +[2023-10-08 16:12:36,307][21194] Updated weights for policy 1, policy_version 12540 (0.0008) +[2023-10-08 16:12:36,593][21195] Updated weights for policy 0, policy_version 12630 (0.0009) +[2023-10-08 16:12:36,968][21195] Updated weights for policy 0, policy_version 12640 (0.0008) +[2023-10-08 16:12:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 25788416. Throughput: 0: 1714.3, 1: 1701.3. Samples: 6452112. Policy #0 lag: (min: 12.0, avg: 13.3, max: 32.0) +[2023-10-08 16:12:38,803][19739] Avg episode reward: [(0, '248.090'), (1, '452.760')] +[2023-10-08 16:12:40,334][21194] Updated weights for policy 1, policy_version 12550 (0.0009) +[2023-10-08 16:12:40,700][21194] Updated weights for policy 1, policy_version 12560 (0.0009) +[2023-10-08 16:12:40,951][21195] Updated weights for policy 0, policy_version 12650 (0.0008) +[2023-10-08 16:12:41,056][21194] Updated weights for policy 1, policy_version 12570 (0.0008) +[2023-10-08 16:12:41,320][21195] Updated weights for policy 0, policy_version 12660 (0.0007) +[2023-10-08 16:12:41,694][21195] Updated weights for policy 0, policy_version 12670 (0.0009) +[2023-10-08 16:12:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 25853952. Throughput: 0: 1701.8, 1: 1715.8. Samples: 6472718. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:43,803][19739] Avg episode reward: [(0, '252.340'), (1, '447.400')] +[2023-10-08 16:12:45,045][21194] Updated weights for policy 1, policy_version 12580 (0.0009) +[2023-10-08 16:12:45,418][21194] Updated weights for policy 1, policy_version 12590 (0.0008) +[2023-10-08 16:12:45,701][21195] Updated weights for policy 0, policy_version 12680 (0.0010) +[2023-10-08 16:12:45,787][21194] Updated weights for policy 1, policy_version 12600 (0.0009) +[2023-10-08 16:12:46,072][21195] Updated weights for policy 0, policy_version 12690 (0.0007) +[2023-10-08 16:12:46,446][21195] Updated weights for policy 0, policy_version 12700 (0.0009) +[2023-10-08 16:12:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 25919488. Throughput: 0: 1729.5, 1: 1696.1. Samples: 6488240. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:48,804][19739] Avg episode reward: [(0, '253.270'), (1, '449.410')] +[2023-10-08 16:12:49,803][21194] Updated weights for policy 1, policy_version 12610 (0.0008) +[2023-10-08 16:12:50,173][21194] Updated weights for policy 1, policy_version 12620 (0.0007) +[2023-10-08 16:12:50,262][21195] Updated weights for policy 0, policy_version 12710 (0.0007) +[2023-10-08 16:12:50,537][21194] Updated weights for policy 1, policy_version 12630 (0.0010) +[2023-10-08 16:12:50,635][21195] Updated weights for policy 0, policy_version 12720 (0.0009) +[2023-10-08 16:12:50,894][21194] Updated weights for policy 1, policy_version 12640 (0.0007) +[2023-10-08 16:12:51,008][21195] Updated weights for policy 0, policy_version 12730 (0.0008) +[2023-10-08 16:12:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 25985024. Throughput: 0: 1702.8, 1: 1703.7. Samples: 6503388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:53,803][19739] Avg episode reward: [(0, '254.860'), (1, '449.410')] +[2023-10-08 16:12:54,848][21194] Updated weights for policy 1, policy_version 12650 (0.0008) +[2023-10-08 16:12:55,002][21195] Updated weights for policy 0, policy_version 12740 (0.0010) +[2023-10-08 16:12:55,215][21194] Updated weights for policy 1, policy_version 12660 (0.0009) +[2023-10-08 16:12:55,378][21195] Updated weights for policy 0, policy_version 12750 (0.0009) +[2023-10-08 16:12:55,579][21194] Updated weights for policy 1, policy_version 12670 (0.0010) +[2023-10-08 16:12:55,743][21195] Updated weights for policy 0, policy_version 12760 (0.0010) +[2023-10-08 16:12:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 26050560. Throughput: 0: 1717.2, 1: 1717.3. Samples: 6524702. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:12:58,803][19739] Avg episode reward: [(0, '241.470'), (1, '439.060')] +[2023-10-08 16:12:59,673][21194] Updated weights for policy 1, policy_version 12680 (0.0009) +[2023-10-08 16:12:59,679][21195] Updated weights for policy 0, policy_version 12770 (0.0008) +[2023-10-08 16:13:00,042][21194] Updated weights for policy 1, policy_version 12690 (0.0009) +[2023-10-08 16:13:00,044][21195] Updated weights for policy 0, policy_version 12780 (0.0008) +[2023-10-08 16:13:00,399][21194] Updated weights for policy 1, policy_version 12700 (0.0010) +[2023-10-08 16:13:00,415][21195] Updated weights for policy 0, policy_version 12790 (0.0009) +[2023-10-08 16:13:00,794][21195] Updated weights for policy 0, policy_version 12800 (0.0008) +[2023-10-08 16:13:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 26116096. Throughput: 0: 1734.1, 1: 1686.9. Samples: 6539850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:13:03,803][19739] Avg episode reward: [(0, '240.380'), (1, '446.600')] +[2023-10-08 16:13:04,335][21194] Updated weights for policy 1, policy_version 12710 (0.0009) +[2023-10-08 16:13:04,703][21194] Updated weights for policy 1, policy_version 12720 (0.0008) +[2023-10-08 16:13:04,784][21195] Updated weights for policy 0, policy_version 12810 (0.0008) +[2023-10-08 16:13:05,077][21194] Updated weights for policy 1, policy_version 12730 (0.0007) +[2023-10-08 16:13:05,158][21195] Updated weights for policy 0, policy_version 12820 (0.0008) +[2023-10-08 16:13:05,530][21195] Updated weights for policy 0, policy_version 12830 (0.0009) +[2023-10-08 16:13:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 26181632. Throughput: 0: 1706.3, 1: 1721.4. Samples: 6555388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:13:08,803][19739] Avg episode reward: [(0, '241.330'), (1, '446.600')] +[2023-10-08 16:13:08,926][21194] Updated weights for policy 1, policy_version 12740 (0.0009) +[2023-10-08 16:13:09,294][21194] Updated weights for policy 1, policy_version 12750 (0.0009) +[2023-10-08 16:13:09,504][21195] Updated weights for policy 0, policy_version 12840 (0.0007) +[2023-10-08 16:13:09,656][21194] Updated weights for policy 1, policy_version 12760 (0.0007) +[2023-10-08 16:13:09,866][21195] Updated weights for policy 0, policy_version 12850 (0.0007) +[2023-10-08 16:13:10,233][21195] Updated weights for policy 0, policy_version 12860 (0.0007) +[2023-10-08 16:13:13,687][21194] Updated weights for policy 1, policy_version 12770 (0.0009) +[2023-10-08 16:13:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 26247168. Throughput: 0: 1734.0, 1: 1724.5. Samples: 6576798. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 16:13:13,803][19739] Avg episode reward: [(0, '247.970'), (1, '449.370')] +[2023-10-08 16:13:14,049][21194] Updated weights for policy 1, policy_version 12780 (0.0010) +[2023-10-08 16:13:14,100][21195] Updated weights for policy 0, policy_version 12870 (0.0009) +[2023-10-08 16:13:14,421][21194] Updated weights for policy 1, policy_version 12790 (0.0007) +[2023-10-08 16:13:14,476][21195] Updated weights for policy 0, policy_version 12880 (0.0008) +[2023-10-08 16:13:14,778][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000012800_13107200.pth... +[2023-10-08 16:13:14,780][21194] Updated weights for policy 1, policy_version 12800 (0.0007) +[2023-10-08 16:13:14,806][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000011168_11436032.pth +[2023-10-08 16:13:14,854][21195] Updated weights for policy 0, policy_version 12890 (0.0008) +[2023-10-08 16:13:15,077][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000012896_13205504.pth... +[2023-10-08 16:13:15,116][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000011264_11534336.pth +[2023-10-08 16:13:18,752][21194] Updated weights for policy 1, policy_version 12810 (0.0008) +[2023-10-08 16:13:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 26312704. Throughput: 0: 1731.2, 1: 1707.0. Samples: 6592054. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 16:13:18,803][19739] Avg episode reward: [(0, '247.970'), (1, '452.380')] +[2023-10-08 16:13:18,879][21195] Updated weights for policy 0, policy_version 12900 (0.0009) +[2023-10-08 16:13:19,118][21194] Updated weights for policy 1, policy_version 12820 (0.0008) +[2023-10-08 16:13:19,256][21195] Updated weights for policy 0, policy_version 12910 (0.0008) +[2023-10-08 16:13:19,491][21194] Updated weights for policy 1, policy_version 12830 (0.0008) +[2023-10-08 16:13:19,633][21195] Updated weights for policy 0, policy_version 12920 (0.0007) +[2023-10-08 16:13:23,522][21194] Updated weights for policy 1, policy_version 12840 (0.0008) +[2023-10-08 16:13:23,550][21195] Updated weights for policy 0, policy_version 12930 (0.0009) +[2023-10-08 16:13:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 26378240. Throughput: 0: 1724.5, 1: 1723.2. Samples: 6607258. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 16:13:23,803][19739] Avg episode reward: [(0, '260.470'), (1, '452.380')] +[2023-10-08 16:13:23,891][21194] Updated weights for policy 1, policy_version 12850 (0.0009) +[2023-10-08 16:13:23,924][21195] Updated weights for policy 0, policy_version 12940 (0.0008) +[2023-10-08 16:13:24,268][21194] Updated weights for policy 1, policy_version 12860 (0.0007) +[2023-10-08 16:13:24,293][21195] Updated weights for policy 0, policy_version 12950 (0.0009) +[2023-10-08 16:13:24,661][21195] Updated weights for policy 0, policy_version 12960 (0.0007) +[2023-10-08 16:13:28,047][21194] Updated weights for policy 1, policy_version 12870 (0.0007) +[2023-10-08 16:13:28,422][21194] Updated weights for policy 1, policy_version 12880 (0.0007) +[2023-10-08 16:13:28,615][21195] Updated weights for policy 0, policy_version 12970 (0.0008) +[2023-10-08 16:13:28,792][21194] Updated weights for policy 1, policy_version 12890 (0.0007) +[2023-10-08 16:13:28,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 26443776. Throughput: 0: 1734.1, 1: 1730.4. Samples: 6628620. Policy #0 lag: (min: 1.0, avg: 14.9, max: 33.0) +[2023-10-08 16:13:28,803][19739] Avg episode reward: [(0, '260.470'), (1, '452.380')] +[2023-10-08 16:13:28,988][21195] Updated weights for policy 0, policy_version 12980 (0.0008) +[2023-10-08 16:13:29,355][21195] Updated weights for policy 0, policy_version 12990 (0.0009) +[2023-10-08 16:13:32,507][21194] Updated weights for policy 1, policy_version 12900 (0.0007) +[2023-10-08 16:13:32,878][21194] Updated weights for policy 1, policy_version 12910 (0.0009) +[2023-10-08 16:13:33,252][21194] Updated weights for policy 1, policy_version 12920 (0.0009) +[2023-10-08 16:13:33,324][21195] Updated weights for policy 0, policy_version 13000 (0.0010) +[2023-10-08 16:13:33,690][21195] Updated weights for policy 0, policy_version 13010 (0.0008) +[2023-10-08 16:13:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 26542080. Throughput: 0: 1715.3, 1: 1732.0. Samples: 6643366. Policy #0 lag: (min: 1.0, avg: 14.9, max: 33.0) +[2023-10-08 16:13:33,803][19739] Avg episode reward: [(0, '260.470'), (1, '449.030')] +[2023-10-08 16:13:34,056][21195] Updated weights for policy 0, policy_version 13020 (0.0010) +[2023-10-08 16:13:37,243][21194] Updated weights for policy 1, policy_version 12930 (0.0008) +[2023-10-08 16:13:37,613][21194] Updated weights for policy 1, policy_version 12940 (0.0007) +[2023-10-08 16:13:37,917][21195] Updated weights for policy 0, policy_version 13030 (0.0010) +[2023-10-08 16:13:37,973][21194] Updated weights for policy 1, policy_version 12950 (0.0008) +[2023-10-08 16:13:38,289][21195] Updated weights for policy 0, policy_version 13040 (0.0008) +[2023-10-08 16:13:38,336][21194] Updated weights for policy 1, policy_version 12960 (0.0007) +[2023-10-08 16:13:38,659][21195] Updated weights for policy 0, policy_version 13050 (0.0007) +[2023-10-08 16:13:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 26607616. Throughput: 0: 1736.3, 1: 1735.7. Samples: 6659628. Policy #0 lag: (min: 1.0, avg: 14.9, max: 33.0) +[2023-10-08 16:13:38,803][19739] Avg episode reward: [(0, '259.990'), (1, '449.030')] +[2023-10-08 16:13:42,189][21194] Updated weights for policy 1, policy_version 12970 (0.0008) +[2023-10-08 16:13:42,558][21194] Updated weights for policy 1, policy_version 12980 (0.0008) +[2023-10-08 16:13:42,569][21195] Updated weights for policy 0, policy_version 13060 (0.0007) +[2023-10-08 16:13:42,934][21194] Updated weights for policy 1, policy_version 12990 (0.0009) +[2023-10-08 16:13:42,950][21195] Updated weights for policy 0, policy_version 13070 (0.0009) +[2023-10-08 16:13:43,314][21195] Updated weights for policy 0, policy_version 13080 (0.0008) +[2023-10-08 16:13:43,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 26705920. Throughput: 0: 1730.8, 1: 1706.4. Samples: 6679376. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 16:13:43,803][19739] Avg episode reward: [(0, '247.920'), (1, '449.030')] +[2023-10-08 16:13:46,945][21194] Updated weights for policy 1, policy_version 13000 (0.0008) +[2023-10-08 16:13:47,195][21195] Updated weights for policy 0, policy_version 13090 (0.0009) +[2023-10-08 16:13:47,318][21194] Updated weights for policy 1, policy_version 13010 (0.0009) +[2023-10-08 16:13:47,566][21195] Updated weights for policy 0, policy_version 13100 (0.0010) +[2023-10-08 16:13:47,678][21194] Updated weights for policy 1, policy_version 13020 (0.0008) +[2023-10-08 16:13:47,939][21195] Updated weights for policy 0, policy_version 13110 (0.0009) +[2023-10-08 16:13:48,311][21195] Updated weights for policy 0, policy_version 13120 (0.0009) +[2023-10-08 16:13:48,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 26771456. Throughput: 0: 1711.3, 1: 1738.2. Samples: 6695076. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 16:13:48,803][19739] Avg episode reward: [(0, '247.920'), (1, '449.030')] +[2023-10-08 16:13:51,842][21194] Updated weights for policy 1, policy_version 13030 (0.0007) +[2023-10-08 16:13:52,210][21194] Updated weights for policy 1, policy_version 13040 (0.0007) +[2023-10-08 16:13:52,379][21195] Updated weights for policy 0, policy_version 13130 (0.0007) +[2023-10-08 16:13:52,574][21194] Updated weights for policy 1, policy_version 13050 (0.0009) +[2023-10-08 16:13:52,750][21195] Updated weights for policy 0, policy_version 13140 (0.0007) +[2023-10-08 16:13:53,122][21195] Updated weights for policy 0, policy_version 13150 (0.0009) +[2023-10-08 16:13:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 26836992. Throughput: 0: 1744.3, 1: 1722.4. Samples: 6711390. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 16:13:53,803][19739] Avg episode reward: [(0, '247.000'), (1, '449.030')] +[2023-10-08 16:13:56,506][21194] Updated weights for policy 1, policy_version 13060 (0.0008) +[2023-10-08 16:13:56,873][21194] Updated weights for policy 1, policy_version 13070 (0.0007) +[2023-10-08 16:13:56,951][21195] Updated weights for policy 0, policy_version 13160 (0.0007) +[2023-10-08 16:13:57,243][21194] Updated weights for policy 1, policy_version 13080 (0.0007) +[2023-10-08 16:13:57,325][21195] Updated weights for policy 0, policy_version 13170 (0.0009) +[2023-10-08 16:13:57,695][21195] Updated weights for policy 0, policy_version 13180 (0.0009) +[2023-10-08 16:13:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 26902528. Throughput: 0: 1718.0, 1: 1702.2. Samples: 6730706. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 16:13:58,803][19739] Avg episode reward: [(0, '239.160'), (1, '449.030')] +[2023-10-08 16:14:01,162][21194] Updated weights for policy 1, policy_version 13090 (0.0008) +[2023-10-08 16:14:01,517][21195] Updated weights for policy 0, policy_version 13190 (0.0008) +[2023-10-08 16:14:01,529][21194] Updated weights for policy 1, policy_version 13100 (0.0008) +[2023-10-08 16:14:01,884][21195] Updated weights for policy 0, policy_version 13200 (0.0008) +[2023-10-08 16:14:01,901][21194] Updated weights for policy 1, policy_version 13110 (0.0010) +[2023-10-08 16:14:02,250][21195] Updated weights for policy 0, policy_version 13210 (0.0008) +[2023-10-08 16:14:02,256][21194] Updated weights for policy 1, policy_version 13120 (0.0007) +[2023-10-08 16:14:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 26968064. Throughput: 0: 1717.3, 1: 1733.1. Samples: 6747322. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 16:14:03,804][19739] Avg episode reward: [(0, '238.520'), (1, '449.030')] +[2023-10-08 16:14:06,269][21194] Updated weights for policy 1, policy_version 13130 (0.0007) +[2023-10-08 16:14:06,288][21195] Updated weights for policy 0, policy_version 13220 (0.0007) +[2023-10-08 16:14:06,636][21194] Updated weights for policy 1, policy_version 13140 (0.0008) +[2023-10-08 16:14:06,682][21195] Updated weights for policy 0, policy_version 13230 (0.0008) +[2023-10-08 16:14:06,990][21194] Updated weights for policy 1, policy_version 13150 (0.0007) +[2023-10-08 16:14:07,054][21195] Updated weights for policy 0, policy_version 13240 (0.0008) +[2023-10-08 16:14:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 27033600. Throughput: 0: 1728.0, 1: 1707.0. Samples: 6761832. Policy #0 lag: (min: 8.0, avg: 28.2, max: 40.0) +[2023-10-08 16:14:08,803][19739] Avg episode reward: [(0, '238.520'), (1, '449.030')] +[2023-10-08 16:14:10,773][21195] Updated weights for policy 0, policy_version 13250 (0.0009) +[2023-10-08 16:14:11,143][21195] Updated weights for policy 0, policy_version 13260 (0.0008) +[2023-10-08 16:14:11,171][21194] Updated weights for policy 1, policy_version 13160 (0.0008) +[2023-10-08 16:14:11,511][21195] Updated weights for policy 0, policy_version 13270 (0.0008) +[2023-10-08 16:14:11,547][21194] Updated weights for policy 1, policy_version 13170 (0.0007) +[2023-10-08 16:14:11,886][21195] Updated weights for policy 0, policy_version 13280 (0.0009) +[2023-10-08 16:14:11,918][21194] Updated weights for policy 1, policy_version 13180 (0.0008) +[2023-10-08 16:14:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 27099136. Throughput: 0: 1712.8, 1: 1699.8. Samples: 6782190. Policy #0 lag: (min: 8.0, avg: 28.2, max: 40.0) +[2023-10-08 16:14:13,803][19739] Avg episode reward: [(0, '238.520'), (1, '464.860')] +[2023-10-08 16:14:13,813][20836] Saving new best policy, reward=464.860! +[2023-10-08 16:14:15,928][21195] Updated weights for policy 0, policy_version 13290 (0.0009) +[2023-10-08 16:14:16,059][21194] Updated weights for policy 1, policy_version 13190 (0.0008) +[2023-10-08 16:14:16,306][21195] Updated weights for policy 0, policy_version 13300 (0.0009) +[2023-10-08 16:14:16,426][21194] Updated weights for policy 1, policy_version 13200 (0.0008) +[2023-10-08 16:14:16,674][21195] Updated weights for policy 0, policy_version 13310 (0.0008) +[2023-10-08 16:14:16,793][21194] Updated weights for policy 1, policy_version 13210 (0.0010) +[2023-10-08 16:14:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 27164672. Throughput: 0: 1730.7, 1: 1714.8. Samples: 6798412. Policy #0 lag: (min: 8.0, avg: 28.2, max: 40.0) +[2023-10-08 16:14:18,803][19739] Avg episode reward: [(0, '238.520'), (1, '464.860')] +[2023-10-08 16:14:20,723][21195] Updated weights for policy 0, policy_version 13320 (0.0007) +[2023-10-08 16:14:20,752][21194] Updated weights for policy 1, policy_version 13220 (0.0008) +[2023-10-08 16:14:21,090][21195] Updated weights for policy 0, policy_version 13330 (0.0008) +[2023-10-08 16:14:21,123][21194] Updated weights for policy 1, policy_version 13230 (0.0007) +[2023-10-08 16:14:21,465][21195] Updated weights for policy 0, policy_version 13340 (0.0008) +[2023-10-08 16:14:21,485][21194] Updated weights for policy 1, policy_version 13240 (0.0007) +[2023-10-08 16:14:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 27230208. Throughput: 0: 1708.8, 1: 1688.0. Samples: 6812486. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 16:14:23,803][19739] Avg episode reward: [(0, '239.500'), (1, '472.740')] +[2023-10-08 16:14:23,804][20836] Saving new best policy, reward=472.740! +[2023-10-08 16:14:25,390][21194] Updated weights for policy 1, policy_version 13250 (0.0009) +[2023-10-08 16:14:25,582][21195] Updated weights for policy 0, policy_version 13350 (0.0010) +[2023-10-08 16:14:25,762][21194] Updated weights for policy 1, policy_version 13260 (0.0008) +[2023-10-08 16:14:25,955][21195] Updated weights for policy 0, policy_version 13360 (0.0009) +[2023-10-08 16:14:26,129][21194] Updated weights for policy 1, policy_version 13270 (0.0008) +[2023-10-08 16:14:26,326][21195] Updated weights for policy 0, policy_version 13370 (0.0010) +[2023-10-08 16:14:26,499][21194] Updated weights for policy 1, policy_version 13280 (0.0007) +[2023-10-08 16:14:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 27295744. Throughput: 0: 1714.8, 1: 1720.3. Samples: 6833954. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 16:14:28,803][19739] Avg episode reward: [(0, '242.100'), (1, '472.740')] +[2023-10-08 16:14:30,116][21195] Updated weights for policy 0, policy_version 13380 (0.0010) +[2023-10-08 16:14:30,403][21194] Updated weights for policy 1, policy_version 13290 (0.0009) +[2023-10-08 16:14:30,486][21195] Updated weights for policy 0, policy_version 13390 (0.0009) +[2023-10-08 16:14:30,774][21194] Updated weights for policy 1, policy_version 13300 (0.0007) +[2023-10-08 16:14:30,863][21195] Updated weights for policy 0, policy_version 13400 (0.0009) +[2023-10-08 16:14:31,147][21194] Updated weights for policy 1, policy_version 13310 (0.0007) +[2023-10-08 16:14:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 27361280. Throughput: 0: 1735.4, 1: 1695.2. Samples: 6849454. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 16:14:33,803][19739] Avg episode reward: [(0, '250.700'), (1, '472.940')] +[2023-10-08 16:14:33,804][20836] Saving new best policy, reward=472.940! +[2023-10-08 16:14:34,904][21195] Updated weights for policy 0, policy_version 13410 (0.0008) +[2023-10-08 16:14:35,201][21194] Updated weights for policy 1, policy_version 13320 (0.0007) +[2023-10-08 16:14:35,267][21195] Updated weights for policy 0, policy_version 13420 (0.0008) +[2023-10-08 16:14:35,574][21194] Updated weights for policy 1, policy_version 13330 (0.0009) +[2023-10-08 16:14:35,631][21195] Updated weights for policy 0, policy_version 13430 (0.0008) +[2023-10-08 16:14:35,941][21194] Updated weights for policy 1, policy_version 13340 (0.0011) +[2023-10-08 16:14:36,005][21195] Updated weights for policy 0, policy_version 13440 (0.0007) +[2023-10-08 16:14:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 27426816. Throughput: 0: 1705.0, 1: 1704.0. Samples: 6864794. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:14:38,803][19739] Avg episode reward: [(0, '242.630'), (1, '472.940')] +[2023-10-08 16:14:39,791][21195] Updated weights for policy 0, policy_version 13450 (0.0009) +[2023-10-08 16:14:39,812][21194] Updated weights for policy 1, policy_version 13350 (0.0007) +[2023-10-08 16:14:40,164][21195] Updated weights for policy 0, policy_version 13460 (0.0008) +[2023-10-08 16:14:40,172][21194] Updated weights for policy 1, policy_version 13360 (0.0008) +[2023-10-08 16:14:40,528][21195] Updated weights for policy 0, policy_version 13470 (0.0007) +[2023-10-08 16:14:40,548][21194] Updated weights for policy 1, policy_version 13370 (0.0009) +[2023-10-08 16:14:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 27492352. Throughput: 0: 1732.9, 1: 1724.3. Samples: 6886282. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:14:43,803][19739] Avg episode reward: [(0, '248.110'), (1, '477.850')] +[2023-10-08 16:14:43,810][20836] Saving new best policy, reward=477.850! +[2023-10-08 16:14:44,477][21195] Updated weights for policy 0, policy_version 13480 (0.0008) +[2023-10-08 16:14:44,522][21194] Updated weights for policy 1, policy_version 13380 (0.0008) +[2023-10-08 16:14:44,848][21195] Updated weights for policy 0, policy_version 13490 (0.0009) +[2023-10-08 16:14:44,886][21194] Updated weights for policy 1, policy_version 13390 (0.0010) +[2023-10-08 16:14:45,216][21195] Updated weights for policy 0, policy_version 13500 (0.0007) +[2023-10-08 16:14:45,259][21194] Updated weights for policy 1, policy_version 13400 (0.0009) +[2023-10-08 16:14:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 27557888. Throughput: 0: 1734.4, 1: 1695.0. Samples: 6901646. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:14:48,803][19739] Avg episode reward: [(0, '259.580'), (1, '477.850')] +[2023-10-08 16:14:49,179][21195] Updated weights for policy 0, policy_version 13510 (0.0008) +[2023-10-08 16:14:49,276][21194] Updated weights for policy 1, policy_version 13410 (0.0009) +[2023-10-08 16:14:49,545][21195] Updated weights for policy 0, policy_version 13520 (0.0007) +[2023-10-08 16:14:49,647][21194] Updated weights for policy 1, policy_version 13420 (0.0007) +[2023-10-08 16:14:49,923][21195] Updated weights for policy 0, policy_version 13530 (0.0007) +[2023-10-08 16:14:50,008][21194] Updated weights for policy 1, policy_version 13430 (0.0008) +[2023-10-08 16:14:50,378][21194] Updated weights for policy 1, policy_version 13440 (0.0010) +[2023-10-08 16:14:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 27623424. Throughput: 0: 1725.0, 1: 1715.2. Samples: 6916642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:14:53,803][19739] Avg episode reward: [(0, '254.790'), (1, '477.850')] +[2023-10-08 16:14:53,970][21195] Updated weights for policy 0, policy_version 13540 (0.0008) +[2023-10-08 16:14:54,352][21195] Updated weights for policy 0, policy_version 13550 (0.0009) +[2023-10-08 16:14:54,376][21194] Updated weights for policy 1, policy_version 13450 (0.0007) +[2023-10-08 16:14:54,712][21195] Updated weights for policy 0, policy_version 13560 (0.0007) +[2023-10-08 16:14:54,740][21194] Updated weights for policy 1, policy_version 13460 (0.0007) +[2023-10-08 16:14:55,112][21194] Updated weights for policy 1, policy_version 13470 (0.0008) +[2023-10-08 16:14:58,687][21195] Updated weights for policy 0, policy_version 13570 (0.0008) +[2023-10-08 16:14:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 27688960. Throughput: 0: 1741.0, 1: 1722.3. Samples: 6938036. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:14:58,804][19739] Avg episode reward: [(0, '265.170'), (1, '477.850')] +[2023-10-08 16:14:59,049][21195] Updated weights for policy 0, policy_version 13580 (0.0009) +[2023-10-08 16:14:59,165][21194] Updated weights for policy 1, policy_version 13480 (0.0008) +[2023-10-08 16:14:59,422][21195] Updated weights for policy 0, policy_version 13590 (0.0009) +[2023-10-08 16:14:59,527][21194] Updated weights for policy 1, policy_version 13490 (0.0007) +[2023-10-08 16:14:59,800][21195] Updated weights for policy 0, policy_version 13600 (0.0010) +[2023-10-08 16:14:59,889][21194] Updated weights for policy 1, policy_version 13500 (0.0007) +[2023-10-08 16:15:03,757][21195] Updated weights for policy 0, policy_version 13610 (0.0010) +[2023-10-08 16:15:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 27754496. Throughput: 0: 1727.7, 1: 1702.0. Samples: 6952748. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:15:03,803][19739] Avg episode reward: [(0, '247.410'), (1, '478.930')] +[2023-10-08 16:15:03,902][21194] Updated weights for policy 1, policy_version 13510 (0.0008) +[2023-10-08 16:15:04,129][21195] Updated weights for policy 0, policy_version 13620 (0.0008) +[2023-10-08 16:15:04,274][21194] Updated weights for policy 1, policy_version 13520 (0.0007) +[2023-10-08 16:15:04,491][21195] Updated weights for policy 0, policy_version 13630 (0.0008) +[2023-10-08 16:15:04,637][21194] Updated weights for policy 1, policy_version 13530 (0.0009) +[2023-10-08 16:15:04,860][20836] Saving new best policy, reward=478.930! +[2023-10-08 16:15:08,251][21195] Updated weights for policy 0, policy_version 13640 (0.0008) +[2023-10-08 16:15:08,625][21195] Updated weights for policy 0, policy_version 13650 (0.0008) +[2023-10-08 16:15:08,696][21194] Updated weights for policy 1, policy_version 13540 (0.0010) +[2023-10-08 16:15:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 27820032. Throughput: 0: 1742.0, 1: 1721.2. Samples: 6968328. Policy #0 lag: (min: 13.0, avg: 17.0, max: 45.0) +[2023-10-08 16:15:08,803][19739] Avg episode reward: [(0, '253.810'), (1, '487.380')] +[2023-10-08 16:15:08,993][21195] Updated weights for policy 0, policy_version 13660 (0.0008) +[2023-10-08 16:15:09,057][21194] Updated weights for policy 1, policy_version 13550 (0.0009) +[2023-10-08 16:15:09,424][21194] Updated weights for policy 1, policy_version 13560 (0.0009) +[2023-10-08 16:15:09,720][20836] Saving new best policy, reward=487.380! +[2023-10-08 16:15:12,914][21195] Updated weights for policy 0, policy_version 13670 (0.0010) +[2023-10-08 16:15:13,287][21194] Updated weights for policy 1, policy_version 13570 (0.0008) +[2023-10-08 16:15:13,290][21195] Updated weights for policy 0, policy_version 13680 (0.0009) +[2023-10-08 16:15:13,645][21194] Updated weights for policy 1, policy_version 13580 (0.0008) +[2023-10-08 16:15:13,657][21195] Updated weights for policy 0, policy_version 13690 (0.0007) +[2023-10-08 16:15:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 27885568. Throughput: 0: 1738.5, 1: 1716.7. Samples: 6989438. Policy #0 lag: (min: 13.0, avg: 17.0, max: 45.0) +[2023-10-08 16:15:13,803][19739] Avg episode reward: [(0, '253.810'), (1, '484.820')] +[2023-10-08 16:15:13,874][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000013696_14024704.pth... +[2023-10-08 16:15:13,912][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000012064_12353536.pth +[2023-10-08 16:15:14,019][21194] Updated weights for policy 1, policy_version 13590 (0.0008) +[2023-10-08 16:15:14,384][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000013600_13926400.pth... +[2023-10-08 16:15:14,385][21194] Updated weights for policy 1, policy_version 13600 (0.0010) +[2023-10-08 16:15:14,426][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000011968_12255232.pth +[2023-10-08 16:15:17,521][21195] Updated weights for policy 0, policy_version 13700 (0.0007) +[2023-10-08 16:15:17,892][21195] Updated weights for policy 0, policy_version 13710 (0.0009) +[2023-10-08 16:15:18,266][21195] Updated weights for policy 0, policy_version 13720 (0.0008) +[2023-10-08 16:15:18,505][21194] Updated weights for policy 1, policy_version 13610 (0.0007) +[2023-10-08 16:15:18,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 27983872. Throughput: 0: 1714.3, 1: 1711.2. Samples: 7003600. Policy #0 lag: (min: 2.0, avg: 10.1, max: 34.0) +[2023-10-08 16:15:18,803][19739] Avg episode reward: [(0, '248.640'), (1, '480.550')] +[2023-10-08 16:15:18,871][21194] Updated weights for policy 1, policy_version 13620 (0.0010) +[2023-10-08 16:15:19,245][21194] Updated weights for policy 1, policy_version 13630 (0.0007) +[2023-10-08 16:15:22,082][21195] Updated weights for policy 0, policy_version 13730 (0.0008) +[2023-10-08 16:15:22,451][21195] Updated weights for policy 0, policy_version 13740 (0.0008) +[2023-10-08 16:15:22,819][21195] Updated weights for policy 0, policy_version 13750 (0.0007) +[2023-10-08 16:15:23,134][21194] Updated weights for policy 1, policy_version 13640 (0.0008) +[2023-10-08 16:15:23,187][21195] Updated weights for policy 0, policy_version 13760 (0.0007) +[2023-10-08 16:15:23,500][21194] Updated weights for policy 1, policy_version 13650 (0.0007) +[2023-10-08 16:15:23,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 28049408. Throughput: 0: 1745.5, 1: 1715.5. Samples: 7020542. Policy #0 lag: (min: 2.0, avg: 10.1, max: 34.0) +[2023-10-08 16:15:23,804][19739] Avg episode reward: [(0, '243.430'), (1, '480.550')] +[2023-10-08 16:15:23,870][21194] Updated weights for policy 1, policy_version 13660 (0.0008) +[2023-10-08 16:15:27,286][21195] Updated weights for policy 0, policy_version 13770 (0.0007) +[2023-10-08 16:15:27,659][21195] Updated weights for policy 0, policy_version 13780 (0.0007) +[2023-10-08 16:15:27,687][21194] Updated weights for policy 1, policy_version 13670 (0.0009) +[2023-10-08 16:15:28,022][21195] Updated weights for policy 0, policy_version 13790 (0.0008) +[2023-10-08 16:15:28,055][21194] Updated weights for policy 1, policy_version 13680 (0.0008) +[2023-10-08 16:15:28,414][21194] Updated weights for policy 1, policy_version 13690 (0.0009) +[2023-10-08 16:15:28,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 28147712. Throughput: 0: 1720.1, 1: 1704.4. Samples: 7040382. Policy #0 lag: (min: 2.0, avg: 10.1, max: 34.0) +[2023-10-08 16:15:28,803][19739] Avg episode reward: [(0, '232.680'), (1, '476.150')] +[2023-10-08 16:15:32,010][21195] Updated weights for policy 0, policy_version 13800 (0.0009) +[2023-10-08 16:15:32,390][21195] Updated weights for policy 0, policy_version 13810 (0.0009) +[2023-10-08 16:15:32,394][21194] Updated weights for policy 1, policy_version 13700 (0.0007) +[2023-10-08 16:15:32,752][21195] Updated weights for policy 0, policy_version 13820 (0.0007) +[2023-10-08 16:15:32,756][21194] Updated weights for policy 1, policy_version 13710 (0.0007) +[2023-10-08 16:15:33,127][21194] Updated weights for policy 1, policy_version 13720 (0.0009) +[2023-10-08 16:15:33,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 28213248. Throughput: 0: 1709.8, 1: 1714.5. Samples: 7055742. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 16:15:33,803][19739] Avg episode reward: [(0, '225.610'), (1, '476.150')] +[2023-10-08 16:15:36,562][21195] Updated weights for policy 0, policy_version 13830 (0.0007) +[2023-10-08 16:15:36,935][21195] Updated weights for policy 0, policy_version 13840 (0.0008) +[2023-10-08 16:15:36,968][21194] Updated weights for policy 1, policy_version 13730 (0.0010) +[2023-10-08 16:15:37,308][21195] Updated weights for policy 0, policy_version 13850 (0.0009) +[2023-10-08 16:15:37,339][21194] Updated weights for policy 1, policy_version 13740 (0.0007) +[2023-10-08 16:15:37,705][21194] Updated weights for policy 1, policy_version 13750 (0.0007) +[2023-10-08 16:15:38,066][21194] Updated weights for policy 1, policy_version 13760 (0.0009) +[2023-10-08 16:15:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 28278784. Throughput: 0: 1729.5, 1: 1722.5. Samples: 7071982. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 16:15:38,803][19739] Avg episode reward: [(0, '225.610'), (1, '476.150')] +[2023-10-08 16:15:41,340][21195] Updated weights for policy 0, policy_version 13860 (0.0009) +[2023-10-08 16:15:41,717][21195] Updated weights for policy 0, policy_version 13870 (0.0010) +[2023-10-08 16:15:42,072][21194] Updated weights for policy 1, policy_version 13770 (0.0008) +[2023-10-08 16:15:42,087][21195] Updated weights for policy 0, policy_version 13880 (0.0008) +[2023-10-08 16:15:42,444][21194] Updated weights for policy 1, policy_version 13780 (0.0008) +[2023-10-08 16:15:42,816][21194] Updated weights for policy 1, policy_version 13790 (0.0009) +[2023-10-08 16:15:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 28344320. Throughput: 0: 1704.6, 1: 1695.3. Samples: 7091030. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 16:15:43,803][19739] Avg episode reward: [(0, '207.830'), (1, '486.940')] +[2023-10-08 16:15:46,167][21195] Updated weights for policy 0, policy_version 13890 (0.0008) +[2023-10-08 16:15:46,536][21195] Updated weights for policy 0, policy_version 13900 (0.0007) +[2023-10-08 16:15:46,869][21194] Updated weights for policy 1, policy_version 13800 (0.0009) +[2023-10-08 16:15:46,904][21195] Updated weights for policy 0, policy_version 13910 (0.0007) +[2023-10-08 16:15:47,244][21194] Updated weights for policy 1, policy_version 13810 (0.0008) +[2023-10-08 16:15:47,272][21195] Updated weights for policy 0, policy_version 13920 (0.0009) +[2023-10-08 16:15:47,618][21194] Updated weights for policy 1, policy_version 13820 (0.0008) +[2023-10-08 16:15:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 28409856. Throughput: 0: 1712.0, 1: 1728.0. Samples: 7107548. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:15:48,803][19739] Avg episode reward: [(0, '216.480'), (1, '479.940')] +[2023-10-08 16:15:51,286][21195] Updated weights for policy 0, policy_version 13930 (0.0008) +[2023-10-08 16:15:51,535][21194] Updated weights for policy 1, policy_version 13830 (0.0010) +[2023-10-08 16:15:51,653][21195] Updated weights for policy 0, policy_version 13940 (0.0009) +[2023-10-08 16:15:51,911][21194] Updated weights for policy 1, policy_version 13840 (0.0008) +[2023-10-08 16:15:52,026][21195] Updated weights for policy 0, policy_version 13950 (0.0009) +[2023-10-08 16:15:52,284][21194] Updated weights for policy 1, policy_version 13850 (0.0009) +[2023-10-08 16:15:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 28475392. Throughput: 0: 1710.3, 1: 1714.2. Samples: 7122430. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:15:53,803][19739] Avg episode reward: [(0, '210.380'), (1, '498.550')] +[2023-10-08 16:15:53,804][20836] Saving new best policy, reward=498.550! +[2023-10-08 16:15:56,076][21195] Updated weights for policy 0, policy_version 13960 (0.0009) +[2023-10-08 16:15:56,309][21194] Updated weights for policy 1, policy_version 13860 (0.0008) +[2023-10-08 16:15:56,446][21195] Updated weights for policy 0, policy_version 13970 (0.0008) +[2023-10-08 16:15:56,681][21194] Updated weights for policy 1, policy_version 13870 (0.0007) +[2023-10-08 16:15:56,812][21195] Updated weights for policy 0, policy_version 13980 (0.0008) +[2023-10-08 16:15:57,040][21194] Updated weights for policy 1, policy_version 13880 (0.0007) +[2023-10-08 16:15:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 28540928. Throughput: 0: 1704.7, 1: 1701.7. Samples: 7142726. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:15:58,804][19739] Avg episode reward: [(0, '210.380'), (1, '498.550')] +[2023-10-08 16:16:00,752][21195] Updated weights for policy 0, policy_version 13990 (0.0008) +[2023-10-08 16:16:01,011][21194] Updated weights for policy 1, policy_version 13890 (0.0009) +[2023-10-08 16:16:01,120][21195] Updated weights for policy 0, policy_version 14000 (0.0009) +[2023-10-08 16:16:01,378][21194] Updated weights for policy 1, policy_version 13900 (0.0010) +[2023-10-08 16:16:01,490][21195] Updated weights for policy 0, policy_version 14010 (0.0009) +[2023-10-08 16:16:01,748][21194] Updated weights for policy 1, policy_version 13910 (0.0009) +[2023-10-08 16:16:02,122][21194] Updated weights for policy 1, policy_version 13920 (0.0009) +[2023-10-08 16:16:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 28606464. Throughput: 0: 1732.3, 1: 1727.5. Samples: 7159290. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:16:03,804][19739] Avg episode reward: [(0, '205.540'), (1, '498.550')] +[2023-10-08 16:16:05,459][21195] Updated weights for policy 0, policy_version 14020 (0.0009) +[2023-10-08 16:16:05,826][21195] Updated weights for policy 0, policy_version 14030 (0.0008) +[2023-10-08 16:16:06,004][21194] Updated weights for policy 1, policy_version 13930 (0.0007) +[2023-10-08 16:16:06,196][21195] Updated weights for policy 0, policy_version 14040 (0.0009) +[2023-10-08 16:16:06,366][21194] Updated weights for policy 1, policy_version 13940 (0.0007) +[2023-10-08 16:16:06,733][21194] Updated weights for policy 1, policy_version 13950 (0.0008) +[2023-10-08 16:16:08,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 28672000. Throughput: 0: 1696.0, 1: 1697.4. Samples: 7173244. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:16:08,803][19739] Avg episode reward: [(0, '203.430'), (1, '492.570')] +[2023-10-08 16:16:10,043][21195] Updated weights for policy 0, policy_version 14050 (0.0008) +[2023-10-08 16:16:10,421][21195] Updated weights for policy 0, policy_version 14060 (0.0009) +[2023-10-08 16:16:10,680][21194] Updated weights for policy 1, policy_version 13960 (0.0009) +[2023-10-08 16:16:10,796][21195] Updated weights for policy 0, policy_version 14070 (0.0009) +[2023-10-08 16:16:11,040][21194] Updated weights for policy 1, policy_version 13970 (0.0007) +[2023-10-08 16:16:11,158][21195] Updated weights for policy 0, policy_version 14080 (0.0009) +[2023-10-08 16:16:11,406][21194] Updated weights for policy 1, policy_version 13980 (0.0007) +[2023-10-08 16:16:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 28737536. Throughput: 0: 1721.2, 1: 1712.8. Samples: 7194912. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:16:13,803][19739] Avg episode reward: [(0, '204.220'), (1, '484.010')] +[2023-10-08 16:16:14,908][21195] Updated weights for policy 0, policy_version 14090 (0.0007) +[2023-10-08 16:16:15,279][21195] Updated weights for policy 0, policy_version 14100 (0.0009) +[2023-10-08 16:16:15,311][21194] Updated weights for policy 1, policy_version 13990 (0.0008) +[2023-10-08 16:16:15,647][21195] Updated weights for policy 0, policy_version 14110 (0.0010) +[2023-10-08 16:16:15,675][21194] Updated weights for policy 1, policy_version 14000 (0.0009) +[2023-10-08 16:16:16,044][21194] Updated weights for policy 1, policy_version 14010 (0.0009) +[2023-10-08 16:16:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 28803072. Throughput: 0: 1735.2, 1: 1709.9. Samples: 7210770. Policy #0 lag: (min: 17.0, avg: 27.7, max: 49.0) +[2023-10-08 16:16:18,803][19739] Avg episode reward: [(0, '204.220'), (1, '476.650')] +[2023-10-08 16:16:19,646][21195] Updated weights for policy 0, policy_version 14120 (0.0008) +[2023-10-08 16:16:20,014][21195] Updated weights for policy 0, policy_version 14130 (0.0007) +[2023-10-08 16:16:20,080][21194] Updated weights for policy 1, policy_version 14020 (0.0008) +[2023-10-08 16:16:20,380][21195] Updated weights for policy 0, policy_version 14140 (0.0007) +[2023-10-08 16:16:20,455][21194] Updated weights for policy 1, policy_version 14030 (0.0009) +[2023-10-08 16:16:20,818][21194] Updated weights for policy 1, policy_version 14040 (0.0009) +[2023-10-08 16:16:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 28868608. Throughput: 0: 1717.1, 1: 1700.2. Samples: 7225758. Policy #0 lag: (min: 17.0, avg: 27.7, max: 49.0) +[2023-10-08 16:16:23,803][19739] Avg episode reward: [(0, '209.380'), (1, '476.880')] +[2023-10-08 16:16:24,269][21195] Updated weights for policy 0, policy_version 14150 (0.0008) +[2023-10-08 16:16:24,647][21195] Updated weights for policy 0, policy_version 14160 (0.0008) +[2023-10-08 16:16:24,916][21194] Updated weights for policy 1, policy_version 14050 (0.0009) +[2023-10-08 16:16:25,025][21195] Updated weights for policy 0, policy_version 14170 (0.0007) +[2023-10-08 16:16:25,278][21194] Updated weights for policy 1, policy_version 14060 (0.0010) +[2023-10-08 16:16:25,641][21194] Updated weights for policy 1, policy_version 14070 (0.0009) +[2023-10-08 16:16:26,008][21194] Updated weights for policy 1, policy_version 14080 (0.0009) +[2023-10-08 16:16:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 28934144. Throughput: 0: 1742.9, 1: 1726.7. Samples: 7247162. Policy #0 lag: (min: 17.0, avg: 27.7, max: 49.0) +[2023-10-08 16:16:28,803][19739] Avg episode reward: [(0, '202.600'), (1, '476.880')] +[2023-10-08 16:16:28,953][21195] Updated weights for policy 0, policy_version 14180 (0.0007) +[2023-10-08 16:16:29,337][21195] Updated weights for policy 0, policy_version 14190 (0.0007) +[2023-10-08 16:16:29,708][21195] Updated weights for policy 0, policy_version 14200 (0.0008) +[2023-10-08 16:16:29,880][21194] Updated weights for policy 1, policy_version 14090 (0.0009) +[2023-10-08 16:16:30,244][21194] Updated weights for policy 1, policy_version 14100 (0.0012) +[2023-10-08 16:16:30,612][21194] Updated weights for policy 1, policy_version 14110 (0.0008) +[2023-10-08 16:16:33,692][21195] Updated weights for policy 0, policy_version 14210 (0.0009) +[2023-10-08 16:16:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 28999680. Throughput: 0: 1739.4, 1: 1694.7. Samples: 7262082. Policy #0 lag: (min: 31.0, avg: 32.7, max: 58.0) +[2023-10-08 16:16:33,804][19739] Avg episode reward: [(0, '201.460'), (1, '476.880')] +[2023-10-08 16:16:34,058][21195] Updated weights for policy 0, policy_version 14220 (0.0010) +[2023-10-08 16:16:34,434][21195] Updated weights for policy 0, policy_version 14230 (0.0008) +[2023-10-08 16:16:34,487][21194] Updated weights for policy 1, policy_version 14120 (0.0008) +[2023-10-08 16:16:34,810][21195] Updated weights for policy 0, policy_version 14240 (0.0009) +[2023-10-08 16:16:34,853][21194] Updated weights for policy 1, policy_version 14130 (0.0008) +[2023-10-08 16:16:35,224][21194] Updated weights for policy 1, policy_version 14140 (0.0008) +[2023-10-08 16:16:38,668][21195] Updated weights for policy 0, policy_version 14250 (0.0009) +[2023-10-08 16:16:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 29065216. Throughput: 0: 1730.6, 1: 1718.3. Samples: 7277630. Policy #0 lag: (min: 31.0, avg: 32.7, max: 58.0) +[2023-10-08 16:16:38,803][19739] Avg episode reward: [(0, '204.210'), (1, '476.880')] +[2023-10-08 16:16:39,044][21195] Updated weights for policy 0, policy_version 14260 (0.0009) +[2023-10-08 16:16:39,258][21194] Updated weights for policy 1, policy_version 14150 (0.0007) +[2023-10-08 16:16:39,409][21195] Updated weights for policy 0, policy_version 14270 (0.0008) +[2023-10-08 16:16:39,621][21194] Updated weights for policy 1, policy_version 14160 (0.0007) +[2023-10-08 16:16:39,987][21194] Updated weights for policy 1, policy_version 14170 (0.0008) +[2023-10-08 16:16:43,449][21195] Updated weights for policy 0, policy_version 14280 (0.0008) +[2023-10-08 16:16:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 29130752. Throughput: 0: 1739.2, 1: 1732.6. Samples: 7298956. Policy #0 lag: (min: 31.0, avg: 32.7, max: 58.0) +[2023-10-08 16:16:43,803][19739] Avg episode reward: [(0, '199.150'), (1, '476.880')] +[2023-10-08 16:16:43,814][21195] Updated weights for policy 0, policy_version 14290 (0.0007) +[2023-10-08 16:16:43,901][21194] Updated weights for policy 1, policy_version 14180 (0.0009) +[2023-10-08 16:16:44,182][21195] Updated weights for policy 0, policy_version 14300 (0.0009) +[2023-10-08 16:16:44,276][21194] Updated weights for policy 1, policy_version 14190 (0.0008) +[2023-10-08 16:16:44,641][21194] Updated weights for policy 1, policy_version 14200 (0.0010) +[2023-10-08 16:16:48,130][21195] Updated weights for policy 0, policy_version 14310 (0.0008) +[2023-10-08 16:16:48,508][21195] Updated weights for policy 0, policy_version 14320 (0.0007) +[2023-10-08 16:16:48,566][21194] Updated weights for policy 1, policy_version 14210 (0.0008) +[2023-10-08 16:16:48,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 29196288. Throughput: 0: 1714.0, 1: 1708.1. Samples: 7313284. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:16:48,804][19739] Avg episode reward: [(0, '209.610'), (1, '467.730')] +[2023-10-08 16:16:48,872][21195] Updated weights for policy 0, policy_version 14330 (0.0007) +[2023-10-08 16:16:48,934][21194] Updated weights for policy 1, policy_version 14220 (0.0008) +[2023-10-08 16:16:49,304][21194] Updated weights for policy 1, policy_version 14230 (0.0007) +[2023-10-08 16:16:49,672][21194] Updated weights for policy 1, policy_version 14240 (0.0007) +[2023-10-08 16:16:52,876][21195] Updated weights for policy 0, policy_version 14340 (0.0011) +[2023-10-08 16:16:53,242][21195] Updated weights for policy 0, policy_version 14350 (0.0009) +[2023-10-08 16:16:53,600][21194] Updated weights for policy 1, policy_version 14250 (0.0008) +[2023-10-08 16:16:53,610][21195] Updated weights for policy 0, policy_version 14360 (0.0008) +[2023-10-08 16:16:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 29261824. Throughput: 0: 1737.2, 1: 1737.1. Samples: 7329590. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:16:53,803][19739] Avg episode reward: [(0, '209.610'), (1, '467.730')] +[2023-10-08 16:16:53,968][21194] Updated weights for policy 1, policy_version 14260 (0.0008) +[2023-10-08 16:16:54,335][21194] Updated weights for policy 1, policy_version 14270 (0.0007) +[2023-10-08 16:16:57,491][21195] Updated weights for policy 0, policy_version 14370 (0.0008) +[2023-10-08 16:16:57,862][21195] Updated weights for policy 0, policy_version 14380 (0.0008) +[2023-10-08 16:16:58,203][21194] Updated weights for policy 1, policy_version 14280 (0.0007) +[2023-10-08 16:16:58,226][21195] Updated weights for policy 0, policy_version 14390 (0.0008) +[2023-10-08 16:16:58,574][21194] Updated weights for policy 1, policy_version 14290 (0.0008) +[2023-10-08 16:16:58,593][21195] Updated weights for policy 0, policy_version 14400 (0.0007) +[2023-10-08 16:16:58,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 29360128. Throughput: 0: 1726.5, 1: 1733.2. Samples: 7350602. Policy #0 lag: (min: 8.0, avg: 34.1, max: 40.0) +[2023-10-08 16:16:58,803][19739] Avg episode reward: [(0, '216.870'), (1, '472.110')] +[2023-10-08 16:16:58,933][21194] Updated weights for policy 1, policy_version 14300 (0.0009) +[2023-10-08 16:17:02,523][21195] Updated weights for policy 0, policy_version 14410 (0.0010) +[2023-10-08 16:17:02,891][21195] Updated weights for policy 0, policy_version 14420 (0.0009) +[2023-10-08 16:17:02,950][21194] Updated weights for policy 1, policy_version 14310 (0.0009) +[2023-10-08 16:17:03,266][21195] Updated weights for policy 0, policy_version 14430 (0.0009) +[2023-10-08 16:17:03,326][21194] Updated weights for policy 1, policy_version 14320 (0.0007) +[2023-10-08 16:17:03,694][21194] Updated weights for policy 1, policy_version 14330 (0.0010) +[2023-10-08 16:17:03,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 29425664. Throughput: 0: 1706.4, 1: 1727.7. Samples: 7365306. Policy #0 lag: (min: 8.0, avg: 34.1, max: 40.0) +[2023-10-08 16:17:03,803][19739] Avg episode reward: [(0, '217.330'), (1, '485.680')] +[2023-10-08 16:17:07,152][21195] Updated weights for policy 0, policy_version 14440 (0.0009) +[2023-10-08 16:17:07,520][21195] Updated weights for policy 0, policy_version 14450 (0.0009) +[2023-10-08 16:17:07,821][21194] Updated weights for policy 1, policy_version 14340 (0.0009) +[2023-10-08 16:17:07,886][21195] Updated weights for policy 0, policy_version 14460 (0.0008) +[2023-10-08 16:17:08,185][21194] Updated weights for policy 1, policy_version 14350 (0.0008) +[2023-10-08 16:17:08,546][21194] Updated weights for policy 1, policy_version 14360 (0.0008) +[2023-10-08 16:17:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 29491200. Throughput: 0: 1737.1, 1: 1732.8. Samples: 7381902. Policy #0 lag: (min: 8.0, avg: 34.1, max: 40.0) +[2023-10-08 16:17:08,803][19739] Avg episode reward: [(0, '217.330'), (1, '485.680')] +[2023-10-08 16:17:11,790][21195] Updated weights for policy 0, policy_version 14470 (0.0009) +[2023-10-08 16:17:12,165][21195] Updated weights for policy 0, policy_version 14480 (0.0009) +[2023-10-08 16:17:12,501][21194] Updated weights for policy 1, policy_version 14370 (0.0008) +[2023-10-08 16:17:12,534][21195] Updated weights for policy 0, policy_version 14490 (0.0008) +[2023-10-08 16:17:12,869][21194] Updated weights for policy 1, policy_version 14380 (0.0007) +[2023-10-08 16:17:13,230][21194] Updated weights for policy 1, policy_version 14390 (0.0007) +[2023-10-08 16:17:13,599][21194] Updated weights for policy 1, policy_version 14400 (0.0008) +[2023-10-08 16:17:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29589504. Throughput: 0: 1702.9, 1: 1721.2. Samples: 7401244. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:17:13,803][19739] Avg episode reward: [(0, '220.010'), (1, '485.680')] +[2023-10-08 16:17:13,810][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000014496_14843904.pth... +[2023-10-08 16:17:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000014400_14745600.pth... +[2023-10-08 16:17:13,841][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000012896_13205504.pth +[2023-10-08 16:17:13,854][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000012800_13107200.pth +[2023-10-08 16:17:16,429][21195] Updated weights for policy 0, policy_version 14500 (0.0009) +[2023-10-08 16:17:16,831][21195] Updated weights for policy 0, policy_version 14510 (0.0011) +[2023-10-08 16:17:17,197][21195] Updated weights for policy 0, policy_version 14520 (0.0007) +[2023-10-08 16:17:17,470][21194] Updated weights for policy 1, policy_version 14410 (0.0007) +[2023-10-08 16:17:17,846][21194] Updated weights for policy 1, policy_version 14420 (0.0007) +[2023-10-08 16:17:18,213][21194] Updated weights for policy 1, policy_version 14430 (0.0007) +[2023-10-08 16:17:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29655040. Throughput: 0: 1714.8, 1: 1733.0. Samples: 7417230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:17:18,803][19739] Avg episode reward: [(0, '220.010'), (1, '498.920')] +[2023-10-08 16:17:18,804][20836] Saving new best policy, reward=498.920! +[2023-10-08 16:17:21,076][21195] Updated weights for policy 0, policy_version 14530 (0.0007) +[2023-10-08 16:17:21,440][21195] Updated weights for policy 0, policy_version 14540 (0.0008) +[2023-10-08 16:17:21,809][21195] Updated weights for policy 0, policy_version 14550 (0.0011) +[2023-10-08 16:17:22,181][21195] Updated weights for policy 0, policy_version 14560 (0.0008) +[2023-10-08 16:17:22,278][21194] Updated weights for policy 1, policy_version 14440 (0.0007) +[2023-10-08 16:17:22,661][21194] Updated weights for policy 1, policy_version 14450 (0.0007) +[2023-10-08 16:17:23,023][21194] Updated weights for policy 1, policy_version 14460 (0.0007) +[2023-10-08 16:17:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29720576. Throughput: 0: 1721.6, 1: 1726.8. Samples: 7432806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:17:23,803][19739] Avg episode reward: [(0, '220.010'), (1, '498.920')] +[2023-10-08 16:17:26,047][21195] Updated weights for policy 0, policy_version 14570 (0.0008) +[2023-10-08 16:17:26,420][21195] Updated weights for policy 0, policy_version 14580 (0.0007) +[2023-10-08 16:17:26,794][21195] Updated weights for policy 0, policy_version 14590 (0.0007) +[2023-10-08 16:17:26,991][21194] Updated weights for policy 1, policy_version 14470 (0.0007) +[2023-10-08 16:17:27,360][21194] Updated weights for policy 1, policy_version 14480 (0.0007) +[2023-10-08 16:17:27,718][21194] Updated weights for policy 1, policy_version 14490 (0.0007) +[2023-10-08 16:17:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29786112. Throughput: 0: 1716.0, 1: 1692.8. Samples: 7452354. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 16:17:28,803][19739] Avg episode reward: [(0, '213.830'), (1, '498.920')] +[2023-10-08 16:17:30,673][21195] Updated weights for policy 0, policy_version 14600 (0.0007) +[2023-10-08 16:17:31,046][21195] Updated weights for policy 0, policy_version 14610 (0.0010) +[2023-10-08 16:17:31,412][21195] Updated weights for policy 0, policy_version 14620 (0.0008) +[2023-10-08 16:17:31,827][21194] Updated weights for policy 1, policy_version 14500 (0.0009) +[2023-10-08 16:17:32,190][21194] Updated weights for policy 1, policy_version 14510 (0.0009) +[2023-10-08 16:17:32,551][21194] Updated weights for policy 1, policy_version 14520 (0.0010) +[2023-10-08 16:17:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29851648. Throughput: 0: 1736.3, 1: 1719.3. Samples: 7468784. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 16:17:33,804][19739] Avg episode reward: [(0, '220.190'), (1, '498.920')] +[2023-10-08 16:17:35,343][21195] Updated weights for policy 0, policy_version 14630 (0.0008) +[2023-10-08 16:17:35,717][21195] Updated weights for policy 0, policy_version 14640 (0.0008) +[2023-10-08 16:17:36,087][21195] Updated weights for policy 0, policy_version 14650 (0.0007) +[2023-10-08 16:17:36,637][21194] Updated weights for policy 1, policy_version 14530 (0.0008) +[2023-10-08 16:17:36,996][21194] Updated weights for policy 1, policy_version 14540 (0.0011) +[2023-10-08 16:17:37,363][21194] Updated weights for policy 1, policy_version 14550 (0.0011) +[2023-10-08 16:17:37,730][21194] Updated weights for policy 1, policy_version 14560 (0.0011) +[2023-10-08 16:17:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29917184. Throughput: 0: 1717.5, 1: 1701.0. Samples: 7483422. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 16:17:38,803][19739] Avg episode reward: [(0, '213.890'), (1, '498.180')] +[2023-10-08 16:17:39,958][21195] Updated weights for policy 0, policy_version 14660 (0.0008) +[2023-10-08 16:17:40,325][21195] Updated weights for policy 0, policy_version 14670 (0.0010) +[2023-10-08 16:17:40,687][21195] Updated weights for policy 0, policy_version 14680 (0.0011) +[2023-10-08 16:17:41,632][21194] Updated weights for policy 1, policy_version 14570 (0.0007) +[2023-10-08 16:17:42,003][21194] Updated weights for policy 1, policy_version 14580 (0.0007) +[2023-10-08 16:17:42,368][21194] Updated weights for policy 1, policy_version 14590 (0.0007) +[2023-10-08 16:17:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 29982720. Throughput: 0: 1733.8, 1: 1684.8. Samples: 7504442. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:17:43,803][19739] Avg episode reward: [(0, '208.660'), (1, '498.180')] +[2023-10-08 16:17:44,623][21195] Updated weights for policy 0, policy_version 14690 (0.0009) +[2023-10-08 16:17:44,988][21195] Updated weights for policy 0, policy_version 14700 (0.0007) +[2023-10-08 16:17:45,355][21195] Updated weights for policy 0, policy_version 14710 (0.0008) +[2023-10-08 16:17:45,722][21195] Updated weights for policy 0, policy_version 14720 (0.0009) +[2023-10-08 16:17:46,435][21194] Updated weights for policy 1, policy_version 14600 (0.0007) +[2023-10-08 16:17:46,808][21194] Updated weights for policy 1, policy_version 14610 (0.0010) +[2023-10-08 16:17:47,177][21194] Updated weights for policy 1, policy_version 14620 (0.0010) +[2023-10-08 16:17:48,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 30048256. Throughput: 0: 1750.6, 1: 1711.1. Samples: 7521086. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:17:48,804][19739] Avg episode reward: [(0, '208.330'), (1, '498.180')] +[2023-10-08 16:17:49,779][21195] Updated weights for policy 0, policy_version 14730 (0.0009) +[2023-10-08 16:17:50,147][21195] Updated weights for policy 0, policy_version 14740 (0.0008) +[2023-10-08 16:17:50,512][21195] Updated weights for policy 0, policy_version 14750 (0.0007) +[2023-10-08 16:17:51,227][21194] Updated weights for policy 1, policy_version 14630 (0.0010) +[2023-10-08 16:17:51,587][21194] Updated weights for policy 1, policy_version 14640 (0.0010) +[2023-10-08 16:17:51,958][21194] Updated weights for policy 1, policy_version 14650 (0.0009) +[2023-10-08 16:17:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 30113792. Throughput: 0: 1716.3, 1: 1688.6. Samples: 7535120. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:17:53,803][19739] Avg episode reward: [(0, '221.420'), (1, '506.620')] +[2023-10-08 16:17:53,804][20836] Saving new best policy, reward=506.620! +[2023-10-08 16:17:54,567][21195] Updated weights for policy 0, policy_version 14760 (0.0007) +[2023-10-08 16:17:54,934][21195] Updated weights for policy 0, policy_version 14770 (0.0008) +[2023-10-08 16:17:55,305][21195] Updated weights for policy 0, policy_version 14780 (0.0008) +[2023-10-08 16:17:55,989][21194] Updated weights for policy 1, policy_version 14660 (0.0007) +[2023-10-08 16:17:56,350][21194] Updated weights for policy 1, policy_version 14670 (0.0007) +[2023-10-08 16:17:56,717][21194] Updated weights for policy 1, policy_version 14680 (0.0008) +[2023-10-08 16:17:58,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 30179328. Throughput: 0: 1750.4, 1: 1697.8. Samples: 7556410. Policy #0 lag: (min: 14.0, avg: 25.0, max: 46.0) +[2023-10-08 16:17:58,803][19739] Avg episode reward: [(0, '221.820'), (1, '506.620')] +[2023-10-08 16:17:59,193][21195] Updated weights for policy 0, policy_version 14790 (0.0008) +[2023-10-08 16:17:59,562][21195] Updated weights for policy 0, policy_version 14800 (0.0010) +[2023-10-08 16:17:59,933][21195] Updated weights for policy 0, policy_version 14810 (0.0007) +[2023-10-08 16:18:00,592][21194] Updated weights for policy 1, policy_version 14690 (0.0008) +[2023-10-08 16:18:00,961][21194] Updated weights for policy 1, policy_version 14700 (0.0010) +[2023-10-08 16:18:01,327][21194] Updated weights for policy 1, policy_version 14710 (0.0009) +[2023-10-08 16:18:01,685][21194] Updated weights for policy 1, policy_version 14720 (0.0008) +[2023-10-08 16:18:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 30244864. Throughput: 0: 1743.6, 1: 1703.7. Samples: 7572356. Policy #0 lag: (min: 14.0, avg: 25.0, max: 46.0) +[2023-10-08 16:18:03,803][19739] Avg episode reward: [(0, '221.820'), (1, '506.620')] +[2023-10-08 16:18:03,810][21195] Updated weights for policy 0, policy_version 14820 (0.0008) +[2023-10-08 16:18:04,202][21195] Updated weights for policy 0, policy_version 14830 (0.0007) +[2023-10-08 16:18:04,566][21195] Updated weights for policy 0, policy_version 14840 (0.0009) +[2023-10-08 16:18:05,686][21194] Updated weights for policy 1, policy_version 14730 (0.0009) +[2023-10-08 16:18:06,060][21194] Updated weights for policy 1, policy_version 14740 (0.0007) +[2023-10-08 16:18:06,429][21194] Updated weights for policy 1, policy_version 14750 (0.0007) +[2023-10-08 16:18:08,584][21195] Updated weights for policy 0, policy_version 14850 (0.0011) +[2023-10-08 16:18:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 30310400. Throughput: 0: 1733.4, 1: 1691.1. Samples: 7586910. Policy #0 lag: (min: 14.0, avg: 25.0, max: 46.0) +[2023-10-08 16:18:08,803][19739] Avg episode reward: [(0, '221.820'), (1, '506.620')] +[2023-10-08 16:18:08,942][21195] Updated weights for policy 0, policy_version 14860 (0.0008) +[2023-10-08 16:18:09,317][21195] Updated weights for policy 0, policy_version 14870 (0.0009) +[2023-10-08 16:18:09,688][21195] Updated weights for policy 0, policy_version 14880 (0.0009) +[2023-10-08 16:18:10,314][21194] Updated weights for policy 1, policy_version 14760 (0.0010) +[2023-10-08 16:18:10,688][21194] Updated weights for policy 1, policy_version 14770 (0.0009) +[2023-10-08 16:18:11,049][21194] Updated weights for policy 1, policy_version 14780 (0.0010) +[2023-10-08 16:18:13,650][21195] Updated weights for policy 0, policy_version 14890 (0.0009) +[2023-10-08 16:18:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 30375936. Throughput: 0: 1738.4, 1: 1720.0. Samples: 7607982. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:18:13,803][19739] Avg episode reward: [(0, '221.980'), (1, '506.620')] +[2023-10-08 16:18:14,030][21195] Updated weights for policy 0, policy_version 14900 (0.0010) +[2023-10-08 16:18:14,390][21195] Updated weights for policy 0, policy_version 14910 (0.0010) +[2023-10-08 16:18:15,112][21194] Updated weights for policy 1, policy_version 14790 (0.0009) +[2023-10-08 16:18:15,477][21194] Updated weights for policy 1, policy_version 14800 (0.0009) +[2023-10-08 16:18:15,851][21194] Updated weights for policy 1, policy_version 14810 (0.0008) +[2023-10-08 16:18:18,522][21195] Updated weights for policy 0, policy_version 14920 (0.0010) +[2023-10-08 16:18:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 30441472. Throughput: 0: 1723.7, 1: 1696.0. Samples: 7622670. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:18:18,803][19739] Avg episode reward: [(0, '221.980'), (1, '506.620')] +[2023-10-08 16:18:18,889][21195] Updated weights for policy 0, policy_version 14930 (0.0011) +[2023-10-08 16:18:19,263][21195] Updated weights for policy 0, policy_version 14940 (0.0011) +[2023-10-08 16:18:19,756][21194] Updated weights for policy 1, policy_version 14820 (0.0011) +[2023-10-08 16:18:20,122][21194] Updated weights for policy 1, policy_version 14830 (0.0007) +[2023-10-08 16:18:20,483][21194] Updated weights for policy 1, policy_version 14840 (0.0008) +[2023-10-08 16:18:23,172][21195] Updated weights for policy 0, policy_version 14950 (0.0010) +[2023-10-08 16:18:23,552][21195] Updated weights for policy 0, policy_version 14960 (0.0010) +[2023-10-08 16:18:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 30507008. Throughput: 0: 1733.6, 1: 1708.5. Samples: 7638320. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:18:23,803][19739] Avg episode reward: [(0, '228.340'), (1, '506.620')] +[2023-10-08 16:18:23,921][21195] Updated weights for policy 0, policy_version 14970 (0.0009) +[2023-10-08 16:18:24,529][21194] Updated weights for policy 1, policy_version 14850 (0.0008) +[2023-10-08 16:18:24,895][21194] Updated weights for policy 1, policy_version 14860 (0.0008) +[2023-10-08 16:18:25,260][21194] Updated weights for policy 1, policy_version 14870 (0.0007) +[2023-10-08 16:18:25,623][21194] Updated weights for policy 1, policy_version 14880 (0.0007) +[2023-10-08 16:18:27,798][21195] Updated weights for policy 0, policy_version 14980 (0.0008) +[2023-10-08 16:18:28,171][21195] Updated weights for policy 0, policy_version 14990 (0.0008) +[2023-10-08 16:18:28,537][21195] Updated weights for policy 0, policy_version 15000 (0.0009) +[2023-10-08 16:18:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 30572544. Throughput: 0: 1722.8, 1: 1728.2. Samples: 7659736. Policy #0 lag: (min: 5.0, avg: 5.0, max: 6.0) +[2023-10-08 16:18:28,803][19739] Avg episode reward: [(0, '228.590'), (1, '514.250')] +[2023-10-08 16:18:28,811][20836] Saving new best policy, reward=514.250! +[2023-10-08 16:18:29,414][21194] Updated weights for policy 1, policy_version 14890 (0.0007) +[2023-10-08 16:18:29,782][21194] Updated weights for policy 1, policy_version 14900 (0.0007) +[2023-10-08 16:18:30,160][21194] Updated weights for policy 1, policy_version 14910 (0.0007) +[2023-10-08 16:18:32,362][21195] Updated weights for policy 0, policy_version 15010 (0.0009) +[2023-10-08 16:18:32,741][21195] Updated weights for policy 0, policy_version 15020 (0.0009) +[2023-10-08 16:18:33,116][21195] Updated weights for policy 0, policy_version 15030 (0.0009) +[2023-10-08 16:18:33,485][21195] Updated weights for policy 0, policy_version 15040 (0.0008) +[2023-10-08 16:18:33,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 30670848. Throughput: 0: 1698.6, 1: 1696.7. Samples: 7673876. Policy #0 lag: (min: 5.0, avg: 5.0, max: 6.0) +[2023-10-08 16:18:33,804][19739] Avg episode reward: [(0, '234.200'), (1, '521.020')] +[2023-10-08 16:18:34,135][21194] Updated weights for policy 1, policy_version 14920 (0.0009) +[2023-10-08 16:18:34,508][21194] Updated weights for policy 1, policy_version 14930 (0.0007) +[2023-10-08 16:18:34,869][21194] Updated weights for policy 1, policy_version 14940 (0.0008) +[2023-10-08 16:18:35,011][20836] Saving new best policy, reward=521.020! +[2023-10-08 16:18:37,410][21195] Updated weights for policy 0, policy_version 15050 (0.0008) +[2023-10-08 16:18:37,780][21195] Updated weights for policy 0, policy_version 15060 (0.0008) +[2023-10-08 16:18:38,150][21195] Updated weights for policy 0, policy_version 15070 (0.0008) +[2023-10-08 16:18:38,735][21194] Updated weights for policy 1, policy_version 14950 (0.0008) +[2023-10-08 16:18:38,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 30736384. Throughput: 0: 1730.6, 1: 1726.8. Samples: 7690704. Policy #0 lag: (min: 23.0, avg: 23.3, max: 35.0) +[2023-10-08 16:18:38,803][19739] Avg episode reward: [(0, '233.040'), (1, '521.020')] +[2023-10-08 16:18:39,101][21194] Updated weights for policy 1, policy_version 14960 (0.0009) +[2023-10-08 16:18:39,471][21194] Updated weights for policy 1, policy_version 14970 (0.0010) +[2023-10-08 16:18:41,930][21195] Updated weights for policy 0, policy_version 15080 (0.0010) +[2023-10-08 16:18:42,294][21195] Updated weights for policy 0, policy_version 15090 (0.0010) +[2023-10-08 16:18:42,682][21195] Updated weights for policy 0, policy_version 15100 (0.0010) +[2023-10-08 16:18:43,467][21194] Updated weights for policy 1, policy_version 14980 (0.0008) +[2023-10-08 16:18:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 30801920. Throughput: 0: 1700.2, 1: 1730.5. Samples: 7710790. Policy #0 lag: (min: 23.0, avg: 23.3, max: 35.0) +[2023-10-08 16:18:43,803][19739] Avg episode reward: [(0, '233.040'), (1, '521.460')] +[2023-10-08 16:18:43,835][21194] Updated weights for policy 1, policy_version 14990 (0.0008) +[2023-10-08 16:18:44,203][21194] Updated weights for policy 1, policy_version 15000 (0.0009) +[2023-10-08 16:18:44,488][20836] Saving new best policy, reward=521.460! +[2023-10-08 16:18:46,705][21195] Updated weights for policy 0, policy_version 15110 (0.0009) +[2023-10-08 16:18:47,071][21195] Updated weights for policy 0, policy_version 15120 (0.0008) +[2023-10-08 16:18:47,444][21195] Updated weights for policy 0, policy_version 15130 (0.0010) +[2023-10-08 16:18:48,192][21194] Updated weights for policy 1, policy_version 15010 (0.0008) +[2023-10-08 16:18:48,556][21194] Updated weights for policy 1, policy_version 15020 (0.0011) +[2023-10-08 16:18:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 30867456. Throughput: 0: 1700.1, 1: 1713.0. Samples: 7725944. Policy #0 lag: (min: 23.0, avg: 23.3, max: 35.0) +[2023-10-08 16:18:48,803][19739] Avg episode reward: [(0, '240.690'), (1, '521.460')] +[2023-10-08 16:18:48,926][21194] Updated weights for policy 1, policy_version 15030 (0.0011) +[2023-10-08 16:18:49,291][21194] Updated weights for policy 1, policy_version 15040 (0.0009) +[2023-10-08 16:18:51,607][21195] Updated weights for policy 0, policy_version 15140 (0.0010) +[2023-10-08 16:18:51,989][21195] Updated weights for policy 0, policy_version 15150 (0.0007) +[2023-10-08 16:18:52,348][21195] Updated weights for policy 0, policy_version 15160 (0.0008) +[2023-10-08 16:18:53,301][21194] Updated weights for policy 1, policy_version 15050 (0.0007) +[2023-10-08 16:18:53,663][21194] Updated weights for policy 1, policy_version 15060 (0.0008) +[2023-10-08 16:18:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 30932992. Throughput: 0: 1717.6, 1: 1727.7. Samples: 7741950. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 16:18:53,803][19739] Avg episode reward: [(0, '229.020'), (1, '521.460')] +[2023-10-08 16:18:54,032][21194] Updated weights for policy 1, policy_version 15070 (0.0008) +[2023-10-08 16:18:56,090][21195] Updated weights for policy 0, policy_version 15170 (0.0009) +[2023-10-08 16:18:56,461][21195] Updated weights for policy 0, policy_version 15180 (0.0010) +[2023-10-08 16:18:56,830][21195] Updated weights for policy 0, policy_version 15190 (0.0009) +[2023-10-08 16:18:57,204][21195] Updated weights for policy 0, policy_version 15200 (0.0009) +[2023-10-08 16:18:58,076][21194] Updated weights for policy 1, policy_version 15080 (0.0009) +[2023-10-08 16:18:58,445][21194] Updated weights for policy 1, policy_version 15090 (0.0007) +[2023-10-08 16:18:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 30998528. Throughput: 0: 1706.7, 1: 1729.3. Samples: 7762602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 16:18:58,803][19739] Avg episode reward: [(0, '230.050'), (1, '521.460')] +[2023-10-08 16:18:58,809][21194] Updated weights for policy 1, policy_version 15100 (0.0007) +[2023-10-08 16:19:01,064][21195] Updated weights for policy 0, policy_version 15210 (0.0008) +[2023-10-08 16:19:01,437][21195] Updated weights for policy 0, policy_version 15220 (0.0009) +[2023-10-08 16:19:01,816][21195] Updated weights for policy 0, policy_version 15230 (0.0009) +[2023-10-08 16:19:02,685][21194] Updated weights for policy 1, policy_version 15110 (0.0007) +[2023-10-08 16:19:03,064][21194] Updated weights for policy 1, policy_version 15120 (0.0008) +[2023-10-08 16:19:03,435][21194] Updated weights for policy 1, policy_version 15130 (0.0010) +[2023-10-08 16:19:03,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 31096832. Throughput: 0: 1731.4, 1: 1732.6. Samples: 7778548. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 16:19:03,804][19739] Avg episode reward: [(0, '216.200'), (1, '511.530')] +[2023-10-08 16:19:05,716][21195] Updated weights for policy 0, policy_version 15240 (0.0009) +[2023-10-08 16:19:06,092][21195] Updated weights for policy 0, policy_version 15250 (0.0008) +[2023-10-08 16:19:06,469][21195] Updated weights for policy 0, policy_version 15260 (0.0010) +[2023-10-08 16:19:07,415][21194] Updated weights for policy 1, policy_version 15140 (0.0008) +[2023-10-08 16:19:07,776][21194] Updated weights for policy 1, policy_version 15150 (0.0009) +[2023-10-08 16:19:08,142][21194] Updated weights for policy 1, policy_version 15160 (0.0008) +[2023-10-08 16:19:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 31162368. Throughput: 0: 1719.8, 1: 1740.4. Samples: 7794026. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 16:19:08,803][19739] Avg episode reward: [(0, '218.590'), (1, '511.530')] +[2023-10-08 16:19:10,444][21195] Updated weights for policy 0, policy_version 15270 (0.0010) +[2023-10-08 16:19:10,822][21195] Updated weights for policy 0, policy_version 15280 (0.0009) +[2023-10-08 16:19:11,190][21195] Updated weights for policy 0, policy_version 15290 (0.0010) +[2023-10-08 16:19:12,089][21194] Updated weights for policy 1, policy_version 15170 (0.0008) +[2023-10-08 16:19:12,459][21194] Updated weights for policy 1, policy_version 15180 (0.0008) +[2023-10-08 16:19:12,822][21194] Updated weights for policy 1, policy_version 15190 (0.0010) +[2023-10-08 16:19:13,190][21194] Updated weights for policy 1, policy_version 15200 (0.0007) +[2023-10-08 16:19:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 31227904. Throughput: 0: 1722.3, 1: 1713.9. Samples: 7814368. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 16:19:13,804][19739] Avg episode reward: [(0, '221.250'), (1, '506.880')] +[2023-10-08 16:19:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000015200_15564800.pth... +[2023-10-08 16:19:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000015296_15663104.pth... +[2023-10-08 16:19:13,846][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000013696_14024704.pth +[2023-10-08 16:19:13,847][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000013600_13926400.pth +[2023-10-08 16:19:15,081][21195] Updated weights for policy 0, policy_version 15300 (0.0008) +[2023-10-08 16:19:15,456][21195] Updated weights for policy 0, policy_version 15310 (0.0008) +[2023-10-08 16:19:15,824][21195] Updated weights for policy 0, policy_version 15320 (0.0008) +[2023-10-08 16:19:17,105][21194] Updated weights for policy 1, policy_version 15210 (0.0007) +[2023-10-08 16:19:17,462][21194] Updated weights for policy 1, policy_version 15220 (0.0010) +[2023-10-08 16:19:17,827][21194] Updated weights for policy 1, policy_version 15230 (0.0010) +[2023-10-08 16:19:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 31293440. Throughput: 0: 1742.6, 1: 1739.8. Samples: 7830584. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 16:19:18,803][19739] Avg episode reward: [(0, '221.250'), (1, '509.350')] +[2023-10-08 16:19:19,788][21195] Updated weights for policy 0, policy_version 15330 (0.0009) +[2023-10-08 16:19:20,159][21195] Updated weights for policy 0, policy_version 15340 (0.0010) +[2023-10-08 16:19:20,530][21195] Updated weights for policy 0, policy_version 15350 (0.0008) +[2023-10-08 16:19:20,903][21195] Updated weights for policy 0, policy_version 15360 (0.0010) +[2023-10-08 16:19:21,901][21194] Updated weights for policy 1, policy_version 15240 (0.0008) +[2023-10-08 16:19:22,264][21194] Updated weights for policy 1, policy_version 15250 (0.0008) +[2023-10-08 16:19:22,631][21194] Updated weights for policy 1, policy_version 15260 (0.0007) +[2023-10-08 16:19:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 31358976. Throughput: 0: 1714.1, 1: 1718.7. Samples: 7845180. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:19:23,803][19739] Avg episode reward: [(0, '231.870'), (1, '515.140')] +[2023-10-08 16:19:24,831][21195] Updated weights for policy 0, policy_version 15370 (0.0008) +[2023-10-08 16:19:25,200][21195] Updated weights for policy 0, policy_version 15380 (0.0008) +[2023-10-08 16:19:25,573][21195] Updated weights for policy 0, policy_version 15390 (0.0008) +[2023-10-08 16:19:26,543][21194] Updated weights for policy 1, policy_version 15270 (0.0007) +[2023-10-08 16:19:26,911][21194] Updated weights for policy 1, policy_version 15280 (0.0007) +[2023-10-08 16:19:27,288][21194] Updated weights for policy 1, policy_version 15290 (0.0010) +[2023-10-08 16:19:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 31424512. Throughput: 0: 1748.1, 1: 1700.0. Samples: 7865954. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:19:28,803][19739] Avg episode reward: [(0, '231.010'), (1, '515.140')] +[2023-10-08 16:19:29,398][21195] Updated weights for policy 0, policy_version 15400 (0.0007) +[2023-10-08 16:19:29,768][21195] Updated weights for policy 0, policy_version 15410 (0.0008) +[2023-10-08 16:19:30,149][21195] Updated weights for policy 0, policy_version 15420 (0.0009) +[2023-10-08 16:19:31,288][21194] Updated weights for policy 1, policy_version 15300 (0.0008) +[2023-10-08 16:19:31,657][21194] Updated weights for policy 1, policy_version 15310 (0.0009) +[2023-10-08 16:19:32,021][21194] Updated weights for policy 1, policy_version 15320 (0.0009) +[2023-10-08 16:19:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 31490048. Throughput: 0: 1756.4, 1: 1728.4. Samples: 7882760. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:19:33,803][19739] Avg episode reward: [(0, '231.010'), (1, '526.030')] +[2023-10-08 16:19:33,804][20836] Saving new best policy, reward=526.030! +[2023-10-08 16:19:34,063][21195] Updated weights for policy 0, policy_version 15430 (0.0010) +[2023-10-08 16:19:34,432][21195] Updated weights for policy 0, policy_version 15440 (0.0009) +[2023-10-08 16:19:34,808][21195] Updated weights for policy 0, policy_version 15450 (0.0007) +[2023-10-08 16:19:36,025][21194] Updated weights for policy 1, policy_version 15330 (0.0007) +[2023-10-08 16:19:36,385][21194] Updated weights for policy 1, policy_version 15340 (0.0009) +[2023-10-08 16:19:36,754][21194] Updated weights for policy 1, policy_version 15350 (0.0007) +[2023-10-08 16:19:37,118][21194] Updated weights for policy 1, policy_version 15360 (0.0007) +[2023-10-08 16:19:38,593][21195] Updated weights for policy 0, policy_version 15460 (0.0007) +[2023-10-08 16:19:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 31555584. Throughput: 0: 1745.8, 1: 1703.9. Samples: 7897184. Policy #0 lag: (min: 30.0, avg: 35.7, max: 62.0) +[2023-10-08 16:19:38,803][19739] Avg episode reward: [(0, '231.010'), (1, '538.570')] +[2023-10-08 16:19:38,804][20836] Saving new best policy, reward=538.570! +[2023-10-08 16:19:38,989][21195] Updated weights for policy 0, policy_version 15470 (0.0008) +[2023-10-08 16:19:39,354][21195] Updated weights for policy 0, policy_version 15480 (0.0007) +[2023-10-08 16:19:41,058][21194] Updated weights for policy 1, policy_version 15370 (0.0009) +[2023-10-08 16:19:41,425][21194] Updated weights for policy 1, policy_version 15380 (0.0007) +[2023-10-08 16:19:41,795][21194] Updated weights for policy 1, policy_version 15390 (0.0009) +[2023-10-08 16:19:43,279][21195] Updated weights for policy 0, policy_version 15490 (0.0009) +[2023-10-08 16:19:43,642][21195] Updated weights for policy 0, policy_version 15500 (0.0007) +[2023-10-08 16:19:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 31621120. Throughput: 0: 1760.7, 1: 1700.9. Samples: 7918372. Policy #0 lag: (min: 30.0, avg: 35.7, max: 62.0) +[2023-10-08 16:19:43,803][19739] Avg episode reward: [(0, '231.690'), (1, '538.570')] +[2023-10-08 16:19:44,009][21195] Updated weights for policy 0, policy_version 15510 (0.0008) +[2023-10-08 16:19:44,381][21195] Updated weights for policy 0, policy_version 15520 (0.0007) +[2023-10-08 16:19:45,781][21194] Updated weights for policy 1, policy_version 15400 (0.0008) +[2023-10-08 16:19:46,163][21194] Updated weights for policy 1, policy_version 15410 (0.0008) +[2023-10-08 16:19:46,526][21194] Updated weights for policy 1, policy_version 15420 (0.0007) +[2023-10-08 16:19:48,041][21195] Updated weights for policy 0, policy_version 15530 (0.0010) +[2023-10-08 16:19:48,414][21195] Updated weights for policy 0, policy_version 15540 (0.0008) +[2023-10-08 16:19:48,784][21195] Updated weights for policy 0, policy_version 15550 (0.0010) +[2023-10-08 16:19:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 31686656. Throughput: 0: 1734.3, 1: 1709.4. Samples: 7933514. Policy #0 lag: (min: 30.0, avg: 35.7, max: 62.0) +[2023-10-08 16:19:48,803][19739] Avg episode reward: [(0, '225.730'), (1, '534.310')] +[2023-10-08 16:19:50,408][21194] Updated weights for policy 1, policy_version 15430 (0.0009) +[2023-10-08 16:19:50,772][21194] Updated weights for policy 1, policy_version 15440 (0.0007) +[2023-10-08 16:19:51,142][21194] Updated weights for policy 1, policy_version 15450 (0.0007) +[2023-10-08 16:19:52,734][21195] Updated weights for policy 0, policy_version 15560 (0.0009) +[2023-10-08 16:19:53,112][21195] Updated weights for policy 0, policy_version 15570 (0.0010) +[2023-10-08 16:19:53,497][21195] Updated weights for policy 0, policy_version 15580 (0.0010) +[2023-10-08 16:19:53,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 31784960. Throughput: 0: 1763.0, 1: 1688.0. Samples: 7949320. Policy #0 lag: (min: 31.0, avg: 42.9, max: 63.0) +[2023-10-08 16:19:53,803][19739] Avg episode reward: [(0, '225.730'), (1, '534.310')] +[2023-10-08 16:19:54,957][21194] Updated weights for policy 1, policy_version 15460 (0.0007) +[2023-10-08 16:19:55,327][21194] Updated weights for policy 1, policy_version 15470 (0.0007) +[2023-10-08 16:19:55,695][21194] Updated weights for policy 1, policy_version 15480 (0.0007) +[2023-10-08 16:19:57,228][21195] Updated weights for policy 0, policy_version 15590 (0.0011) +[2023-10-08 16:19:57,595][21195] Updated weights for policy 0, policy_version 15600 (0.0009) +[2023-10-08 16:19:57,964][21195] Updated weights for policy 0, policy_version 15610 (0.0011) +[2023-10-08 16:19:58,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 31850496. Throughput: 0: 1749.6, 1: 1715.4. Samples: 7970290. Policy #0 lag: (min: 31.0, avg: 42.9, max: 63.0) +[2023-10-08 16:19:58,803][19739] Avg episode reward: [(0, '227.800'), (1, '548.440')] +[2023-10-08 16:19:58,812][20836] Saving new best policy, reward=548.440! +[2023-10-08 16:19:59,790][21194] Updated weights for policy 1, policy_version 15490 (0.0008) +[2023-10-08 16:20:00,165][21194] Updated weights for policy 1, policy_version 15500 (0.0009) +[2023-10-08 16:20:00,532][21194] Updated weights for policy 1, policy_version 15510 (0.0009) +[2023-10-08 16:20:00,888][21194] Updated weights for policy 1, policy_version 15520 (0.0011) +[2023-10-08 16:20:01,905][21195] Updated weights for policy 0, policy_version 15620 (0.0010) +[2023-10-08 16:20:02,275][21195] Updated weights for policy 0, policy_version 15630 (0.0008) +[2023-10-08 16:20:02,642][21195] Updated weights for policy 0, policy_version 15640 (0.0007) +[2023-10-08 16:20:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 31916032. Throughput: 0: 1744.4, 1: 1689.6. Samples: 7985116. Policy #0 lag: (min: 15.0, avg: 23.8, max: 47.0) +[2023-10-08 16:20:03,803][19739] Avg episode reward: [(0, '229.620'), (1, '562.030')] +[2023-10-08 16:20:03,804][20836] Saving new best policy, reward=562.030! +[2023-10-08 16:20:04,827][21194] Updated weights for policy 1, policy_version 15530 (0.0009) +[2023-10-08 16:20:05,190][21194] Updated weights for policy 1, policy_version 15540 (0.0011) +[2023-10-08 16:20:05,556][21194] Updated weights for policy 1, policy_version 15550 (0.0010) +[2023-10-08 16:20:06,469][21195] Updated weights for policy 0, policy_version 15650 (0.0007) +[2023-10-08 16:20:06,847][21195] Updated weights for policy 0, policy_version 15660 (0.0010) +[2023-10-08 16:20:07,213][21195] Updated weights for policy 0, policy_version 15670 (0.0008) +[2023-10-08 16:20:07,584][21195] Updated weights for policy 0, policy_version 15680 (0.0010) +[2023-10-08 16:20:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 31981568. Throughput: 0: 1766.5, 1: 1713.1. Samples: 8001764. Policy #0 lag: (min: 15.0, avg: 23.8, max: 47.0) +[2023-10-08 16:20:08,803][19739] Avg episode reward: [(0, '229.620'), (1, '585.040')] +[2023-10-08 16:20:08,804][20836] Saving new best policy, reward=585.040! +[2023-10-08 16:20:09,305][21194] Updated weights for policy 1, policy_version 15560 (0.0011) +[2023-10-08 16:20:09,674][21194] Updated weights for policy 1, policy_version 15570 (0.0009) +[2023-10-08 16:20:10,041][21194] Updated weights for policy 1, policy_version 15580 (0.0007) +[2023-10-08 16:20:11,555][21195] Updated weights for policy 0, policy_version 15690 (0.0008) +[2023-10-08 16:20:11,922][21195] Updated weights for policy 0, policy_version 15700 (0.0009) +[2023-10-08 16:20:12,290][21195] Updated weights for policy 0, policy_version 15710 (0.0008) +[2023-10-08 16:20:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 32047104. Throughput: 0: 1737.1, 1: 1733.0. Samples: 8022110. Policy #0 lag: (min: 15.0, avg: 23.8, max: 47.0) +[2023-10-08 16:20:13,803][19739] Avg episode reward: [(0, '224.730'), (1, '585.040')] +[2023-10-08 16:20:13,968][21194] Updated weights for policy 1, policy_version 15590 (0.0008) +[2023-10-08 16:20:14,338][21194] Updated weights for policy 1, policy_version 15600 (0.0009) +[2023-10-08 16:20:14,704][21194] Updated weights for policy 1, policy_version 15610 (0.0008) +[2023-10-08 16:20:16,227][21195] Updated weights for policy 0, policy_version 15720 (0.0011) +[2023-10-08 16:20:16,593][21195] Updated weights for policy 0, policy_version 15730 (0.0010) +[2023-10-08 16:20:16,963][21195] Updated weights for policy 0, policy_version 15740 (0.0009) +[2023-10-08 16:20:18,692][21194] Updated weights for policy 1, policy_version 15620 (0.0008) +[2023-10-08 16:20:18,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 32112640. Throughput: 0: 1734.7, 1: 1704.8. Samples: 8037536. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:20:18,804][19739] Avg episode reward: [(0, '224.730'), (1, '600.230')] +[2023-10-08 16:20:19,058][21194] Updated weights for policy 1, policy_version 15630 (0.0009) +[2023-10-08 16:20:19,428][21194] Updated weights for policy 1, policy_version 15640 (0.0010) +[2023-10-08 16:20:19,722][20836] Saving new best policy, reward=600.230! +[2023-10-08 16:20:20,980][21195] Updated weights for policy 0, policy_version 15750 (0.0007) +[2023-10-08 16:20:21,345][21195] Updated weights for policy 0, policy_version 15760 (0.0009) +[2023-10-08 16:20:21,717][21195] Updated weights for policy 0, policy_version 15770 (0.0011) +[2023-10-08 16:20:23,624][21194] Updated weights for policy 1, policy_version 15650 (0.0010) +[2023-10-08 16:20:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 32178176. Throughput: 0: 1738.2, 1: 1729.5. Samples: 8053230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:20:23,803][19739] Avg episode reward: [(0, '224.730'), (1, '615.190')] +[2023-10-08 16:20:23,986][21194] Updated weights for policy 1, policy_version 15660 (0.0010) +[2023-10-08 16:20:24,353][21194] Updated weights for policy 1, policy_version 15670 (0.0008) +[2023-10-08 16:20:24,715][20836] Saving new best policy, reward=615.190! +[2023-10-08 16:20:24,721][21194] Updated weights for policy 1, policy_version 15680 (0.0007) +[2023-10-08 16:20:25,519][21195] Updated weights for policy 0, policy_version 15780 (0.0010) +[2023-10-08 16:20:25,891][21195] Updated weights for policy 0, policy_version 15790 (0.0009) +[2023-10-08 16:20:26,269][21195] Updated weights for policy 0, policy_version 15800 (0.0008) +[2023-10-08 16:20:28,752][21194] Updated weights for policy 1, policy_version 15690 (0.0007) +[2023-10-08 16:20:28,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 32243712. Throughput: 0: 1731.5, 1: 1729.8. Samples: 8074128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:20:28,803][19739] Avg episode reward: [(0, '221.200'), (1, '615.190')] +[2023-10-08 16:20:29,124][21194] Updated weights for policy 1, policy_version 15700 (0.0008) +[2023-10-08 16:20:29,500][21194] Updated weights for policy 1, policy_version 15710 (0.0011) +[2023-10-08 16:20:30,026][21195] Updated weights for policy 0, policy_version 15810 (0.0007) +[2023-10-08 16:20:30,388][21195] Updated weights for policy 0, policy_version 15820 (0.0008) +[2023-10-08 16:20:30,759][21195] Updated weights for policy 0, policy_version 15830 (0.0010) +[2023-10-08 16:20:31,136][21195] Updated weights for policy 0, policy_version 15840 (0.0009) +[2023-10-08 16:20:33,468][21194] Updated weights for policy 1, policy_version 15720 (0.0008) +[2023-10-08 16:20:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 32309248. Throughput: 0: 1756.6, 1: 1717.8. Samples: 8089862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:20:33,804][19739] Avg episode reward: [(0, '221.200'), (1, '615.190')] +[2023-10-08 16:20:33,851][21194] Updated weights for policy 1, policy_version 15730 (0.0009) +[2023-10-08 16:20:34,211][21194] Updated weights for policy 1, policy_version 15740 (0.0008) +[2023-10-08 16:20:34,876][21195] Updated weights for policy 0, policy_version 15850 (0.0009) +[2023-10-08 16:20:35,243][21195] Updated weights for policy 0, policy_version 15860 (0.0009) +[2023-10-08 16:20:35,607][21195] Updated weights for policy 0, policy_version 15870 (0.0009) +[2023-10-08 16:20:38,222][21194] Updated weights for policy 1, policy_version 15750 (0.0007) +[2023-10-08 16:20:38,592][21194] Updated weights for policy 1, policy_version 15760 (0.0007) +[2023-10-08 16:20:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 32374784. Throughput: 0: 1729.2, 1: 1733.2. Samples: 8105130. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:20:38,803][19739] Avg episode reward: [(0, '225.450'), (1, '619.180')] +[2023-10-08 16:20:38,950][21194] Updated weights for policy 1, policy_version 15770 (0.0007) +[2023-10-08 16:20:39,165][20836] Saving new best policy, reward=619.180! +[2023-10-08 16:20:39,753][21195] Updated weights for policy 0, policy_version 15880 (0.0010) +[2023-10-08 16:20:40,127][21195] Updated weights for policy 0, policy_version 15890 (0.0011) +[2023-10-08 16:20:40,496][21195] Updated weights for policy 0, policy_version 15900 (0.0008) +[2023-10-08 16:20:42,948][21194] Updated weights for policy 1, policy_version 15780 (0.0007) +[2023-10-08 16:20:43,314][21194] Updated weights for policy 1, policy_version 15790 (0.0010) +[2023-10-08 16:20:43,686][21194] Updated weights for policy 1, policy_version 15800 (0.0010) +[2023-10-08 16:20:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 32440320. Throughput: 0: 1737.4, 1: 1722.3. Samples: 8125978. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:20:43,804][19739] Avg episode reward: [(0, '229.470'), (1, '619.180')] +[2023-10-08 16:20:44,299][21195] Updated weights for policy 0, policy_version 15910 (0.0008) +[2023-10-08 16:20:44,673][21195] Updated weights for policy 0, policy_version 15920 (0.0008) +[2023-10-08 16:20:45,036][21195] Updated weights for policy 0, policy_version 15930 (0.0009) +[2023-10-08 16:20:47,632][21194] Updated weights for policy 1, policy_version 15810 (0.0008) +[2023-10-08 16:20:47,994][21194] Updated weights for policy 1, policy_version 15820 (0.0009) +[2023-10-08 16:20:48,355][21194] Updated weights for policy 1, policy_version 15830 (0.0010) +[2023-10-08 16:20:48,725][21194] Updated weights for policy 1, policy_version 15840 (0.0008) +[2023-10-08 16:20:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 32538624. Throughput: 0: 1749.6, 1: 1732.2. Samples: 8141796. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 16:20:48,803][19739] Avg episode reward: [(0, '236.460'), (1, '619.180')] +[2023-10-08 16:20:49,028][21195] Updated weights for policy 0, policy_version 15940 (0.0009) +[2023-10-08 16:20:49,395][21195] Updated weights for policy 0, policy_version 15950 (0.0011) +[2023-10-08 16:20:49,766][21195] Updated weights for policy 0, policy_version 15960 (0.0011) +[2023-10-08 16:20:52,836][21194] Updated weights for policy 1, policy_version 15850 (0.0007) +[2023-10-08 16:20:53,209][21194] Updated weights for policy 1, policy_version 15860 (0.0008) +[2023-10-08 16:20:53,570][21194] Updated weights for policy 1, policy_version 15870 (0.0008) +[2023-10-08 16:20:53,681][21195] Updated weights for policy 0, policy_version 15970 (0.0011) +[2023-10-08 16:20:53,802][19739] Fps is (10 sec: 16384.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 32604160. Throughput: 0: 1725.7, 1: 1720.5. Samples: 8156846. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 16:20:53,803][19739] Avg episode reward: [(0, '250.060'), (1, '627.120')] +[2023-10-08 16:20:53,804][20836] Saving new best policy, reward=627.120! +[2023-10-08 16:20:54,048][21195] Updated weights for policy 0, policy_version 15980 (0.0007) +[2023-10-08 16:20:54,423][21195] Updated weights for policy 0, policy_version 15990 (0.0011) +[2023-10-08 16:20:54,795][21195] Updated weights for policy 0, policy_version 16000 (0.0011) +[2023-10-08 16:20:57,435][21194] Updated weights for policy 1, policy_version 15880 (0.0007) +[2023-10-08 16:20:57,796][21194] Updated weights for policy 1, policy_version 15890 (0.0007) +[2023-10-08 16:20:58,165][21194] Updated weights for policy 1, policy_version 15900 (0.0008) +[2023-10-08 16:20:58,703][21195] Updated weights for policy 0, policy_version 16010 (0.0009) +[2023-10-08 16:20:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 32669696. Throughput: 0: 1752.1, 1: 1702.1. Samples: 8177552. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 16:20:58,803][19739] Avg episode reward: [(0, '252.870'), (1, '627.120')] +[2023-10-08 16:20:59,077][21195] Updated weights for policy 0, policy_version 16020 (0.0010) +[2023-10-08 16:20:59,443][21195] Updated weights for policy 0, policy_version 16030 (0.0009) +[2023-10-08 16:21:02,177][21194] Updated weights for policy 1, policy_version 15910 (0.0009) +[2023-10-08 16:21:02,543][21194] Updated weights for policy 1, policy_version 15920 (0.0009) +[2023-10-08 16:21:02,904][21194] Updated weights for policy 1, policy_version 15930 (0.0007) +[2023-10-08 16:21:03,503][21195] Updated weights for policy 0, policy_version 16040 (0.0008) +[2023-10-08 16:21:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 32735232. Throughput: 0: 1736.2, 1: 1723.3. Samples: 8193212. Policy #0 lag: (min: 23.0, avg: 28.9, max: 55.0) +[2023-10-08 16:21:03,803][19739] Avg episode reward: [(0, '252.870'), (1, '627.120')] +[2023-10-08 16:21:03,877][21195] Updated weights for policy 0, policy_version 16050 (0.0009) +[2023-10-08 16:21:04,246][21195] Updated weights for policy 0, policy_version 16060 (0.0012) +[2023-10-08 16:21:06,654][21194] Updated weights for policy 1, policy_version 15940 (0.0009) +[2023-10-08 16:21:07,024][21194] Updated weights for policy 1, policy_version 15950 (0.0008) +[2023-10-08 16:21:07,391][21194] Updated weights for policy 1, policy_version 15960 (0.0007) +[2023-10-08 16:21:07,973][21195] Updated weights for policy 0, policy_version 16070 (0.0009) +[2023-10-08 16:21:08,338][21195] Updated weights for policy 0, policy_version 16080 (0.0008) +[2023-10-08 16:21:08,714][21195] Updated weights for policy 0, policy_version 16090 (0.0007) +[2023-10-08 16:21:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 32800768. Throughput: 0: 1739.4, 1: 1711.5. Samples: 8208518. Policy #0 lag: (min: 23.0, avg: 28.9, max: 55.0) +[2023-10-08 16:21:08,803][19739] Avg episode reward: [(0, '248.810'), (1, '627.120')] +[2023-10-08 16:21:11,121][21194] Updated weights for policy 1, policy_version 15970 (0.0008) +[2023-10-08 16:21:11,481][21194] Updated weights for policy 1, policy_version 15980 (0.0007) +[2023-10-08 16:21:11,849][21194] Updated weights for policy 1, policy_version 15990 (0.0008) +[2023-10-08 16:21:12,214][21194] Updated weights for policy 1, policy_version 16000 (0.0008) +[2023-10-08 16:21:12,790][21195] Updated weights for policy 0, policy_version 16100 (0.0007) +[2023-10-08 16:21:13,189][21195] Updated weights for policy 0, policy_version 16110 (0.0007) +[2023-10-08 16:21:13,565][21195] Updated weights for policy 0, policy_version 16120 (0.0009) +[2023-10-08 16:21:13,803][19739] Fps is (10 sec: 13106.6, 60 sec: 13653.2, 300 sec: 13773.7). Total num frames: 32866304. Throughput: 0: 1740.1, 1: 1703.8. Samples: 8229104. Policy #0 lag: (min: 23.0, avg: 28.9, max: 55.0) +[2023-10-08 16:21:13,804][19739] Avg episode reward: [(0, '248.810'), (1, '628.570')] +[2023-10-08 16:21:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000016000_16384000.pth... +[2023-10-08 16:21:13,854][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000014400_14745600.pth +[2023-10-08 16:21:13,856][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000016128_16515072.pth... +[2023-10-08 16:21:13,858][20836] Saving new best policy, reward=628.570! +[2023-10-08 16:21:13,886][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000014496_14843904.pth +[2023-10-08 16:21:13,890][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000016128_16515072.pth +[2023-10-08 16:21:13,891][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000016000_16384000.pth +[2023-10-08 16:21:16,286][21194] Updated weights for policy 1, policy_version 16010 (0.0008) +[2023-10-08 16:21:16,656][21194] Updated weights for policy 1, policy_version 16020 (0.0007) +[2023-10-08 16:21:17,029][21194] Updated weights for policy 1, policy_version 16030 (0.0008) +[2023-10-08 16:21:17,381][21195] Updated weights for policy 0, policy_version 16130 (0.0008) +[2023-10-08 16:21:17,749][21195] Updated weights for policy 0, policy_version 16140 (0.0009) +[2023-10-08 16:21:18,118][21195] Updated weights for policy 0, policy_version 16150 (0.0007) +[2023-10-08 16:21:18,488][21195] Updated weights for policy 0, policy_version 16160 (0.0010) +[2023-10-08 16:21:18,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 32964608. Throughput: 0: 1706.0, 1: 1728.7. Samples: 8244422. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:21:18,803][19739] Avg episode reward: [(0, '248.810'), (1, '643.340')] +[2023-10-08 16:21:18,804][20836] Saving new best policy, reward=643.340! +[2023-10-08 16:21:20,932][21194] Updated weights for policy 1, policy_version 16040 (0.0010) +[2023-10-08 16:21:21,291][21194] Updated weights for policy 1, policy_version 16050 (0.0008) +[2023-10-08 16:21:21,666][21194] Updated weights for policy 1, policy_version 16060 (0.0008) +[2023-10-08 16:21:22,566][21195] Updated weights for policy 0, policy_version 16170 (0.0007) +[2023-10-08 16:21:22,941][21195] Updated weights for policy 0, policy_version 16180 (0.0007) +[2023-10-08 16:21:23,309][21195] Updated weights for policy 0, policy_version 16190 (0.0008) +[2023-10-08 16:21:23,803][19739] Fps is (10 sec: 16384.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 33030144. Throughput: 0: 1735.0, 1: 1705.7. Samples: 8259960. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:21:23,803][19739] Avg episode reward: [(0, '249.650'), (1, '634.780')] +[2023-10-08 16:21:25,792][21194] Updated weights for policy 1, policy_version 16070 (0.0007) +[2023-10-08 16:21:26,162][21194] Updated weights for policy 1, policy_version 16080 (0.0007) +[2023-10-08 16:21:26,529][21194] Updated weights for policy 1, policy_version 16090 (0.0009) +[2023-10-08 16:21:27,032][21195] Updated weights for policy 0, policy_version 16200 (0.0008) +[2023-10-08 16:21:27,406][21195] Updated weights for policy 0, policy_version 16210 (0.0008) +[2023-10-08 16:21:27,774][21195] Updated weights for policy 0, policy_version 16220 (0.0009) +[2023-10-08 16:21:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 33095680. Throughput: 0: 1722.1, 1: 1710.8. Samples: 8280458. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:21:28,803][19739] Avg episode reward: [(0, '249.650'), (1, '634.780')] +[2023-10-08 16:21:30,573][21194] Updated weights for policy 1, policy_version 16100 (0.0007) +[2023-10-08 16:21:30,943][21194] Updated weights for policy 1, policy_version 16110 (0.0008) +[2023-10-08 16:21:31,301][21194] Updated weights for policy 1, policy_version 16120 (0.0009) +[2023-10-08 16:21:31,775][21195] Updated weights for policy 0, policy_version 16230 (0.0008) +[2023-10-08 16:21:32,145][21195] Updated weights for policy 0, policy_version 16240 (0.0008) +[2023-10-08 16:21:32,527][21195] Updated weights for policy 0, policy_version 16250 (0.0009) +[2023-10-08 16:21:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 33161216. Throughput: 0: 1712.6, 1: 1716.9. Samples: 8296126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:21:33,803][19739] Avg episode reward: [(0, '251.490'), (1, '640.960')] +[2023-10-08 16:21:35,137][21194] Updated weights for policy 1, policy_version 16130 (0.0007) +[2023-10-08 16:21:35,501][21194] Updated weights for policy 1, policy_version 16140 (0.0008) +[2023-10-08 16:21:35,866][21194] Updated weights for policy 1, policy_version 16150 (0.0009) +[2023-10-08 16:21:36,229][21194] Updated weights for policy 1, policy_version 16160 (0.0008) +[2023-10-08 16:21:36,545][21195] Updated weights for policy 0, policy_version 16260 (0.0010) +[2023-10-08 16:21:36,915][21195] Updated weights for policy 0, policy_version 16270 (0.0007) +[2023-10-08 16:21:37,293][21195] Updated weights for policy 0, policy_version 16280 (0.0010) +[2023-10-08 16:21:38,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 33226752. Throughput: 0: 1729.8, 1: 1711.9. Samples: 8311722. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:21:38,803][19739] Avg episode reward: [(0, '260.720'), (1, '640.960')] +[2023-10-08 16:21:40,077][21194] Updated weights for policy 1, policy_version 16170 (0.0009) +[2023-10-08 16:21:40,442][21194] Updated weights for policy 1, policy_version 16180 (0.0007) +[2023-10-08 16:21:40,805][21194] Updated weights for policy 1, policy_version 16190 (0.0009) +[2023-10-08 16:21:41,089][21195] Updated weights for policy 0, policy_version 16290 (0.0008) +[2023-10-08 16:21:41,457][21195] Updated weights for policy 0, policy_version 16300 (0.0007) +[2023-10-08 16:21:41,824][21195] Updated weights for policy 0, policy_version 16310 (0.0009) +[2023-10-08 16:21:42,186][21195] Updated weights for policy 0, policy_version 16320 (0.0011) +[2023-10-08 16:21:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 33292288. Throughput: 0: 1711.2, 1: 1732.8. Samples: 8332534. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 16:21:43,803][19739] Avg episode reward: [(0, '260.720'), (1, '640.960')] +[2023-10-08 16:21:44,802][21194] Updated weights for policy 1, policy_version 16200 (0.0007) +[2023-10-08 16:21:45,178][21194] Updated weights for policy 1, policy_version 16210 (0.0008) +[2023-10-08 16:21:45,547][21194] Updated weights for policy 1, policy_version 16220 (0.0008) +[2023-10-08 16:21:46,142][21195] Updated weights for policy 0, policy_version 16330 (0.0007) +[2023-10-08 16:21:46,507][21195] Updated weights for policy 0, policy_version 16340 (0.0007) +[2023-10-08 16:21:46,882][21195] Updated weights for policy 0, policy_version 16350 (0.0007) +[2023-10-08 16:21:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 33357824. Throughput: 0: 1725.9, 1: 1712.7. Samples: 8347946. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 16:21:48,803][19739] Avg episode reward: [(0, '260.720'), (1, '640.960')] +[2023-10-08 16:21:49,296][21194] Updated weights for policy 1, policy_version 16230 (0.0008) +[2023-10-08 16:21:49,656][21194] Updated weights for policy 1, policy_version 16240 (0.0007) +[2023-10-08 16:21:50,022][21194] Updated weights for policy 1, policy_version 16250 (0.0007) +[2023-10-08 16:21:50,894][21195] Updated weights for policy 0, policy_version 16360 (0.0009) +[2023-10-08 16:21:51,264][21195] Updated weights for policy 0, policy_version 16370 (0.0008) +[2023-10-08 16:21:51,641][21195] Updated weights for policy 0, policy_version 16380 (0.0009) +[2023-10-08 16:21:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 33423360. Throughput: 0: 1716.7, 1: 1728.6. Samples: 8363558. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 16:21:53,804][19739] Avg episode reward: [(0, '266.800'), (1, '640.960')] +[2023-10-08 16:21:54,132][21194] Updated weights for policy 1, policy_version 16260 (0.0009) +[2023-10-08 16:21:54,489][21194] Updated weights for policy 1, policy_version 16270 (0.0008) +[2023-10-08 16:21:54,859][21194] Updated weights for policy 1, policy_version 16280 (0.0008) +[2023-10-08 16:21:55,397][21195] Updated weights for policy 0, policy_version 16390 (0.0009) +[2023-10-08 16:21:55,763][21195] Updated weights for policy 0, policy_version 16400 (0.0010) +[2023-10-08 16:21:56,138][21195] Updated weights for policy 0, policy_version 16410 (0.0009) +[2023-10-08 16:21:58,767][21194] Updated weights for policy 1, policy_version 16290 (0.0008) +[2023-10-08 16:21:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 33488896. Throughput: 0: 1720.3, 1: 1737.8. Samples: 8384718. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:21:58,803][19739] Avg episode reward: [(0, '269.400'), (1, '640.960')] +[2023-10-08 16:21:59,135][21194] Updated weights for policy 1, policy_version 16300 (0.0009) +[2023-10-08 16:21:59,509][21194] Updated weights for policy 1, policy_version 16310 (0.0008) +[2023-10-08 16:21:59,871][21194] Updated weights for policy 1, policy_version 16320 (0.0010) +[2023-10-08 16:22:00,074][21195] Updated weights for policy 0, policy_version 16420 (0.0009) +[2023-10-08 16:22:00,468][21195] Updated weights for policy 0, policy_version 16430 (0.0008) +[2023-10-08 16:22:00,829][21195] Updated weights for policy 0, policy_version 16440 (0.0010) +[2023-10-08 16:22:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 33554432. Throughput: 0: 1747.8, 1: 1711.2. Samples: 8400078. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:03,804][19739] Avg episode reward: [(0, '269.540'), (1, '640.960')] +[2023-10-08 16:22:03,907][21194] Updated weights for policy 1, policy_version 16330 (0.0010) +[2023-10-08 16:22:04,279][21194] Updated weights for policy 1, policy_version 16340 (0.0010) +[2023-10-08 16:22:04,639][21194] Updated weights for policy 1, policy_version 16350 (0.0008) +[2023-10-08 16:22:04,813][21195] Updated weights for policy 0, policy_version 16450 (0.0008) +[2023-10-08 16:22:05,181][21195] Updated weights for policy 0, policy_version 16460 (0.0009) +[2023-10-08 16:22:05,554][21195] Updated weights for policy 0, policy_version 16470 (0.0009) +[2023-10-08 16:22:05,925][21195] Updated weights for policy 0, policy_version 16480 (0.0007) +[2023-10-08 16:22:08,626][21194] Updated weights for policy 1, policy_version 16360 (0.0008) +[2023-10-08 16:22:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 33619968. Throughput: 0: 1718.8, 1: 1735.2. Samples: 8415394. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:08,803][19739] Avg episode reward: [(0, '266.680'), (1, '640.960')] +[2023-10-08 16:22:08,999][21194] Updated weights for policy 1, policy_version 16370 (0.0007) +[2023-10-08 16:22:09,362][21194] Updated weights for policy 1, policy_version 16380 (0.0008) +[2023-10-08 16:22:09,757][21195] Updated weights for policy 0, policy_version 16490 (0.0008) +[2023-10-08 16:22:10,130][21195] Updated weights for policy 0, policy_version 16500 (0.0008) +[2023-10-08 16:22:10,500][21195] Updated weights for policy 0, policy_version 16510 (0.0008) +[2023-10-08 16:22:13,494][21194] Updated weights for policy 1, policy_version 16390 (0.0008) +[2023-10-08 16:22:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 33685504. Throughput: 0: 1740.3, 1: 1732.5. Samples: 8436736. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:13,803][19739] Avg episode reward: [(0, '263.930'), (1, '633.670')] +[2023-10-08 16:22:13,864][21194] Updated weights for policy 1, policy_version 16400 (0.0008) +[2023-10-08 16:22:14,231][21194] Updated weights for policy 1, policy_version 16410 (0.0007) +[2023-10-08 16:22:14,334][21195] Updated weights for policy 0, policy_version 16520 (0.0007) +[2023-10-08 16:22:14,707][21195] Updated weights for policy 0, policy_version 16530 (0.0007) +[2023-10-08 16:22:15,080][21195] Updated weights for policy 0, policy_version 16540 (0.0007) +[2023-10-08 16:22:18,158][21194] Updated weights for policy 1, policy_version 16420 (0.0008) +[2023-10-08 16:22:18,526][21194] Updated weights for policy 1, policy_version 16430 (0.0009) +[2023-10-08 16:22:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 33751040. Throughput: 0: 1745.8, 1: 1719.9. Samples: 8452082. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:18,803][19739] Avg episode reward: [(0, '263.930'), (1, '633.670')] +[2023-10-08 16:22:18,889][21194] Updated weights for policy 1, policy_version 16440 (0.0009) +[2023-10-08 16:22:18,993][21195] Updated weights for policy 0, policy_version 16550 (0.0009) +[2023-10-08 16:22:19,370][21195] Updated weights for policy 0, policy_version 16560 (0.0007) +[2023-10-08 16:22:19,749][21195] Updated weights for policy 0, policy_version 16570 (0.0008) +[2023-10-08 16:22:22,924][21194] Updated weights for policy 1, policy_version 16450 (0.0008) +[2023-10-08 16:22:23,290][21194] Updated weights for policy 1, policy_version 16460 (0.0011) +[2023-10-08 16:22:23,657][21194] Updated weights for policy 1, policy_version 16470 (0.0010) +[2023-10-08 16:22:23,766][21195] Updated weights for policy 0, policy_version 16580 (0.0010) +[2023-10-08 16:22:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 33816576. Throughput: 0: 1727.9, 1: 1727.6. Samples: 8467216. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:23,803][19739] Avg episode reward: [(0, '249.820'), (1, '633.670')] +[2023-10-08 16:22:24,025][21194] Updated weights for policy 1, policy_version 16480 (0.0008) +[2023-10-08 16:22:24,137][21195] Updated weights for policy 0, policy_version 16590 (0.0009) +[2023-10-08 16:22:24,507][21195] Updated weights for policy 0, policy_version 16600 (0.0009) +[2023-10-08 16:22:27,949][21194] Updated weights for policy 1, policy_version 16490 (0.0008) +[2023-10-08 16:22:28,314][21194] Updated weights for policy 1, policy_version 16500 (0.0007) +[2023-10-08 16:22:28,556][21195] Updated weights for policy 0, policy_version 16610 (0.0009) +[2023-10-08 16:22:28,679][21194] Updated weights for policy 1, policy_version 16510 (0.0007) +[2023-10-08 16:22:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 33914880. Throughput: 0: 1745.6, 1: 1711.1. Samples: 8488082. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:28,803][19739] Avg episode reward: [(0, '249.820'), (1, '640.120')] +[2023-10-08 16:22:28,926][21195] Updated weights for policy 0, policy_version 16620 (0.0008) +[2023-10-08 16:22:29,306][21195] Updated weights for policy 0, policy_version 16630 (0.0007) +[2023-10-08 16:22:29,679][21195] Updated weights for policy 0, policy_version 16640 (0.0009) +[2023-10-08 16:22:32,536][21194] Updated weights for policy 1, policy_version 16520 (0.0008) +[2023-10-08 16:22:32,901][21194] Updated weights for policy 1, policy_version 16530 (0.0007) +[2023-10-08 16:22:33,262][21194] Updated weights for policy 1, policy_version 16540 (0.0009) +[2023-10-08 16:22:33,535][21195] Updated weights for policy 0, policy_version 16650 (0.0008) +[2023-10-08 16:22:33,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 33980416. Throughput: 0: 1729.1, 1: 1721.4. Samples: 8503222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:33,804][19739] Avg episode reward: [(0, '249.820'), (1, '640.120')] +[2023-10-08 16:22:33,897][21195] Updated weights for policy 0, policy_version 16660 (0.0009) +[2023-10-08 16:22:34,271][21195] Updated weights for policy 0, policy_version 16670 (0.0008) +[2023-10-08 16:22:37,266][21194] Updated weights for policy 1, policy_version 16550 (0.0007) +[2023-10-08 16:22:37,638][21194] Updated weights for policy 1, policy_version 16560 (0.0008) +[2023-10-08 16:22:38,001][21194] Updated weights for policy 1, policy_version 16570 (0.0009) +[2023-10-08 16:22:38,357][21195] Updated weights for policy 0, policy_version 16680 (0.0010) +[2023-10-08 16:22:38,728][21195] Updated weights for policy 0, policy_version 16690 (0.0009) +[2023-10-08 16:22:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 34045952. Throughput: 0: 1737.3, 1: 1723.6. Samples: 8519296. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:22:38,803][19739] Avg episode reward: [(0, '257.840'), (1, '640.120')] +[2023-10-08 16:22:39,103][21195] Updated weights for policy 0, policy_version 16700 (0.0010) +[2023-10-08 16:22:42,059][21194] Updated weights for policy 1, policy_version 16580 (0.0009) +[2023-10-08 16:22:42,422][21194] Updated weights for policy 1, policy_version 16590 (0.0007) +[2023-10-08 16:22:42,793][21194] Updated weights for policy 1, policy_version 16600 (0.0008) +[2023-10-08 16:22:43,067][21195] Updated weights for policy 0, policy_version 16710 (0.0008) +[2023-10-08 16:22:43,436][21195] Updated weights for policy 0, policy_version 16720 (0.0008) +[2023-10-08 16:22:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 34111488. Throughput: 0: 1735.0, 1: 1700.8. Samples: 8539332. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 16:22:43,803][19739] Avg episode reward: [(0, '267.370'), (1, '646.900')] +[2023-10-08 16:22:43,810][21195] Updated weights for policy 0, policy_version 16730 (0.0008) +[2023-10-08 16:22:43,811][20836] Saving new best policy, reward=646.900! +[2023-10-08 16:22:46,876][21194] Updated weights for policy 1, policy_version 16610 (0.0008) +[2023-10-08 16:22:47,248][21194] Updated weights for policy 1, policy_version 16620 (0.0008) +[2023-10-08 16:22:47,605][21194] Updated weights for policy 1, policy_version 16630 (0.0008) +[2023-10-08 16:22:47,754][21195] Updated weights for policy 0, policy_version 16740 (0.0008) +[2023-10-08 16:22:47,972][21194] Updated weights for policy 1, policy_version 16640 (0.0008) +[2023-10-08 16:22:48,147][21195] Updated weights for policy 0, policy_version 16750 (0.0008) +[2023-10-08 16:22:48,525][21195] Updated weights for policy 0, policy_version 16760 (0.0007) +[2023-10-08 16:22:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 34177024. Throughput: 0: 1704.4, 1: 1722.9. Samples: 8554304. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 16:22:48,803][19739] Avg episode reward: [(0, '267.370'), (1, '646.900')] +[2023-10-08 16:22:51,964][21194] Updated weights for policy 1, policy_version 16650 (0.0010) +[2023-10-08 16:22:52,333][21194] Updated weights for policy 1, policy_version 16660 (0.0009) +[2023-10-08 16:22:52,402][21195] Updated weights for policy 0, policy_version 16770 (0.0008) +[2023-10-08 16:22:52,699][21194] Updated weights for policy 1, policy_version 16670 (0.0008) +[2023-10-08 16:22:52,770][21195] Updated weights for policy 0, policy_version 16780 (0.0007) +[2023-10-08 16:22:53,146][21195] Updated weights for policy 0, policy_version 16790 (0.0007) +[2023-10-08 16:22:53,521][21195] Updated weights for policy 0, policy_version 16800 (0.0007) +[2023-10-08 16:22:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 34275328. Throughput: 0: 1731.8, 1: 1711.1. Samples: 8570324. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:22:53,803][19739] Avg episode reward: [(0, '274.320'), (1, '646.900')] +[2023-10-08 16:22:56,326][21194] Updated weights for policy 1, policy_version 16680 (0.0009) +[2023-10-08 16:22:56,703][21194] Updated weights for policy 1, policy_version 16690 (0.0009) +[2023-10-08 16:22:57,067][21194] Updated weights for policy 1, policy_version 16700 (0.0007) +[2023-10-08 16:22:57,456][21195] Updated weights for policy 0, policy_version 16810 (0.0008) +[2023-10-08 16:22:57,825][21195] Updated weights for policy 0, policy_version 16820 (0.0010) +[2023-10-08 16:22:58,190][21195] Updated weights for policy 0, policy_version 16830 (0.0011) +[2023-10-08 16:22:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 34340864. Throughput: 0: 1711.2, 1: 1696.4. Samples: 8590078. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:22:58,803][19739] Avg episode reward: [(0, '270.100'), (1, '646.900')] +[2023-10-08 16:23:01,184][21194] Updated weights for policy 1, policy_version 16710 (0.0009) +[2023-10-08 16:23:01,547][21194] Updated weights for policy 1, policy_version 16720 (0.0009) +[2023-10-08 16:23:01,915][21194] Updated weights for policy 1, policy_version 16730 (0.0008) +[2023-10-08 16:23:02,188][21195] Updated weights for policy 0, policy_version 16840 (0.0009) +[2023-10-08 16:23:02,553][21195] Updated weights for policy 0, policy_version 16850 (0.0007) +[2023-10-08 16:23:02,927][21195] Updated weights for policy 0, policy_version 16860 (0.0008) +[2023-10-08 16:23:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 34406400. Throughput: 0: 1705.2, 1: 1722.9. Samples: 8606344. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:23:03,803][19739] Avg episode reward: [(0, '284.930'), (1, '646.900')] +[2023-10-08 16:23:03,804][20740] Saving new best policy, reward=284.930! +[2023-10-08 16:23:05,935][21194] Updated weights for policy 1, policy_version 16740 (0.0007) +[2023-10-08 16:23:06,308][21194] Updated weights for policy 1, policy_version 16750 (0.0007) +[2023-10-08 16:23:06,679][21194] Updated weights for policy 1, policy_version 16760 (0.0007) +[2023-10-08 16:23:06,712][21195] Updated weights for policy 0, policy_version 16870 (0.0008) +[2023-10-08 16:23:07,074][21195] Updated weights for policy 0, policy_version 16880 (0.0009) +[2023-10-08 16:23:07,441][21195] Updated weights for policy 0, policy_version 16890 (0.0008) +[2023-10-08 16:23:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 34471936. Throughput: 0: 1732.9, 1: 1697.6. Samples: 8621592. Policy #0 lag: (min: 31.0, avg: 40.4, max: 63.0) +[2023-10-08 16:23:08,803][19739] Avg episode reward: [(0, '266.080'), (1, '646.900')] +[2023-10-08 16:23:10,511][21194] Updated weights for policy 1, policy_version 16770 (0.0008) +[2023-10-08 16:23:10,884][21194] Updated weights for policy 1, policy_version 16780 (0.0008) +[2023-10-08 16:23:11,256][21194] Updated weights for policy 1, policy_version 16790 (0.0008) +[2023-10-08 16:23:11,282][21195] Updated weights for policy 0, policy_version 16900 (0.0008) +[2023-10-08 16:23:11,616][21194] Updated weights for policy 1, policy_version 16800 (0.0010) +[2023-10-08 16:23:11,649][21195] Updated weights for policy 0, policy_version 16910 (0.0009) +[2023-10-08 16:23:12,021][21195] Updated weights for policy 0, policy_version 16920 (0.0008) +[2023-10-08 16:23:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 34537472. Throughput: 0: 1711.0, 1: 1713.6. Samples: 8642188. Policy #0 lag: (min: 31.0, avg: 40.4, max: 63.0) +[2023-10-08 16:23:13,803][19739] Avg episode reward: [(0, '275.930'), (1, '646.900')] +[2023-10-08 16:23:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000016800_17203200.pth... +[2023-10-08 16:23:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000016928_17334272.pth... +[2023-10-08 16:23:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000015200_15564800.pth +[2023-10-08 16:23:13,854][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000015296_15663104.pth +[2023-10-08 16:23:15,529][21194] Updated weights for policy 1, policy_version 16810 (0.0010) +[2023-10-08 16:23:15,895][21194] Updated weights for policy 1, policy_version 16820 (0.0011) +[2023-10-08 16:23:16,126][21195] Updated weights for policy 0, policy_version 16930 (0.0008) +[2023-10-08 16:23:16,262][21194] Updated weights for policy 1, policy_version 16830 (0.0008) +[2023-10-08 16:23:16,501][21195] Updated weights for policy 0, policy_version 16940 (0.0009) +[2023-10-08 16:23:16,862][21195] Updated weights for policy 0, policy_version 16950 (0.0011) +[2023-10-08 16:23:17,229][21195] Updated weights for policy 0, policy_version 16960 (0.0009) +[2023-10-08 16:23:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 34603008. Throughput: 0: 1722.4, 1: 1711.8. Samples: 8657762. Policy #0 lag: (min: 31.0, avg: 40.4, max: 63.0) +[2023-10-08 16:23:18,803][19739] Avg episode reward: [(0, '273.340'), (1, '646.900')] +[2023-10-08 16:23:20,254][21194] Updated weights for policy 1, policy_version 16840 (0.0009) +[2023-10-08 16:23:20,621][21194] Updated weights for policy 1, policy_version 16850 (0.0010) +[2023-10-08 16:23:20,992][21194] Updated weights for policy 1, policy_version 16860 (0.0009) +[2023-10-08 16:23:21,217][21195] Updated weights for policy 0, policy_version 16970 (0.0008) +[2023-10-08 16:23:21,583][21195] Updated weights for policy 0, policy_version 16980 (0.0009) +[2023-10-08 16:23:21,959][21195] Updated weights for policy 0, policy_version 16990 (0.0009) +[2023-10-08 16:23:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 34668544. Throughput: 0: 1717.0, 1: 1699.8. Samples: 8673054. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:23:23,803][19739] Avg episode reward: [(0, '273.590'), (1, '646.900')] +[2023-10-08 16:23:25,037][21194] Updated weights for policy 1, policy_version 16870 (0.0008) +[2023-10-08 16:23:25,404][21194] Updated weights for policy 1, policy_version 16880 (0.0009) +[2023-10-08 16:23:25,776][21194] Updated weights for policy 1, policy_version 16890 (0.0008) +[2023-10-08 16:23:25,928][21195] Updated weights for policy 0, policy_version 17000 (0.0008) +[2023-10-08 16:23:26,292][21195] Updated weights for policy 0, policy_version 17010 (0.0009) +[2023-10-08 16:23:26,659][21195] Updated weights for policy 0, policy_version 17020 (0.0008) +[2023-10-08 16:23:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 34734080. Throughput: 0: 1715.3, 1: 1724.6. Samples: 8694128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:23:28,803][19739] Avg episode reward: [(0, '263.030'), (1, '647.720')] +[2023-10-08 16:23:28,811][20836] Saving new best policy, reward=647.720! +[2023-10-08 16:23:29,639][21194] Updated weights for policy 1, policy_version 16900 (0.0008) +[2023-10-08 16:23:30,001][21194] Updated weights for policy 1, policy_version 16910 (0.0007) +[2023-10-08 16:23:30,373][21194] Updated weights for policy 1, policy_version 16920 (0.0009) +[2023-10-08 16:23:30,573][21195] Updated weights for policy 0, policy_version 17030 (0.0007) +[2023-10-08 16:23:30,937][21195] Updated weights for policy 0, policy_version 17040 (0.0010) +[2023-10-08 16:23:31,303][21195] Updated weights for policy 0, policy_version 17050 (0.0008) +[2023-10-08 16:23:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 34799616. Throughput: 0: 1749.4, 1: 1699.0. Samples: 8709482. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:23:33,803][19739] Avg episode reward: [(0, '254.510'), (1, '661.610')] +[2023-10-08 16:23:33,804][20836] Saving new best policy, reward=661.610! +[2023-10-08 16:23:34,325][21194] Updated weights for policy 1, policy_version 16930 (0.0008) +[2023-10-08 16:23:34,690][21194] Updated weights for policy 1, policy_version 16940 (0.0010) +[2023-10-08 16:23:35,058][21194] Updated weights for policy 1, policy_version 16950 (0.0008) +[2023-10-08 16:23:35,217][21195] Updated weights for policy 0, policy_version 17060 (0.0009) +[2023-10-08 16:23:35,425][21194] Updated weights for policy 1, policy_version 16960 (0.0008) +[2023-10-08 16:23:35,603][21195] Updated weights for policy 0, policy_version 17070 (0.0007) +[2023-10-08 16:23:35,967][21195] Updated weights for policy 0, policy_version 17080 (0.0009) +[2023-10-08 16:23:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 34865152. Throughput: 0: 1721.6, 1: 1715.7. Samples: 8725002. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:23:38,803][19739] Avg episode reward: [(0, '254.510'), (1, '661.610')] +[2023-10-08 16:23:39,336][21194] Updated weights for policy 1, policy_version 16970 (0.0011) +[2023-10-08 16:23:39,699][21194] Updated weights for policy 1, policy_version 16980 (0.0010) +[2023-10-08 16:23:39,738][21195] Updated weights for policy 0, policy_version 17090 (0.0009) +[2023-10-08 16:23:40,065][21194] Updated weights for policy 1, policy_version 16990 (0.0007) +[2023-10-08 16:23:40,096][21195] Updated weights for policy 0, policy_version 17100 (0.0008) +[2023-10-08 16:23:40,472][21195] Updated weights for policy 0, policy_version 17110 (0.0009) +[2023-10-08 16:23:40,840][21195] Updated weights for policy 0, policy_version 17120 (0.0008) +[2023-10-08 16:23:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 34930688. Throughput: 0: 1747.9, 1: 1733.7. Samples: 8746752. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:23:43,804][19739] Avg episode reward: [(0, '254.510'), (1, '661.610')] +[2023-10-08 16:23:44,209][21194] Updated weights for policy 1, policy_version 17000 (0.0008) +[2023-10-08 16:23:44,511][21195] Updated weights for policy 0, policy_version 17130 (0.0008) +[2023-10-08 16:23:44,587][21194] Updated weights for policy 1, policy_version 17010 (0.0007) +[2023-10-08 16:23:44,880][21195] Updated weights for policy 0, policy_version 17140 (0.0009) +[2023-10-08 16:23:44,952][21194] Updated weights for policy 1, policy_version 17020 (0.0007) +[2023-10-08 16:23:45,252][21195] Updated weights for policy 0, policy_version 17150 (0.0009) +[2023-10-08 16:23:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 34996224. Throughput: 0: 1753.1, 1: 1705.0. Samples: 8761960. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:23:48,803][19739] Avg episode reward: [(0, '261.710'), (1, '661.850')] +[2023-10-08 16:23:48,822][21194] Updated weights for policy 1, policy_version 17030 (0.0008) +[2023-10-08 16:23:49,146][21195] Updated weights for policy 0, policy_version 17160 (0.0008) +[2023-10-08 16:23:49,184][21194] Updated weights for policy 1, policy_version 17040 (0.0010) +[2023-10-08 16:23:49,516][21195] Updated weights for policy 0, policy_version 17170 (0.0007) +[2023-10-08 16:23:49,544][21194] Updated weights for policy 1, policy_version 17050 (0.0007) +[2023-10-08 16:23:49,760][20836] Saving new best policy, reward=661.850! +[2023-10-08 16:23:49,892][21195] Updated weights for policy 0, policy_version 17180 (0.0008) +[2023-10-08 16:23:53,587][21194] Updated weights for policy 1, policy_version 17060 (0.0009) +[2023-10-08 16:23:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 35061760. Throughput: 0: 1726.0, 1: 1732.8. Samples: 8777240. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 16:23:53,803][19739] Avg episode reward: [(0, '248.720'), (1, '648.190')] +[2023-10-08 16:23:53,899][21195] Updated weights for policy 0, policy_version 17190 (0.0009) +[2023-10-08 16:23:53,950][21194] Updated weights for policy 1, policy_version 17070 (0.0007) +[2023-10-08 16:23:54,269][21195] Updated weights for policy 0, policy_version 17200 (0.0008) +[2023-10-08 16:23:54,319][21194] Updated weights for policy 1, policy_version 17080 (0.0008) +[2023-10-08 16:23:54,635][21195] Updated weights for policy 0, policy_version 17210 (0.0008) +[2023-10-08 16:23:58,308][21194] Updated weights for policy 1, policy_version 17090 (0.0009) +[2023-10-08 16:23:58,584][21195] Updated weights for policy 0, policy_version 17220 (0.0008) +[2023-10-08 16:23:58,663][21194] Updated weights for policy 1, policy_version 17100 (0.0008) +[2023-10-08 16:23:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 35127296. Throughput: 0: 1744.9, 1: 1730.7. Samples: 8798590. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 16:23:58,803][19739] Avg episode reward: [(0, '248.320'), (1, '636.020')] +[2023-10-08 16:23:58,952][21195] Updated weights for policy 0, policy_version 17230 (0.0008) +[2023-10-08 16:23:59,022][21194] Updated weights for policy 1, policy_version 17110 (0.0008) +[2023-10-08 16:23:59,324][21195] Updated weights for policy 0, policy_version 17240 (0.0007) +[2023-10-08 16:23:59,387][21194] Updated weights for policy 1, policy_version 17120 (0.0008) +[2023-10-08 16:24:03,287][21195] Updated weights for policy 0, policy_version 17250 (0.0008) +[2023-10-08 16:24:03,327][21194] Updated weights for policy 1, policy_version 17130 (0.0007) +[2023-10-08 16:24:03,653][21195] Updated weights for policy 0, policy_version 17260 (0.0009) +[2023-10-08 16:24:03,691][21194] Updated weights for policy 1, policy_version 17140 (0.0008) +[2023-10-08 16:24:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 35192832. Throughput: 0: 1734.8, 1: 1722.6. Samples: 8813342. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 16:24:03,803][19739] Avg episode reward: [(0, '260.230'), (1, '636.020')] +[2023-10-08 16:24:04,024][21195] Updated weights for policy 0, policy_version 17270 (0.0008) +[2023-10-08 16:24:04,058][21194] Updated weights for policy 1, policy_version 17150 (0.0009) +[2023-10-08 16:24:04,402][21195] Updated weights for policy 0, policy_version 17280 (0.0008) +[2023-10-08 16:24:07,736][21194] Updated weights for policy 1, policy_version 17160 (0.0009) +[2023-10-08 16:24:08,111][21194] Updated weights for policy 1, policy_version 17170 (0.0010) +[2023-10-08 16:24:08,340][21195] Updated weights for policy 0, policy_version 17290 (0.0007) +[2023-10-08 16:24:08,478][21194] Updated weights for policy 1, policy_version 17180 (0.0008) +[2023-10-08 16:24:08,708][21195] Updated weights for policy 0, policy_version 17300 (0.0007) +[2023-10-08 16:24:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 35291136. Throughput: 0: 1739.9, 1: 1737.1. Samples: 8829516. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:24:08,803][19739] Avg episode reward: [(0, '260.230'), (1, '636.020')] +[2023-10-08 16:24:09,075][21195] Updated weights for policy 0, policy_version 17310 (0.0009) +[2023-10-08 16:24:12,521][21194] Updated weights for policy 1, policy_version 17190 (0.0008) +[2023-10-08 16:24:12,895][21194] Updated weights for policy 1, policy_version 17200 (0.0007) +[2023-10-08 16:24:12,898][21195] Updated weights for policy 0, policy_version 17320 (0.0008) +[2023-10-08 16:24:13,264][21194] Updated weights for policy 1, policy_version 17210 (0.0008) +[2023-10-08 16:24:13,265][21195] Updated weights for policy 0, policy_version 17330 (0.0008) +[2023-10-08 16:24:13,633][21195] Updated weights for policy 0, policy_version 17340 (0.0009) +[2023-10-08 16:24:13,803][19739] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 35389440. Throughput: 0: 1744.4, 1: 1718.8. Samples: 8849972. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:24:13,803][19739] Avg episode reward: [(0, '265.900'), (1, '651.360')] +[2023-10-08 16:24:17,253][21194] Updated weights for policy 1, policy_version 17220 (0.0007) +[2023-10-08 16:24:17,581][21195] Updated weights for policy 0, policy_version 17350 (0.0010) +[2023-10-08 16:24:17,624][21194] Updated weights for policy 1, policy_version 17230 (0.0008) +[2023-10-08 16:24:17,958][21195] Updated weights for policy 0, policy_version 17360 (0.0008) +[2023-10-08 16:24:17,988][21194] Updated weights for policy 1, policy_version 17240 (0.0008) +[2023-10-08 16:24:18,328][21195] Updated weights for policy 0, policy_version 17370 (0.0007) +[2023-10-08 16:24:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 35454976. Throughput: 0: 1714.7, 1: 1740.4. Samples: 8864958. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:24:18,803][19739] Avg episode reward: [(0, '266.260'), (1, '666.310')] +[2023-10-08 16:24:18,804][20836] Saving new best policy, reward=666.310! +[2023-10-08 16:24:21,911][21194] Updated weights for policy 1, policy_version 17250 (0.0009) +[2023-10-08 16:24:22,176][21195] Updated weights for policy 0, policy_version 17380 (0.0008) +[2023-10-08 16:24:22,280][21194] Updated weights for policy 1, policy_version 17260 (0.0007) +[2023-10-08 16:24:22,566][21195] Updated weights for policy 0, policy_version 17390 (0.0007) +[2023-10-08 16:24:22,641][21194] Updated weights for policy 1, policy_version 17270 (0.0007) +[2023-10-08 16:24:22,933][21195] Updated weights for policy 0, policy_version 17400 (0.0007) +[2023-10-08 16:24:23,009][21194] Updated weights for policy 1, policy_version 17280 (0.0010) +[2023-10-08 16:24:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 35520512. Throughput: 0: 1749.8, 1: 1732.7. Samples: 8881712. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:24:23,803][19739] Avg episode reward: [(0, '279.870'), (1, '704.050')] +[2023-10-08 16:24:23,804][20836] Saving new best policy, reward=704.050! +[2023-10-08 16:24:26,903][21195] Updated weights for policy 0, policy_version 17410 (0.0008) +[2023-10-08 16:24:26,994][21194] Updated weights for policy 1, policy_version 17290 (0.0009) +[2023-10-08 16:24:27,279][21195] Updated weights for policy 0, policy_version 17420 (0.0008) +[2023-10-08 16:24:27,354][21194] Updated weights for policy 1, policy_version 17300 (0.0007) +[2023-10-08 16:24:27,639][21195] Updated weights for policy 0, policy_version 17430 (0.0008) +[2023-10-08 16:24:27,715][21194] Updated weights for policy 1, policy_version 17310 (0.0007) +[2023-10-08 16:24:28,009][21195] Updated weights for policy 0, policy_version 17440 (0.0008) +[2023-10-08 16:24:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 35586048. Throughput: 0: 1714.6, 1: 1704.7. Samples: 8900618. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:24:28,803][19739] Avg episode reward: [(0, '290.450'), (1, '690.890')] +[2023-10-08 16:24:28,810][20740] Saving new best policy, reward=290.450! +[2023-10-08 16:24:31,953][21194] Updated weights for policy 1, policy_version 17320 (0.0009) +[2023-10-08 16:24:32,084][21195] Updated weights for policy 0, policy_version 17450 (0.0008) +[2023-10-08 16:24:32,329][21194] Updated weights for policy 1, policy_version 17330 (0.0008) +[2023-10-08 16:24:32,459][21195] Updated weights for policy 0, policy_version 17460 (0.0008) +[2023-10-08 16:24:32,683][21194] Updated weights for policy 1, policy_version 17340 (0.0008) +[2023-10-08 16:24:32,825][21195] Updated weights for policy 0, policy_version 17470 (0.0008) +[2023-10-08 16:24:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 35651584. Throughput: 0: 1704.2, 1: 1732.5. Samples: 8916610. Policy #0 lag: (min: 3.0, avg: 11.4, max: 35.0) +[2023-10-08 16:24:33,803][19739] Avg episode reward: [(0, '290.450'), (1, '690.890')] +[2023-10-08 16:24:36,514][21194] Updated weights for policy 1, policy_version 17350 (0.0008) +[2023-10-08 16:24:36,736][21195] Updated weights for policy 0, policy_version 17480 (0.0009) +[2023-10-08 16:24:36,885][21194] Updated weights for policy 1, policy_version 17360 (0.0008) +[2023-10-08 16:24:37,113][21195] Updated weights for policy 0, policy_version 17490 (0.0008) +[2023-10-08 16:24:37,248][21194] Updated weights for policy 1, policy_version 17370 (0.0007) +[2023-10-08 16:24:37,489][21195] Updated weights for policy 0, policy_version 17500 (0.0008) +[2023-10-08 16:24:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 35717120. Throughput: 0: 1729.5, 1: 1715.5. Samples: 8932264. Policy #0 lag: (min: 3.0, avg: 11.4, max: 35.0) +[2023-10-08 16:24:38,803][19739] Avg episode reward: [(0, '290.450'), (1, '676.340')] +[2023-10-08 16:24:41,120][21194] Updated weights for policy 1, policy_version 17380 (0.0008) +[2023-10-08 16:24:41,348][21195] Updated weights for policy 0, policy_version 17510 (0.0009) +[2023-10-08 16:24:41,477][21194] Updated weights for policy 1, policy_version 17390 (0.0008) +[2023-10-08 16:24:41,723][21195] Updated weights for policy 0, policy_version 17520 (0.0008) +[2023-10-08 16:24:41,850][21194] Updated weights for policy 1, policy_version 17400 (0.0008) +[2023-10-08 16:24:42,085][21195] Updated weights for policy 0, policy_version 17530 (0.0007) +[2023-10-08 16:24:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 35782656. Throughput: 0: 1708.9, 1: 1707.1. Samples: 8952312. Policy #0 lag: (min: 3.0, avg: 11.4, max: 35.0) +[2023-10-08 16:24:43,804][19739] Avg episode reward: [(0, '290.450'), (1, '676.340')] +[2023-10-08 16:24:45,852][21194] Updated weights for policy 1, policy_version 17410 (0.0008) +[2023-10-08 16:24:46,153][21195] Updated weights for policy 0, policy_version 17540 (0.0007) +[2023-10-08 16:24:46,221][21194] Updated weights for policy 1, policy_version 17420 (0.0007) +[2023-10-08 16:24:46,512][21195] Updated weights for policy 0, policy_version 17550 (0.0010) +[2023-10-08 16:24:46,603][21194] Updated weights for policy 1, policy_version 17430 (0.0009) +[2023-10-08 16:24:46,882][21195] Updated weights for policy 0, policy_version 17560 (0.0009) +[2023-10-08 16:24:46,960][21194] Updated weights for policy 1, policy_version 17440 (0.0008) +[2023-10-08 16:24:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 35848192. Throughput: 0: 1717.0, 1: 1730.2. Samples: 8968468. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 16:24:48,803][19739] Avg episode reward: [(0, '291.210'), (1, '676.340')] +[2023-10-08 16:24:48,804][20740] Saving new best policy, reward=291.210! +[2023-10-08 16:24:50,932][21194] Updated weights for policy 1, policy_version 17450 (0.0009) +[2023-10-08 16:24:50,977][21195] Updated weights for policy 0, policy_version 17570 (0.0009) +[2023-10-08 16:24:51,289][21194] Updated weights for policy 1, policy_version 17460 (0.0007) +[2023-10-08 16:24:51,351][21195] Updated weights for policy 0, policy_version 17580 (0.0008) +[2023-10-08 16:24:51,650][21194] Updated weights for policy 1, policy_version 17470 (0.0010) +[2023-10-08 16:24:51,714][21195] Updated weights for policy 0, policy_version 17590 (0.0007) +[2023-10-08 16:24:52,090][21195] Updated weights for policy 0, policy_version 17600 (0.0009) +[2023-10-08 16:24:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 35913728. Throughput: 0: 1713.5, 1: 1699.4. Samples: 8983096. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 16:24:53,803][19739] Avg episode reward: [(0, '291.210'), (1, '686.990')] +[2023-10-08 16:24:55,729][21194] Updated weights for policy 1, policy_version 17480 (0.0007) +[2023-10-08 16:24:56,091][21194] Updated weights for policy 1, policy_version 17490 (0.0007) +[2023-10-08 16:24:56,116][21195] Updated weights for policy 0, policy_version 17610 (0.0008) +[2023-10-08 16:24:56,449][21194] Updated weights for policy 1, policy_version 17500 (0.0009) +[2023-10-08 16:24:56,484][21195] Updated weights for policy 0, policy_version 17620 (0.0007) +[2023-10-08 16:24:56,857][21195] Updated weights for policy 0, policy_version 17630 (0.0009) +[2023-10-08 16:24:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 35979264. Throughput: 0: 1707.3, 1: 1717.8. Samples: 9004102. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 16:24:58,803][19739] Avg episode reward: [(0, '291.210'), (1, '688.670')] +[2023-10-08 16:25:00,411][21194] Updated weights for policy 1, policy_version 17510 (0.0008) +[2023-10-08 16:25:00,650][21195] Updated weights for policy 0, policy_version 17640 (0.0008) +[2023-10-08 16:25:00,775][21194] Updated weights for policy 1, policy_version 17520 (0.0008) +[2023-10-08 16:25:01,019][21195] Updated weights for policy 0, policy_version 17650 (0.0009) +[2023-10-08 16:25:01,141][21194] Updated weights for policy 1, policy_version 17530 (0.0009) +[2023-10-08 16:25:01,381][21195] Updated weights for policy 0, policy_version 17660 (0.0008) +[2023-10-08 16:25:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 36044800. Throughput: 0: 1733.2, 1: 1708.1. Samples: 9019814. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 16:25:03,803][19739] Avg episode reward: [(0, '299.690'), (1, '688.670')] +[2023-10-08 16:25:03,804][20740] Saving new best policy, reward=299.690! +[2023-10-08 16:25:05,017][21194] Updated weights for policy 1, policy_version 17540 (0.0007) +[2023-10-08 16:25:05,387][21194] Updated weights for policy 1, policy_version 17550 (0.0008) +[2023-10-08 16:25:05,524][21195] Updated weights for policy 0, policy_version 17670 (0.0009) +[2023-10-08 16:25:05,751][21194] Updated weights for policy 1, policy_version 17560 (0.0008) +[2023-10-08 16:25:05,890][21195] Updated weights for policy 0, policy_version 17680 (0.0008) +[2023-10-08 16:25:06,269][21195] Updated weights for policy 0, policy_version 17690 (0.0008) +[2023-10-08 16:25:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 36110336. Throughput: 0: 1696.5, 1: 1705.9. Samples: 9034822. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 16:25:08,803][19739] Avg episode reward: [(0, '299.690'), (1, '688.670')] +[2023-10-08 16:25:09,595][21194] Updated weights for policy 1, policy_version 17570 (0.0007) +[2023-10-08 16:25:09,973][21194] Updated weights for policy 1, policy_version 17580 (0.0008) +[2023-10-08 16:25:10,164][21195] Updated weights for policy 0, policy_version 17700 (0.0007) +[2023-10-08 16:25:10,330][21194] Updated weights for policy 1, policy_version 17590 (0.0008) +[2023-10-08 16:25:10,537][21195] Updated weights for policy 0, policy_version 17710 (0.0008) +[2023-10-08 16:25:10,699][21194] Updated weights for policy 1, policy_version 17600 (0.0010) +[2023-10-08 16:25:10,916][21195] Updated weights for policy 0, policy_version 17720 (0.0008) +[2023-10-08 16:25:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 36175872. Throughput: 0: 1722.4, 1: 1740.1. Samples: 9056432. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 16:25:13,804][19739] Avg episode reward: [(0, '299.690'), (1, '682.290')] +[2023-10-08 16:25:13,818][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000017728_18153472.pth... +[2023-10-08 16:25:13,819][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000017600_18022400.pth... +[2023-10-08 16:25:13,853][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000016000_16384000.pth +[2023-10-08 16:25:13,858][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000016128_16515072.pth +[2023-10-08 16:25:14,477][21194] Updated weights for policy 1, policy_version 17610 (0.0008) +[2023-10-08 16:25:14,837][21194] Updated weights for policy 1, policy_version 17620 (0.0007) +[2023-10-08 16:25:14,855][21195] Updated weights for policy 0, policy_version 17730 (0.0010) +[2023-10-08 16:25:15,205][21194] Updated weights for policy 1, policy_version 17630 (0.0007) +[2023-10-08 16:25:15,228][21195] Updated weights for policy 0, policy_version 17740 (0.0008) +[2023-10-08 16:25:15,605][21195] Updated weights for policy 0, policy_version 17750 (0.0009) +[2023-10-08 16:25:15,972][21195] Updated weights for policy 0, policy_version 17760 (0.0008) +[2023-10-08 16:25:18,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 36241408. Throughput: 0: 1731.7, 1: 1716.6. Samples: 9071782. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 16:25:18,803][19739] Avg episode reward: [(0, '299.690'), (1, '682.290')] +[2023-10-08 16:25:19,080][21194] Updated weights for policy 1, policy_version 17640 (0.0010) +[2023-10-08 16:25:19,444][21194] Updated weights for policy 1, policy_version 17650 (0.0009) +[2023-10-08 16:25:19,810][21194] Updated weights for policy 1, policy_version 17660 (0.0008) +[2023-10-08 16:25:19,945][21195] Updated weights for policy 0, policy_version 17770 (0.0007) +[2023-10-08 16:25:20,326][21195] Updated weights for policy 0, policy_version 17780 (0.0007) +[2023-10-08 16:25:20,697][21195] Updated weights for policy 0, policy_version 17790 (0.0007) +[2023-10-08 16:25:23,628][21194] Updated weights for policy 1, policy_version 17670 (0.0007) +[2023-10-08 16:25:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 36306944. Throughput: 0: 1707.7, 1: 1738.8. Samples: 9087358. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 16:25:23,803][19739] Avg episode reward: [(0, '306.460'), (1, '696.130')] +[2023-10-08 16:25:23,804][20740] Saving new best policy, reward=306.460! +[2023-10-08 16:25:24,000][21194] Updated weights for policy 1, policy_version 17680 (0.0007) +[2023-10-08 16:25:24,356][21194] Updated weights for policy 1, policy_version 17690 (0.0009) +[2023-10-08 16:25:24,563][21195] Updated weights for policy 0, policy_version 17800 (0.0007) +[2023-10-08 16:25:24,924][21195] Updated weights for policy 0, policy_version 17810 (0.0008) +[2023-10-08 16:25:25,301][21195] Updated weights for policy 0, policy_version 17820 (0.0009) +[2023-10-08 16:25:28,543][21194] Updated weights for policy 1, policy_version 17700 (0.0008) +[2023-10-08 16:25:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 36372480. Throughput: 0: 1734.5, 1: 1744.2. Samples: 9108854. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 16:25:28,803][19739] Avg episode reward: [(0, '301.320'), (1, '696.130')] +[2023-10-08 16:25:28,907][21194] Updated weights for policy 1, policy_version 17710 (0.0009) +[2023-10-08 16:25:29,156][21195] Updated weights for policy 0, policy_version 17830 (0.0008) +[2023-10-08 16:25:29,278][21194] Updated weights for policy 1, policy_version 17720 (0.0007) +[2023-10-08 16:25:29,524][21195] Updated weights for policy 0, policy_version 17840 (0.0007) +[2023-10-08 16:25:29,896][21195] Updated weights for policy 0, policy_version 17850 (0.0009) +[2023-10-08 16:25:33,203][21194] Updated weights for policy 1, policy_version 17730 (0.0008) +[2023-10-08 16:25:33,569][21194] Updated weights for policy 1, policy_version 17740 (0.0008) +[2023-10-08 16:25:33,687][21195] Updated weights for policy 0, policy_version 17860 (0.0008) +[2023-10-08 16:25:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 36438016. Throughput: 0: 1737.5, 1: 1719.0. Samples: 9124010. Policy #0 lag: (min: 1.0, avg: 9.4, max: 33.0) +[2023-10-08 16:25:33,804][19739] Avg episode reward: [(0, '301.320'), (1, '683.760')] +[2023-10-08 16:25:33,938][21194] Updated weights for policy 1, policy_version 17750 (0.0008) +[2023-10-08 16:25:34,046][21195] Updated weights for policy 0, policy_version 17870 (0.0008) +[2023-10-08 16:25:34,304][21194] Updated weights for policy 1, policy_version 17760 (0.0008) +[2023-10-08 16:25:34,417][21195] Updated weights for policy 0, policy_version 17880 (0.0009) +[2023-10-08 16:25:38,142][21194] Updated weights for policy 1, policy_version 17770 (0.0009) +[2023-10-08 16:25:38,429][21195] Updated weights for policy 0, policy_version 17890 (0.0009) +[2023-10-08 16:25:38,499][21194] Updated weights for policy 1, policy_version 17780 (0.0009) +[2023-10-08 16:25:38,800][21195] Updated weights for policy 0, policy_version 17900 (0.0008) +[2023-10-08 16:25:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 36503552. Throughput: 0: 1732.7, 1: 1749.2. Samples: 9139782. Policy #0 lag: (min: 1.0, avg: 9.4, max: 33.0) +[2023-10-08 16:25:38,803][19739] Avg episode reward: [(0, '301.320'), (1, '683.760')] +[2023-10-08 16:25:38,868][21194] Updated weights for policy 1, policy_version 17790 (0.0008) +[2023-10-08 16:25:39,170][21195] Updated weights for policy 0, policy_version 17910 (0.0009) +[2023-10-08 16:25:39,548][21195] Updated weights for policy 0, policy_version 17920 (0.0008) +[2023-10-08 16:25:42,857][21194] Updated weights for policy 1, policy_version 17800 (0.0007) +[2023-10-08 16:25:43,223][21194] Updated weights for policy 1, policy_version 17810 (0.0007) +[2023-10-08 16:25:43,375][21195] Updated weights for policy 0, policy_version 17930 (0.0007) +[2023-10-08 16:25:43,588][21194] Updated weights for policy 1, policy_version 17820 (0.0008) +[2023-10-08 16:25:43,746][21195] Updated weights for policy 0, policy_version 17940 (0.0008) +[2023-10-08 16:25:43,803][19739] Fps is (10 sec: 16384.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 36601856. Throughput: 0: 1739.4, 1: 1738.0. Samples: 9160588. Policy #0 lag: (min: 1.0, avg: 9.4, max: 33.0) +[2023-10-08 16:25:43,803][19739] Avg episode reward: [(0, '315.670'), (1, '697.440')] +[2023-10-08 16:25:44,122][21195] Updated weights for policy 0, policy_version 17950 (0.0009) +[2023-10-08 16:25:44,196][20740] Saving new best policy, reward=315.670! +[2023-10-08 16:25:47,650][21194] Updated weights for policy 1, policy_version 17830 (0.0008) +[2023-10-08 16:25:48,006][21194] Updated weights for policy 1, policy_version 17840 (0.0007) +[2023-10-08 16:25:48,025][21195] Updated weights for policy 0, policy_version 17960 (0.0007) +[2023-10-08 16:25:48,375][21194] Updated weights for policy 1, policy_version 17850 (0.0007) +[2023-10-08 16:25:48,397][21195] Updated weights for policy 0, policy_version 17970 (0.0007) +[2023-10-08 16:25:48,764][21195] Updated weights for policy 0, policy_version 17980 (0.0008) +[2023-10-08 16:25:48,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 36667392. Throughput: 0: 1717.8, 1: 1738.9. Samples: 9175364. Policy #0 lag: (min: 19.0, avg: 26.4, max: 51.0) +[2023-10-08 16:25:48,803][19739] Avg episode reward: [(0, '315.670'), (1, '697.440')] +[2023-10-08 16:25:52,410][21194] Updated weights for policy 1, policy_version 17860 (0.0007) +[2023-10-08 16:25:52,605][21195] Updated weights for policy 0, policy_version 17990 (0.0007) +[2023-10-08 16:25:52,768][21194] Updated weights for policy 1, policy_version 17870 (0.0007) +[2023-10-08 16:25:52,977][21195] Updated weights for policy 0, policy_version 18000 (0.0008) +[2023-10-08 16:25:53,136][21194] Updated weights for policy 1, policy_version 17880 (0.0007) +[2023-10-08 16:25:53,348][21195] Updated weights for policy 0, policy_version 18010 (0.0007) +[2023-10-08 16:25:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 36765696. Throughput: 0: 1747.8, 1: 1744.0. Samples: 9191950. Policy #0 lag: (min: 19.0, avg: 26.4, max: 51.0) +[2023-10-08 16:25:53,803][19739] Avg episode reward: [(0, '315.670'), (1, '702.340')] +[2023-10-08 16:25:57,020][21194] Updated weights for policy 1, policy_version 17890 (0.0007) +[2023-10-08 16:25:57,393][21194] Updated weights for policy 1, policy_version 17900 (0.0008) +[2023-10-08 16:25:57,481][21195] Updated weights for policy 0, policy_version 18020 (0.0007) +[2023-10-08 16:25:57,756][21194] Updated weights for policy 1, policy_version 17910 (0.0007) +[2023-10-08 16:25:57,872][21195] Updated weights for policy 0, policy_version 18030 (0.0009) +[2023-10-08 16:25:58,123][21194] Updated weights for policy 1, policy_version 17920 (0.0008) +[2023-10-08 16:25:58,235][21195] Updated weights for policy 0, policy_version 18040 (0.0010) +[2023-10-08 16:25:58,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 36831232. Throughput: 0: 1732.0, 1: 1712.0. Samples: 9211410. Policy #0 lag: (min: 9.0, avg: 12.5, max: 41.0) +[2023-10-08 16:25:58,803][19739] Avg episode reward: [(0, '315.670'), (1, '702.340')] +[2023-10-08 16:26:02,043][21194] Updated weights for policy 1, policy_version 17930 (0.0008) +[2023-10-08 16:26:02,206][21195] Updated weights for policy 0, policy_version 18050 (0.0011) +[2023-10-08 16:26:02,419][21194] Updated weights for policy 1, policy_version 17940 (0.0007) +[2023-10-08 16:26:02,577][21195] Updated weights for policy 0, policy_version 18060 (0.0007) +[2023-10-08 16:26:02,789][21194] Updated weights for policy 1, policy_version 17950 (0.0008) +[2023-10-08 16:26:02,949][21195] Updated weights for policy 0, policy_version 18070 (0.0008) +[2023-10-08 16:26:03,324][21195] Updated weights for policy 0, policy_version 18080 (0.0008) +[2023-10-08 16:26:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 36896768. Throughput: 0: 1711.1, 1: 1737.3. Samples: 9226960. Policy #0 lag: (min: 9.0, avg: 12.5, max: 41.0) +[2023-10-08 16:26:03,803][19739] Avg episode reward: [(0, '326.610'), (1, '702.340')] +[2023-10-08 16:26:03,804][20740] Saving new best policy, reward=326.610! +[2023-10-08 16:26:06,839][21194] Updated weights for policy 1, policy_version 17960 (0.0008) +[2023-10-08 16:26:07,193][21195] Updated weights for policy 0, policy_version 18090 (0.0008) +[2023-10-08 16:26:07,211][21194] Updated weights for policy 1, policy_version 17970 (0.0007) +[2023-10-08 16:26:07,554][21195] Updated weights for policy 0, policy_version 18100 (0.0010) +[2023-10-08 16:26:07,576][21194] Updated weights for policy 1, policy_version 17980 (0.0007) +[2023-10-08 16:26:07,930][21195] Updated weights for policy 0, policy_version 18110 (0.0009) +[2023-10-08 16:26:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 36962304. Throughput: 0: 1742.9, 1: 1714.1. Samples: 9242926. Policy #0 lag: (min: 9.0, avg: 12.5, max: 41.0) +[2023-10-08 16:26:08,803][19739] Avg episode reward: [(0, '324.050'), (1, '702.340')] +[2023-10-08 16:26:11,355][21194] Updated weights for policy 1, policy_version 17990 (0.0007) +[2023-10-08 16:26:11,718][21194] Updated weights for policy 1, policy_version 18000 (0.0007) +[2023-10-08 16:26:11,893][21195] Updated weights for policy 0, policy_version 18120 (0.0008) +[2023-10-08 16:26:12,084][21194] Updated weights for policy 1, policy_version 18010 (0.0008) +[2023-10-08 16:26:12,270][21195] Updated weights for policy 0, policy_version 18130 (0.0010) +[2023-10-08 16:26:12,637][21195] Updated weights for policy 0, policy_version 18140 (0.0008) +[2023-10-08 16:26:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 37027840. Throughput: 0: 1709.3, 1: 1697.7. Samples: 9262170. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:26:13,803][19739] Avg episode reward: [(0, '320.770'), (1, '702.340')] +[2023-10-08 16:26:16,087][21194] Updated weights for policy 1, policy_version 18020 (0.0007) +[2023-10-08 16:26:16,454][21194] Updated weights for policy 1, policy_version 18030 (0.0008) +[2023-10-08 16:26:16,610][21195] Updated weights for policy 0, policy_version 18150 (0.0008) +[2023-10-08 16:26:16,827][21194] Updated weights for policy 1, policy_version 18040 (0.0009) +[2023-10-08 16:26:16,977][21195] Updated weights for policy 0, policy_version 18160 (0.0007) +[2023-10-08 16:26:17,342][21195] Updated weights for policy 0, policy_version 18170 (0.0009) +[2023-10-08 16:26:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 37093376. Throughput: 0: 1711.1, 1: 1723.4. Samples: 9278564. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:26:18,803][19739] Avg episode reward: [(0, '330.120'), (1, '702.340')] +[2023-10-08 16:26:18,804][20740] Saving new best policy, reward=330.120! +[2023-10-08 16:26:20,949][21194] Updated weights for policy 1, policy_version 18050 (0.0008) +[2023-10-08 16:26:21,311][21194] Updated weights for policy 1, policy_version 18060 (0.0009) +[2023-10-08 16:26:21,522][21195] Updated weights for policy 0, policy_version 18180 (0.0010) +[2023-10-08 16:26:21,680][21194] Updated weights for policy 1, policy_version 18070 (0.0007) +[2023-10-08 16:26:21,885][21195] Updated weights for policy 0, policy_version 18190 (0.0007) +[2023-10-08 16:26:22,042][21194] Updated weights for policy 1, policy_version 18080 (0.0007) +[2023-10-08 16:26:22,258][21195] Updated weights for policy 0, policy_version 18200 (0.0007) +[2023-10-08 16:26:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 37158912. Throughput: 0: 1722.4, 1: 1689.7. Samples: 9293326. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:26:23,804][19739] Avg episode reward: [(0, '339.750'), (1, '702.340')] +[2023-10-08 16:26:23,805][20740] Saving new best policy, reward=339.750! +[2023-10-08 16:26:25,993][21194] Updated weights for policy 1, policy_version 18090 (0.0008) +[2023-10-08 16:26:26,113][21195] Updated weights for policy 0, policy_version 18210 (0.0007) +[2023-10-08 16:26:26,358][21194] Updated weights for policy 1, policy_version 18100 (0.0008) +[2023-10-08 16:26:26,481][21195] Updated weights for policy 0, policy_version 18220 (0.0008) +[2023-10-08 16:26:26,725][21194] Updated weights for policy 1, policy_version 18110 (0.0008) +[2023-10-08 16:26:26,846][21195] Updated weights for policy 0, policy_version 18230 (0.0008) +[2023-10-08 16:26:27,220][21195] Updated weights for policy 0, policy_version 18240 (0.0010) +[2023-10-08 16:26:28,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 37224448. Throughput: 0: 1698.4, 1: 1703.1. Samples: 9313656. Policy #0 lag: (min: 1.0, avg: 29.7, max: 32.0) +[2023-10-08 16:26:28,803][19739] Avg episode reward: [(0, '339.750'), (1, '702.340')] +[2023-10-08 16:26:30,685][21194] Updated weights for policy 1, policy_version 18120 (0.0007) +[2023-10-08 16:26:31,045][21194] Updated weights for policy 1, policy_version 18130 (0.0008) +[2023-10-08 16:26:31,096][21195] Updated weights for policy 0, policy_version 18250 (0.0007) +[2023-10-08 16:26:31,413][21194] Updated weights for policy 1, policy_version 18140 (0.0009) +[2023-10-08 16:26:31,454][21195] Updated weights for policy 0, policy_version 18260 (0.0008) +[2023-10-08 16:26:31,824][21195] Updated weights for policy 0, policy_version 18270 (0.0008) +[2023-10-08 16:26:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 37289984. Throughput: 0: 1724.5, 1: 1707.4. Samples: 9329800. Policy #0 lag: (min: 1.0, avg: 29.7, max: 32.0) +[2023-10-08 16:26:33,803][19739] Avg episode reward: [(0, '339.750'), (1, '702.340')] +[2023-10-08 16:26:35,359][21194] Updated weights for policy 1, policy_version 18150 (0.0007) +[2023-10-08 16:26:35,725][21194] Updated weights for policy 1, policy_version 18160 (0.0008) +[2023-10-08 16:26:35,756][21195] Updated weights for policy 0, policy_version 18280 (0.0008) +[2023-10-08 16:26:36,097][21194] Updated weights for policy 1, policy_version 18170 (0.0007) +[2023-10-08 16:26:36,132][21195] Updated weights for policy 0, policy_version 18290 (0.0008) +[2023-10-08 16:26:36,499][21195] Updated weights for policy 0, policy_version 18300 (0.0007) +[2023-10-08 16:26:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 37355520. Throughput: 0: 1696.9, 1: 1694.8. Samples: 9344578. Policy #0 lag: (min: 1.0, avg: 29.7, max: 32.0) +[2023-10-08 16:26:38,803][19739] Avg episode reward: [(0, '340.450'), (1, '701.170')] +[2023-10-08 16:26:38,804][20740] Saving new best policy, reward=340.450! +[2023-10-08 16:26:40,152][21194] Updated weights for policy 1, policy_version 18180 (0.0009) +[2023-10-08 16:26:40,394][21195] Updated weights for policy 0, policy_version 18310 (0.0008) +[2023-10-08 16:26:40,513][21194] Updated weights for policy 1, policy_version 18190 (0.0008) +[2023-10-08 16:26:40,765][21195] Updated weights for policy 0, policy_version 18320 (0.0009) +[2023-10-08 16:26:40,869][21194] Updated weights for policy 1, policy_version 18200 (0.0008) +[2023-10-08 16:26:41,125][21195] Updated weights for policy 0, policy_version 18330 (0.0009) +[2023-10-08 16:26:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 37421056. Throughput: 0: 1715.5, 1: 1725.2. Samples: 9366242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:26:43,803][19739] Avg episode reward: [(0, '340.450'), (1, '701.170')] +[2023-10-08 16:26:44,863][21194] Updated weights for policy 1, policy_version 18210 (0.0009) +[2023-10-08 16:26:45,187][21195] Updated weights for policy 0, policy_version 18340 (0.0010) +[2023-10-08 16:26:45,218][21194] Updated weights for policy 1, policy_version 18220 (0.0009) +[2023-10-08 16:26:45,574][21195] Updated weights for policy 0, policy_version 18350 (0.0007) +[2023-10-08 16:26:45,587][21194] Updated weights for policy 1, policy_version 18230 (0.0009) +[2023-10-08 16:26:45,936][21195] Updated weights for policy 0, policy_version 18360 (0.0007) +[2023-10-08 16:26:45,961][21194] Updated weights for policy 1, policy_version 18240 (0.0008) +[2023-10-08 16:26:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 37486592. Throughput: 0: 1733.9, 1: 1698.3. Samples: 9381406. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:26:48,803][19739] Avg episode reward: [(0, '341.730'), (1, '701.170')] +[2023-10-08 16:26:48,804][20740] Saving new best policy, reward=341.730! +[2023-10-08 16:26:49,747][21195] Updated weights for policy 0, policy_version 18370 (0.0009) +[2023-10-08 16:26:49,874][21194] Updated weights for policy 1, policy_version 18250 (0.0009) +[2023-10-08 16:26:50,114][21195] Updated weights for policy 0, policy_version 18380 (0.0008) +[2023-10-08 16:26:50,234][21194] Updated weights for policy 1, policy_version 18260 (0.0007) +[2023-10-08 16:26:50,488][21195] Updated weights for policy 0, policy_version 18390 (0.0009) +[2023-10-08 16:26:50,605][21194] Updated weights for policy 1, policy_version 18270 (0.0008) +[2023-10-08 16:26:50,845][21195] Updated weights for policy 0, policy_version 18400 (0.0008) +[2023-10-08 16:26:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 37552128. Throughput: 0: 1700.2, 1: 1713.6. Samples: 9396546. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:26:53,803][19739] Avg episode reward: [(0, '341.730'), (1, '701.170')] +[2023-10-08 16:26:54,606][21194] Updated weights for policy 1, policy_version 18280 (0.0008) +[2023-10-08 16:26:54,782][21195] Updated weights for policy 0, policy_version 18410 (0.0008) +[2023-10-08 16:26:54,985][21194] Updated weights for policy 1, policy_version 18290 (0.0007) +[2023-10-08 16:26:55,147][21195] Updated weights for policy 0, policy_version 18420 (0.0008) +[2023-10-08 16:26:55,350][21194] Updated weights for policy 1, policy_version 18300 (0.0009) +[2023-10-08 16:26:55,515][21195] Updated weights for policy 0, policy_version 18430 (0.0009) +[2023-10-08 16:26:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 37617664. Throughput: 0: 1724.5, 1: 1727.9. Samples: 9417526. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 16:26:58,803][19739] Avg episode reward: [(0, '341.730'), (1, '706.890')] +[2023-10-08 16:26:58,813][20836] Saving new best policy, reward=706.890! +[2023-10-08 16:26:59,468][21194] Updated weights for policy 1, policy_version 18310 (0.0008) +[2023-10-08 16:26:59,620][21195] Updated weights for policy 0, policy_version 18440 (0.0009) +[2023-10-08 16:26:59,840][21194] Updated weights for policy 1, policy_version 18320 (0.0008) +[2023-10-08 16:26:59,992][21195] Updated weights for policy 0, policy_version 18450 (0.0007) +[2023-10-08 16:27:00,209][21194] Updated weights for policy 1, policy_version 18330 (0.0009) +[2023-10-08 16:27:00,365][21195] Updated weights for policy 0, policy_version 18460 (0.0009) +[2023-10-08 16:27:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 37683200. Throughput: 0: 1725.0, 1: 1699.8. Samples: 9432680. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 16:27:03,803][19739] Avg episode reward: [(0, '352.940'), (1, '706.890')] +[2023-10-08 16:27:03,804][20740] Saving new best policy, reward=352.940! +[2023-10-08 16:27:04,218][21194] Updated weights for policy 1, policy_version 18340 (0.0007) +[2023-10-08 16:27:04,365][21195] Updated weights for policy 0, policy_version 18470 (0.0009) +[2023-10-08 16:27:04,590][21194] Updated weights for policy 1, policy_version 18350 (0.0008) +[2023-10-08 16:27:04,740][21195] Updated weights for policy 0, policy_version 18480 (0.0007) +[2023-10-08 16:27:04,968][21194] Updated weights for policy 1, policy_version 18360 (0.0008) +[2023-10-08 16:27:05,113][21195] Updated weights for policy 0, policy_version 18490 (0.0009) +[2023-10-08 16:27:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 37748736. Throughput: 0: 1713.6, 1: 1724.4. Samples: 9448036. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 16:27:08,803][19739] Avg episode reward: [(0, '352.940'), (1, '706.890')] +[2023-10-08 16:27:08,824][21194] Updated weights for policy 1, policy_version 18370 (0.0008) +[2023-10-08 16:27:09,189][21195] Updated weights for policy 0, policy_version 18500 (0.0009) +[2023-10-08 16:27:09,193][21194] Updated weights for policy 1, policy_version 18380 (0.0007) +[2023-10-08 16:27:09,549][21195] Updated weights for policy 0, policy_version 18510 (0.0007) +[2023-10-08 16:27:09,559][21194] Updated weights for policy 1, policy_version 18390 (0.0008) +[2023-10-08 16:27:09,928][21194] Updated weights for policy 1, policy_version 18400 (0.0007) +[2023-10-08 16:27:09,935][21195] Updated weights for policy 0, policy_version 18520 (0.0009) +[2023-10-08 16:27:13,692][21194] Updated weights for policy 1, policy_version 18410 (0.0008) +[2023-10-08 16:27:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 37814272. Throughput: 0: 1737.1, 1: 1728.3. Samples: 9469598. Policy #0 lag: (min: 24.0, avg: 41.9, max: 56.0) +[2023-10-08 16:27:13,803][19739] Avg episode reward: [(0, '352.940'), (1, '706.890')] +[2023-10-08 16:27:13,836][21195] Updated weights for policy 0, policy_version 18530 (0.0008) +[2023-10-08 16:27:14,053][21194] Updated weights for policy 1, policy_version 18420 (0.0008) +[2023-10-08 16:27:14,209][21195] Updated weights for policy 0, policy_version 18540 (0.0009) +[2023-10-08 16:27:14,412][21194] Updated weights for policy 1, policy_version 18430 (0.0008) +[2023-10-08 16:27:14,484][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000018432_18874368.pth... +[2023-10-08 16:27:14,513][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000016800_17203200.pth +[2023-10-08 16:27:14,575][21195] Updated weights for policy 0, policy_version 18550 (0.0007) +[2023-10-08 16:27:14,948][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000018560_19005440.pth... +[2023-10-08 16:27:14,949][21195] Updated weights for policy 0, policy_version 18560 (0.0010) +[2023-10-08 16:27:14,987][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000016928_17334272.pth +[2023-10-08 16:27:18,634][21194] Updated weights for policy 1, policy_version 18440 (0.0008) +[2023-10-08 16:27:18,738][21195] Updated weights for policy 0, policy_version 18570 (0.0008) +[2023-10-08 16:27:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 37879808. Throughput: 0: 1723.5, 1: 1713.7. Samples: 9484476. Policy #0 lag: (min: 24.0, avg: 41.9, max: 56.0) +[2023-10-08 16:27:18,803][19739] Avg episode reward: [(0, '356.430'), (1, '706.890')] +[2023-10-08 16:27:18,993][21194] Updated weights for policy 1, policy_version 18450 (0.0008) +[2023-10-08 16:27:19,103][21195] Updated weights for policy 0, policy_version 18580 (0.0008) +[2023-10-08 16:27:19,362][21194] Updated weights for policy 1, policy_version 18460 (0.0008) +[2023-10-08 16:27:19,490][21195] Updated weights for policy 0, policy_version 18590 (0.0008) +[2023-10-08 16:27:19,553][20740] Saving new best policy, reward=356.430! +[2023-10-08 16:27:23,411][21194] Updated weights for policy 1, policy_version 18470 (0.0009) +[2023-10-08 16:27:23,421][21195] Updated weights for policy 0, policy_version 18600 (0.0008) +[2023-10-08 16:27:23,772][21194] Updated weights for policy 1, policy_version 18480 (0.0008) +[2023-10-08 16:27:23,790][21195] Updated weights for policy 0, policy_version 18610 (0.0009) +[2023-10-08 16:27:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 37945344. Throughput: 0: 1733.0, 1: 1720.5. Samples: 9499984. Policy #0 lag: (min: 24.0, avg: 41.9, max: 56.0) +[2023-10-08 16:27:23,803][19739] Avg episode reward: [(0, '359.990'), (1, '706.890')] +[2023-10-08 16:27:24,140][21194] Updated weights for policy 1, policy_version 18490 (0.0007) +[2023-10-08 16:27:24,149][21195] Updated weights for policy 0, policy_version 18620 (0.0009) +[2023-10-08 16:27:24,299][20740] Saving new best policy, reward=359.990! +[2023-10-08 16:27:28,034][21195] Updated weights for policy 0, policy_version 18630 (0.0008) +[2023-10-08 16:27:28,037][21194] Updated weights for policy 1, policy_version 18500 (0.0008) +[2023-10-08 16:27:28,401][21194] Updated weights for policy 1, policy_version 18510 (0.0007) +[2023-10-08 16:27:28,406][21195] Updated weights for policy 0, policy_version 18640 (0.0009) +[2023-10-08 16:27:28,766][21194] Updated weights for policy 1, policy_version 18520 (0.0007) +[2023-10-08 16:27:28,781][21195] Updated weights for policy 0, policy_version 18650 (0.0008) +[2023-10-08 16:27:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 38010880. Throughput: 0: 1735.2, 1: 1715.3. Samples: 9521514. Policy #0 lag: (min: 31.0, avg: 38.4, max: 63.0) +[2023-10-08 16:27:28,803][19739] Avg episode reward: [(0, '394.260'), (1, '706.890')] +[2023-10-08 16:27:28,999][20740] Saving new best policy, reward=394.260! +[2023-10-08 16:27:32,633][21194] Updated weights for policy 1, policy_version 18530 (0.0008) +[2023-10-08 16:27:32,776][21195] Updated weights for policy 0, policy_version 18660 (0.0008) +[2023-10-08 16:27:33,005][21194] Updated weights for policy 1, policy_version 18540 (0.0009) +[2023-10-08 16:27:33,157][21195] Updated weights for policy 0, policy_version 18670 (0.0008) +[2023-10-08 16:27:33,367][21194] Updated weights for policy 1, policy_version 18550 (0.0008) +[2023-10-08 16:27:33,527][21195] Updated weights for policy 0, policy_version 18680 (0.0010) +[2023-10-08 16:27:33,732][21194] Updated weights for policy 1, policy_version 18560 (0.0007) +[2023-10-08 16:27:33,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 38109184. Throughput: 0: 1704.4, 1: 1718.7. Samples: 9535450. Policy #0 lag: (min: 31.0, avg: 38.4, max: 63.0) +[2023-10-08 16:27:33,804][19739] Avg episode reward: [(0, '394.260'), (1, '706.890')] +[2023-10-08 16:27:37,550][21195] Updated weights for policy 0, policy_version 18690 (0.0009) +[2023-10-08 16:27:37,835][21194] Updated weights for policy 1, policy_version 18570 (0.0010) +[2023-10-08 16:27:37,918][21195] Updated weights for policy 0, policy_version 18700 (0.0007) +[2023-10-08 16:27:38,203][21194] Updated weights for policy 1, policy_version 18580 (0.0007) +[2023-10-08 16:27:38,292][21195] Updated weights for policy 0, policy_version 18710 (0.0009) +[2023-10-08 16:27:38,571][21194] Updated weights for policy 1, policy_version 18590 (0.0009) +[2023-10-08 16:27:38,659][21195] Updated weights for policy 0, policy_version 18720 (0.0009) +[2023-10-08 16:27:38,802][19739] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 38207488. Throughput: 0: 1732.4, 1: 1718.1. Samples: 9551818. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:27:38,803][19739] Avg episode reward: [(0, '401.020'), (1, '735.650')] +[2023-10-08 16:27:38,804][20740] Saving new best policy, reward=401.020! +[2023-10-08 16:27:38,804][20836] Saving new best policy, reward=735.650! +[2023-10-08 16:27:42,586][21195] Updated weights for policy 0, policy_version 18730 (0.0007) +[2023-10-08 16:27:42,755][21194] Updated weights for policy 1, policy_version 18600 (0.0007) +[2023-10-08 16:27:42,952][21195] Updated weights for policy 0, policy_version 18740 (0.0007) +[2023-10-08 16:27:43,129][21194] Updated weights for policy 1, policy_version 18610 (0.0009) +[2023-10-08 16:27:43,318][21195] Updated weights for policy 0, policy_version 18750 (0.0007) +[2023-10-08 16:27:43,501][21194] Updated weights for policy 1, policy_version 18620 (0.0009) +[2023-10-08 16:27:43,803][19739] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 38273024. Throughput: 0: 1720.4, 1: 1701.0. Samples: 9571492. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:27:43,803][19739] Avg episode reward: [(0, '401.340'), (1, '735.650')] +[2023-10-08 16:27:43,812][20740] Saving new best policy, reward=401.340! +[2023-10-08 16:27:47,237][21195] Updated weights for policy 0, policy_version 18760 (0.0007) +[2023-10-08 16:27:47,476][21194] Updated weights for policy 1, policy_version 18630 (0.0008) +[2023-10-08 16:27:47,602][21195] Updated weights for policy 0, policy_version 18770 (0.0008) +[2023-10-08 16:27:47,842][21194] Updated weights for policy 1, policy_version 18640 (0.0008) +[2023-10-08 16:27:47,969][21195] Updated weights for policy 0, policy_version 18780 (0.0009) +[2023-10-08 16:27:48,208][21194] Updated weights for policy 1, policy_version 18650 (0.0010) +[2023-10-08 16:27:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 38338560. Throughput: 0: 1706.2, 1: 1716.2. Samples: 9586688. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:27:48,804][19739] Avg episode reward: [(0, '401.340'), (1, '735.650')] +[2023-10-08 16:27:52,042][21195] Updated weights for policy 0, policy_version 18790 (0.0009) +[2023-10-08 16:27:52,228][21194] Updated weights for policy 1, policy_version 18660 (0.0009) +[2023-10-08 16:27:52,415][21195] Updated weights for policy 0, policy_version 18800 (0.0008) +[2023-10-08 16:27:52,591][21194] Updated weights for policy 1, policy_version 18670 (0.0008) +[2023-10-08 16:27:52,778][21195] Updated weights for policy 0, policy_version 18810 (0.0008) +[2023-10-08 16:27:52,952][21194] Updated weights for policy 1, policy_version 18680 (0.0008) +[2023-10-08 16:27:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38404096. Throughput: 0: 1733.2, 1: 1714.4. Samples: 9603178. Policy #0 lag: (min: 28.0, avg: 30.7, max: 60.0) +[2023-10-08 16:27:53,803][19739] Avg episode reward: [(0, '401.340'), (1, '735.640')] +[2023-10-08 16:27:56,761][21195] Updated weights for policy 0, policy_version 18820 (0.0008) +[2023-10-08 16:27:56,930][21194] Updated weights for policy 1, policy_version 18690 (0.0007) +[2023-10-08 16:27:57,128][21195] Updated weights for policy 0, policy_version 18830 (0.0007) +[2023-10-08 16:27:57,305][21194] Updated weights for policy 1, policy_version 18700 (0.0008) +[2023-10-08 16:27:57,494][21195] Updated weights for policy 0, policy_version 18840 (0.0009) +[2023-10-08 16:27:57,670][21194] Updated weights for policy 1, policy_version 18710 (0.0009) +[2023-10-08 16:27:58,045][21194] Updated weights for policy 1, policy_version 18720 (0.0009) +[2023-10-08 16:27:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 38469632. Throughput: 0: 1703.9, 1: 1682.6. Samples: 9621990. Policy #0 lag: (min: 28.0, avg: 30.7, max: 60.0) +[2023-10-08 16:27:58,804][19739] Avg episode reward: [(0, '401.340'), (1, '735.640')] +[2023-10-08 16:28:01,400][21195] Updated weights for policy 0, policy_version 18850 (0.0008) +[2023-10-08 16:28:01,767][21195] Updated weights for policy 0, policy_version 18860 (0.0008) +[2023-10-08 16:28:01,981][21194] Updated weights for policy 1, policy_version 18730 (0.0009) +[2023-10-08 16:28:02,138][21195] Updated weights for policy 0, policy_version 18870 (0.0008) +[2023-10-08 16:28:02,352][21194] Updated weights for policy 1, policy_version 18740 (0.0009) +[2023-10-08 16:28:02,512][21195] Updated weights for policy 0, policy_version 18880 (0.0009) +[2023-10-08 16:28:02,709][21194] Updated weights for policy 1, policy_version 18750 (0.0007) +[2023-10-08 16:28:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38535168. Throughput: 0: 1714.8, 1: 1712.4. Samples: 9638698. Policy #0 lag: (min: 28.0, avg: 30.7, max: 60.0) +[2023-10-08 16:28:03,803][19739] Avg episode reward: [(0, '401.340'), (1, '704.510')] +[2023-10-08 16:28:06,424][21195] Updated weights for policy 0, policy_version 18890 (0.0008) +[2023-10-08 16:28:06,513][21194] Updated weights for policy 1, policy_version 18760 (0.0007) +[2023-10-08 16:28:06,789][21195] Updated weights for policy 0, policy_version 18900 (0.0007) +[2023-10-08 16:28:06,885][21194] Updated weights for policy 1, policy_version 18770 (0.0008) +[2023-10-08 16:28:07,160][21195] Updated weights for policy 0, policy_version 18910 (0.0008) +[2023-10-08 16:28:07,242][21194] Updated weights for policy 1, policy_version 18780 (0.0009) +[2023-10-08 16:28:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38600704. Throughput: 0: 1715.0, 1: 1700.4. Samples: 9653680. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:08,803][19739] Avg episode reward: [(0, '402.730'), (1, '678.660')] +[2023-10-08 16:28:08,804][20740] Saving new best policy, reward=402.730! +[2023-10-08 16:28:11,166][21195] Updated weights for policy 0, policy_version 18920 (0.0010) +[2023-10-08 16:28:11,247][21194] Updated weights for policy 1, policy_version 18790 (0.0008) +[2023-10-08 16:28:11,536][21195] Updated weights for policy 0, policy_version 18930 (0.0010) +[2023-10-08 16:28:11,613][21194] Updated weights for policy 1, policy_version 18800 (0.0008) +[2023-10-08 16:28:11,901][21195] Updated weights for policy 0, policy_version 18940 (0.0009) +[2023-10-08 16:28:11,988][21194] Updated weights for policy 1, policy_version 18810 (0.0007) +[2023-10-08 16:28:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38666240. Throughput: 0: 1698.3, 1: 1692.2. Samples: 9674086. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:13,803][19739] Avg episode reward: [(0, '416.540'), (1, '678.660')] +[2023-10-08 16:28:13,812][20740] Saving new best policy, reward=416.540! +[2023-10-08 16:28:15,758][21195] Updated weights for policy 0, policy_version 18950 (0.0009) +[2023-10-08 16:28:15,897][21194] Updated weights for policy 1, policy_version 18820 (0.0009) +[2023-10-08 16:28:16,130][21195] Updated weights for policy 0, policy_version 18960 (0.0008) +[2023-10-08 16:28:16,267][21194] Updated weights for policy 1, policy_version 18830 (0.0007) +[2023-10-08 16:28:16,502][21195] Updated weights for policy 0, policy_version 18970 (0.0009) +[2023-10-08 16:28:16,632][21194] Updated weights for policy 1, policy_version 18840 (0.0008) +[2023-10-08 16:28:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38731776. Throughput: 0: 1735.4, 1: 1711.5. Samples: 9690558. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:18,803][19739] Avg episode reward: [(0, '416.540'), (1, '682.670')] +[2023-10-08 16:28:20,299][21195] Updated weights for policy 0, policy_version 18980 (0.0008) +[2023-10-08 16:28:20,631][21194] Updated weights for policy 1, policy_version 18850 (0.0008) +[2023-10-08 16:28:20,661][21195] Updated weights for policy 0, policy_version 18990 (0.0008) +[2023-10-08 16:28:20,992][21194] Updated weights for policy 1, policy_version 18860 (0.0008) +[2023-10-08 16:28:21,030][21195] Updated weights for policy 0, policy_version 19000 (0.0008) +[2023-10-08 16:28:21,350][21194] Updated weights for policy 1, policy_version 18870 (0.0007) +[2023-10-08 16:28:21,723][21194] Updated weights for policy 1, policy_version 18880 (0.0008) +[2023-10-08 16:28:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38797312. Throughput: 0: 1711.7, 1: 1695.1. Samples: 9705122. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:23,803][19739] Avg episode reward: [(0, '417.250'), (1, '696.230')] +[2023-10-08 16:28:23,804][20740] Saving new best policy, reward=417.250! +[2023-10-08 16:28:24,946][21195] Updated weights for policy 0, policy_version 19010 (0.0009) +[2023-10-08 16:28:25,328][21195] Updated weights for policy 0, policy_version 19020 (0.0009) +[2023-10-08 16:28:25,609][21194] Updated weights for policy 1, policy_version 18890 (0.0010) +[2023-10-08 16:28:25,695][21195] Updated weights for policy 0, policy_version 19030 (0.0010) +[2023-10-08 16:28:25,975][21194] Updated weights for policy 1, policy_version 18900 (0.0009) +[2023-10-08 16:28:26,072][21195] Updated weights for policy 0, policy_version 19040 (0.0008) +[2023-10-08 16:28:26,341][21194] Updated weights for policy 1, policy_version 18910 (0.0009) +[2023-10-08 16:28:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 38862848. Throughput: 0: 1723.5, 1: 1717.0. Samples: 9726312. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:28,803][19739] Avg episode reward: [(0, '417.250'), (1, '699.690')] +[2023-10-08 16:28:30,084][21195] Updated weights for policy 0, policy_version 19050 (0.0010) +[2023-10-08 16:28:30,380][21194] Updated weights for policy 1, policy_version 18920 (0.0008) +[2023-10-08 16:28:30,446][21195] Updated weights for policy 0, policy_version 19060 (0.0008) +[2023-10-08 16:28:30,750][21194] Updated weights for policy 1, policy_version 18930 (0.0008) +[2023-10-08 16:28:30,826][21195] Updated weights for policy 0, policy_version 19070 (0.0007) +[2023-10-08 16:28:31,110][21194] Updated weights for policy 1, policy_version 18940 (0.0009) +[2023-10-08 16:28:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 38928384. Throughput: 0: 1736.5, 1: 1711.0. Samples: 9741826. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:33,803][19739] Avg episode reward: [(0, '417.250'), (1, '704.350')] +[2023-10-08 16:28:34,778][21195] Updated weights for policy 0, policy_version 19080 (0.0007) +[2023-10-08 16:28:35,001][21194] Updated weights for policy 1, policy_version 18950 (0.0007) +[2023-10-08 16:28:35,150][21195] Updated weights for policy 0, policy_version 19090 (0.0009) +[2023-10-08 16:28:35,361][21194] Updated weights for policy 1, policy_version 18960 (0.0008) +[2023-10-08 16:28:35,521][21195] Updated weights for policy 0, policy_version 19100 (0.0008) +[2023-10-08 16:28:35,731][21194] Updated weights for policy 1, policy_version 18970 (0.0007) +[2023-10-08 16:28:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 38993920. Throughput: 0: 1707.4, 1: 1706.2. Samples: 9756790. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:28:38,803][19739] Avg episode reward: [(0, '431.400'), (1, '717.240')] +[2023-10-08 16:28:38,804][20740] Saving new best policy, reward=431.400! +[2023-10-08 16:28:39,488][21195] Updated weights for policy 0, policy_version 19110 (0.0007) +[2023-10-08 16:28:39,827][21194] Updated weights for policy 1, policy_version 18980 (0.0009) +[2023-10-08 16:28:39,851][21195] Updated weights for policy 0, policy_version 19120 (0.0007) +[2023-10-08 16:28:40,198][21194] Updated weights for policy 1, policy_version 18990 (0.0008) +[2023-10-08 16:28:40,216][21195] Updated weights for policy 0, policy_version 19130 (0.0007) +[2023-10-08 16:28:40,562][21194] Updated weights for policy 1, policy_version 19000 (0.0008) +[2023-10-08 16:28:43,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13107.1, 300 sec: 13773.6). Total num frames: 39059456. Throughput: 0: 1743.2, 1: 1732.3. Samples: 9778386. Policy #0 lag: (min: 18.0, avg: 22.6, max: 50.0) +[2023-10-08 16:28:43,804][19739] Avg episode reward: [(0, '431.980'), (1, '716.950')] +[2023-10-08 16:28:44,021][21195] Updated weights for policy 0, policy_version 19140 (0.0007) +[2023-10-08 16:28:44,394][21195] Updated weights for policy 0, policy_version 19150 (0.0008) +[2023-10-08 16:28:44,637][21194] Updated weights for policy 1, policy_version 19010 (0.0008) +[2023-10-08 16:28:44,754][21195] Updated weights for policy 0, policy_version 19160 (0.0009) +[2023-10-08 16:28:44,998][21194] Updated weights for policy 1, policy_version 19020 (0.0007) +[2023-10-08 16:28:45,046][20740] Saving new best policy, reward=431.980! +[2023-10-08 16:28:45,367][21194] Updated weights for policy 1, policy_version 19030 (0.0007) +[2023-10-08 16:28:45,723][21194] Updated weights for policy 1, policy_version 19040 (0.0008) +[2023-10-08 16:28:48,535][21195] Updated weights for policy 0, policy_version 19170 (0.0007) +[2023-10-08 16:28:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 39124992. Throughput: 0: 1735.8, 1: 1704.3. Samples: 9793502. Policy #0 lag: (min: 18.0, avg: 22.6, max: 50.0) +[2023-10-08 16:28:48,803][19739] Avg episode reward: [(0, '425.470'), (1, '710.100')] +[2023-10-08 16:28:48,898][21195] Updated weights for policy 0, policy_version 19180 (0.0007) +[2023-10-08 16:28:49,263][21195] Updated weights for policy 0, policy_version 19190 (0.0007) +[2023-10-08 16:28:49,628][21195] Updated weights for policy 0, policy_version 19200 (0.0008) +[2023-10-08 16:28:49,630][21194] Updated weights for policy 1, policy_version 19050 (0.0008) +[2023-10-08 16:28:49,994][21194] Updated weights for policy 1, policy_version 19060 (0.0010) +[2023-10-08 16:28:50,359][21194] Updated weights for policy 1, policy_version 19070 (0.0011) +[2023-10-08 16:28:53,509][21195] Updated weights for policy 0, policy_version 19210 (0.0010) +[2023-10-08 16:28:53,803][19739] Fps is (10 sec: 13107.7, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 39190528. Throughput: 0: 1736.8, 1: 1721.5. Samples: 9809306. Policy #0 lag: (min: 18.0, avg: 22.6, max: 50.0) +[2023-10-08 16:28:53,803][19739] Avg episode reward: [(0, '425.470'), (1, '706.070')] +[2023-10-08 16:28:53,874][21195] Updated weights for policy 0, policy_version 19220 (0.0010) +[2023-10-08 16:28:54,246][21195] Updated weights for policy 0, policy_version 19230 (0.0008) +[2023-10-08 16:28:54,356][21194] Updated weights for policy 1, policy_version 19080 (0.0010) +[2023-10-08 16:28:54,730][21194] Updated weights for policy 1, policy_version 19090 (0.0008) +[2023-10-08 16:28:55,107][21194] Updated weights for policy 1, policy_version 19100 (0.0009) +[2023-10-08 16:28:58,057][21195] Updated weights for policy 0, policy_version 19240 (0.0007) +[2023-10-08 16:28:58,418][21195] Updated weights for policy 0, policy_version 19250 (0.0009) +[2023-10-08 16:28:58,790][21195] Updated weights for policy 0, policy_version 19260 (0.0007) +[2023-10-08 16:28:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 39256064. Throughput: 0: 1752.8, 1: 1730.3. Samples: 9830826. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 16:28:58,804][19739] Avg episode reward: [(0, '425.750'), (1, '692.420')] +[2023-10-08 16:28:59,029][21194] Updated weights for policy 1, policy_version 19110 (0.0009) +[2023-10-08 16:28:59,399][21194] Updated weights for policy 1, policy_version 19120 (0.0008) +[2023-10-08 16:28:59,766][21194] Updated weights for policy 1, policy_version 19130 (0.0008) +[2023-10-08 16:29:02,663][21195] Updated weights for policy 0, policy_version 19270 (0.0007) +[2023-10-08 16:29:03,034][21195] Updated weights for policy 0, policy_version 19280 (0.0007) +[2023-10-08 16:29:03,411][21195] Updated weights for policy 0, policy_version 19290 (0.0007) +[2023-10-08 16:29:03,716][21194] Updated weights for policy 1, policy_version 19140 (0.0008) +[2023-10-08 16:29:03,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 39354368. Throughput: 0: 1725.9, 1: 1704.6. Samples: 9844930. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 16:29:03,803][19739] Avg episode reward: [(0, '420.730'), (1, '686.450')] +[2023-10-08 16:29:04,077][21194] Updated weights for policy 1, policy_version 19150 (0.0008) +[2023-10-08 16:29:04,446][21194] Updated weights for policy 1, policy_version 19160 (0.0010) +[2023-10-08 16:29:07,305][21195] Updated weights for policy 0, policy_version 19300 (0.0007) +[2023-10-08 16:29:07,666][21195] Updated weights for policy 0, policy_version 19310 (0.0007) +[2023-10-08 16:29:08,036][21195] Updated weights for policy 0, policy_version 19320 (0.0007) +[2023-10-08 16:29:08,445][21194] Updated weights for policy 1, policy_version 19170 (0.0011) +[2023-10-08 16:29:08,803][19739] Fps is (10 sec: 16384.4, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 39419904. Throughput: 0: 1757.8, 1: 1725.1. Samples: 9861852. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 16:29:08,803][19739] Avg episode reward: [(0, '421.590'), (1, '686.450')] +[2023-10-08 16:29:08,806][21194] Updated weights for policy 1, policy_version 19180 (0.0011) +[2023-10-08 16:29:09,175][21194] Updated weights for policy 1, policy_version 19190 (0.0010) +[2023-10-08 16:29:09,545][21194] Updated weights for policy 1, policy_version 19200 (0.0008) +[2023-10-08 16:29:11,995][21195] Updated weights for policy 0, policy_version 19330 (0.0008) +[2023-10-08 16:29:12,382][21195] Updated weights for policy 0, policy_version 19340 (0.0010) +[2023-10-08 16:29:12,756][21195] Updated weights for policy 0, policy_version 19350 (0.0009) +[2023-10-08 16:29:13,114][21195] Updated weights for policy 0, policy_version 19360 (0.0009) +[2023-10-08 16:29:13,543][21194] Updated weights for policy 1, policy_version 19210 (0.0008) +[2023-10-08 16:29:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 39485440. Throughput: 0: 1739.9, 1: 1723.6. Samples: 9882168. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:29:13,803][19739] Avg episode reward: [(0, '421.590'), (1, '686.450')] +[2023-10-08 16:29:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000019360_19824640.pth... +[2023-10-08 16:29:13,841][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000017728_18153472.pth +[2023-10-08 16:29:13,910][21194] Updated weights for policy 1, policy_version 19220 (0.0009) +[2023-10-08 16:29:14,282][21194] Updated weights for policy 1, policy_version 19230 (0.0009) +[2023-10-08 16:29:14,351][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000019232_19693568.pth... +[2023-10-08 16:29:14,390][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000017600_18022400.pth +[2023-10-08 16:29:17,121][21195] Updated weights for policy 0, policy_version 19370 (0.0008) +[2023-10-08 16:29:17,491][21195] Updated weights for policy 0, policy_version 19380 (0.0007) +[2023-10-08 16:29:17,873][21195] Updated weights for policy 0, policy_version 19390 (0.0008) +[2023-10-08 16:29:18,306][21194] Updated weights for policy 1, policy_version 19240 (0.0010) +[2023-10-08 16:29:18,682][21194] Updated weights for policy 1, policy_version 19250 (0.0008) +[2023-10-08 16:29:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 39550976. Throughput: 0: 1734.1, 1: 1718.5. Samples: 9897194. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:29:18,803][19739] Avg episode reward: [(0, '421.590'), (1, '673.760')] +[2023-10-08 16:29:19,050][21194] Updated weights for policy 1, policy_version 19260 (0.0009) +[2023-10-08 16:29:21,906][21195] Updated weights for policy 0, policy_version 19400 (0.0010) +[2023-10-08 16:29:22,272][21195] Updated weights for policy 0, policy_version 19410 (0.0011) +[2023-10-08 16:29:22,644][21195] Updated weights for policy 0, policy_version 19420 (0.0010) +[2023-10-08 16:29:22,948][21194] Updated weights for policy 1, policy_version 19270 (0.0009) +[2023-10-08 16:29:23,319][21194] Updated weights for policy 1, policy_version 19280 (0.0008) +[2023-10-08 16:29:23,695][21194] Updated weights for policy 1, policy_version 19290 (0.0008) +[2023-10-08 16:29:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 39616512. Throughput: 0: 1755.7, 1: 1724.5. Samples: 9913398. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:29:23,803][19739] Avg episode reward: [(0, '414.890'), (1, '675.760')] +[2023-10-08 16:29:26,623][21195] Updated weights for policy 0, policy_version 19430 (0.0007) +[2023-10-08 16:29:26,984][21195] Updated weights for policy 0, policy_version 19440 (0.0008) +[2023-10-08 16:29:27,352][21195] Updated weights for policy 0, policy_version 19450 (0.0007) +[2023-10-08 16:29:27,579][21194] Updated weights for policy 1, policy_version 19300 (0.0009) +[2023-10-08 16:29:27,950][21194] Updated weights for policy 1, policy_version 19310 (0.0008) +[2023-10-08 16:29:28,324][21194] Updated weights for policy 1, policy_version 19320 (0.0008) +[2023-10-08 16:29:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 39714816. Throughput: 0: 1721.3, 1: 1711.4. Samples: 9932854. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:29:28,803][19739] Avg episode reward: [(0, '414.890'), (1, '675.760')] +[2023-10-08 16:29:31,200][21195] Updated weights for policy 0, policy_version 19460 (0.0008) +[2023-10-08 16:29:31,584][21195] Updated weights for policy 0, policy_version 19470 (0.0009) +[2023-10-08 16:29:31,948][21195] Updated weights for policy 0, policy_version 19480 (0.0008) +[2023-10-08 16:29:32,251][21194] Updated weights for policy 1, policy_version 19330 (0.0010) +[2023-10-08 16:29:32,622][21194] Updated weights for policy 1, policy_version 19340 (0.0008) +[2023-10-08 16:29:32,985][21194] Updated weights for policy 1, policy_version 19350 (0.0009) +[2023-10-08 16:29:33,354][21194] Updated weights for policy 1, policy_version 19360 (0.0008) +[2023-10-08 16:29:33,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 39780352. Throughput: 0: 1731.2, 1: 1724.3. Samples: 9949000. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:29:33,803][19739] Avg episode reward: [(0, '414.890'), (1, '675.760')] +[2023-10-08 16:29:35,882][21195] Updated weights for policy 0, policy_version 19490 (0.0010) +[2023-10-08 16:29:36,262][21195] Updated weights for policy 0, policy_version 19500 (0.0008) +[2023-10-08 16:29:36,639][21195] Updated weights for policy 0, policy_version 19510 (0.0009) +[2023-10-08 16:29:37,015][21195] Updated weights for policy 0, policy_version 19520 (0.0008) +[2023-10-08 16:29:37,268][21194] Updated weights for policy 1, policy_version 19370 (0.0008) +[2023-10-08 16:29:37,640][21194] Updated weights for policy 1, policy_version 19380 (0.0007) +[2023-10-08 16:29:38,007][21194] Updated weights for policy 1, policy_version 19390 (0.0011) +[2023-10-08 16:29:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 39845888. Throughput: 0: 1724.0, 1: 1727.2. Samples: 9964612. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:29:38,803][19739] Avg episode reward: [(0, '414.890'), (1, '671.830')] +[2023-10-08 16:29:40,966][21195] Updated weights for policy 0, policy_version 19530 (0.0010) +[2023-10-08 16:29:41,336][21195] Updated weights for policy 0, policy_version 19540 (0.0009) +[2023-10-08 16:29:41,698][21195] Updated weights for policy 0, policy_version 19550 (0.0008) +[2023-10-08 16:29:41,889][21194] Updated weights for policy 1, policy_version 19400 (0.0010) +[2023-10-08 16:29:42,255][21194] Updated weights for policy 1, policy_version 19410 (0.0011) +[2023-10-08 16:29:42,622][21194] Updated weights for policy 1, policy_version 19420 (0.0010) +[2023-10-08 16:29:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 39911424. Throughput: 0: 1713.9, 1: 1700.8. Samples: 9984486. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 16:29:43,804][19739] Avg episode reward: [(0, '414.890'), (1, '660.410')] +[2023-10-08 16:29:45,736][21195] Updated weights for policy 0, policy_version 19560 (0.0009) +[2023-10-08 16:29:46,112][21195] Updated weights for policy 0, policy_version 19570 (0.0010) +[2023-10-08 16:29:46,474][21195] Updated weights for policy 0, policy_version 19580 (0.0008) +[2023-10-08 16:29:46,490][21194] Updated weights for policy 1, policy_version 19430 (0.0008) +[2023-10-08 16:29:46,865][21194] Updated weights for policy 1, policy_version 19440 (0.0008) +[2023-10-08 16:29:47,224][21194] Updated weights for policy 1, policy_version 19450 (0.0010) +[2023-10-08 16:29:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 39976960. Throughput: 0: 1739.4, 1: 1735.7. Samples: 10001310. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:29:48,803][19739] Avg episode reward: [(0, '427.680'), (1, '667.950')] +[2023-10-08 16:29:50,481][21195] Updated weights for policy 0, policy_version 19590 (0.0008) +[2023-10-08 16:29:50,852][21195] Updated weights for policy 0, policy_version 19600 (0.0008) +[2023-10-08 16:29:51,199][21194] Updated weights for policy 1, policy_version 19460 (0.0009) +[2023-10-08 16:29:51,210][21195] Updated weights for policy 0, policy_version 19610 (0.0008) +[2023-10-08 16:29:51,559][21194] Updated weights for policy 1, policy_version 19470 (0.0007) +[2023-10-08 16:29:51,926][21194] Updated weights for policy 1, policy_version 19480 (0.0010) +[2023-10-08 16:29:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 40042496. Throughput: 0: 1703.2, 1: 1712.0. Samples: 10015538. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:29:53,803][19739] Avg episode reward: [(0, '427.680'), (1, '667.950')] +[2023-10-08 16:29:55,213][21195] Updated weights for policy 0, policy_version 19620 (0.0007) +[2023-10-08 16:29:55,577][21195] Updated weights for policy 0, policy_version 19630 (0.0009) +[2023-10-08 16:29:55,899][21194] Updated weights for policy 1, policy_version 19490 (0.0009) +[2023-10-08 16:29:55,955][21195] Updated weights for policy 0, policy_version 19640 (0.0008) +[2023-10-08 16:29:56,271][21194] Updated weights for policy 1, policy_version 19500 (0.0007) +[2023-10-08 16:29:56,634][21194] Updated weights for policy 1, policy_version 19510 (0.0007) +[2023-10-08 16:29:57,005][21194] Updated weights for policy 1, policy_version 19520 (0.0009) +[2023-10-08 16:29:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 40108032. Throughput: 0: 1728.6, 1: 1704.9. Samples: 10036676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:29:58,803][19739] Avg episode reward: [(0, '414.850'), (1, '676.990')] +[2023-10-08 16:29:59,866][21195] Updated weights for policy 0, policy_version 19650 (0.0008) +[2023-10-08 16:30:00,248][21195] Updated weights for policy 0, policy_version 19660 (0.0009) +[2023-10-08 16:30:00,630][21195] Updated weights for policy 0, policy_version 19670 (0.0009) +[2023-10-08 16:30:00,932][21194] Updated weights for policy 1, policy_version 19530 (0.0009) +[2023-10-08 16:30:00,993][21195] Updated weights for policy 0, policy_version 19680 (0.0008) +[2023-10-08 16:30:01,299][21194] Updated weights for policy 1, policy_version 19540 (0.0009) +[2023-10-08 16:30:01,669][21194] Updated weights for policy 1, policy_version 19550 (0.0008) +[2023-10-08 16:30:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 40173568. Throughput: 0: 1741.3, 1: 1723.8. Samples: 10053124. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:30:03,803][19739] Avg episode reward: [(0, '412.400'), (1, '676.990')] +[2023-10-08 16:30:04,827][21195] Updated weights for policy 0, policy_version 19690 (0.0008) +[2023-10-08 16:30:05,204][21195] Updated weights for policy 0, policy_version 19700 (0.0007) +[2023-10-08 16:30:05,578][21195] Updated weights for policy 0, policy_version 19710 (0.0009) +[2023-10-08 16:30:05,610][21194] Updated weights for policy 1, policy_version 19560 (0.0008) +[2023-10-08 16:30:05,976][21194] Updated weights for policy 1, policy_version 19570 (0.0008) +[2023-10-08 16:30:06,337][21194] Updated weights for policy 1, policy_version 19580 (0.0007) +[2023-10-08 16:30:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 40239104. Throughput: 0: 1718.8, 1: 1712.1. Samples: 10067788. Policy #0 lag: (min: 2.0, avg: 5.1, max: 30.0) +[2023-10-08 16:30:08,803][19739] Avg episode reward: [(0, '426.780'), (1, '676.990')] +[2023-10-08 16:30:09,354][21195] Updated weights for policy 0, policy_version 19720 (0.0009) +[2023-10-08 16:30:09,719][21195] Updated weights for policy 0, policy_version 19730 (0.0010) +[2023-10-08 16:30:10,092][21195] Updated weights for policy 0, policy_version 19740 (0.0010) +[2023-10-08 16:30:10,358][21194] Updated weights for policy 1, policy_version 19590 (0.0008) +[2023-10-08 16:30:10,726][21194] Updated weights for policy 1, policy_version 19600 (0.0009) +[2023-10-08 16:30:11,090][21194] Updated weights for policy 1, policy_version 19610 (0.0010) +[2023-10-08 16:30:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 40304640. Throughput: 0: 1754.2, 1: 1724.8. Samples: 10089410. Policy #0 lag: (min: 2.0, avg: 5.1, max: 30.0) +[2023-10-08 16:30:13,803][19739] Avg episode reward: [(0, '426.780'), (1, '676.990')] +[2023-10-08 16:30:13,901][21195] Updated weights for policy 0, policy_version 19750 (0.0007) +[2023-10-08 16:30:14,264][21195] Updated weights for policy 0, policy_version 19760 (0.0007) +[2023-10-08 16:30:14,638][21195] Updated weights for policy 0, policy_version 19770 (0.0007) +[2023-10-08 16:30:15,097][21194] Updated weights for policy 1, policy_version 19620 (0.0009) +[2023-10-08 16:30:15,457][21194] Updated weights for policy 1, policy_version 19630 (0.0011) +[2023-10-08 16:30:15,826][21194] Updated weights for policy 1, policy_version 19640 (0.0010) +[2023-10-08 16:30:18,289][21195] Updated weights for policy 0, policy_version 19780 (0.0008) +[2023-10-08 16:30:18,664][21195] Updated weights for policy 0, policy_version 19790 (0.0009) +[2023-10-08 16:30:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 40370176. Throughput: 0: 1740.0, 1: 1713.1. Samples: 10104386. Policy #0 lag: (min: 2.0, avg: 5.1, max: 30.0) +[2023-10-08 16:30:18,803][19739] Avg episode reward: [(0, '439.830'), (1, '676.990')] +[2023-10-08 16:30:19,035][21195] Updated weights for policy 0, policy_version 19800 (0.0008) +[2023-10-08 16:30:19,333][20740] Saving new best policy, reward=439.830! +[2023-10-08 16:30:19,673][21194] Updated weights for policy 1, policy_version 19650 (0.0010) +[2023-10-08 16:30:20,039][21194] Updated weights for policy 1, policy_version 19660 (0.0010) +[2023-10-08 16:30:20,413][21194] Updated weights for policy 1, policy_version 19670 (0.0008) +[2023-10-08 16:30:20,770][21194] Updated weights for policy 1, policy_version 19680 (0.0009) +[2023-10-08 16:30:23,084][21195] Updated weights for policy 0, policy_version 19810 (0.0010) +[2023-10-08 16:30:23,456][21195] Updated weights for policy 0, policy_version 19820 (0.0007) +[2023-10-08 16:30:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 40435712. Throughput: 0: 1751.4, 1: 1714.7. Samples: 10120584. Policy #0 lag: (min: 29.0, avg: 38.5, max: 61.0) +[2023-10-08 16:30:23,804][19739] Avg episode reward: [(0, '444.990'), (1, '676.990')] +[2023-10-08 16:30:23,828][21195] Updated weights for policy 0, policy_version 19830 (0.0007) +[2023-10-08 16:30:24,206][20740] Saving new best policy, reward=444.990! +[2023-10-08 16:30:24,206][21195] Updated weights for policy 0, policy_version 19840 (0.0009) +[2023-10-08 16:30:24,658][21194] Updated weights for policy 1, policy_version 19690 (0.0007) +[2023-10-08 16:30:25,025][21194] Updated weights for policy 1, policy_version 19700 (0.0007) +[2023-10-08 16:30:25,388][21194] Updated weights for policy 1, policy_version 19710 (0.0008) +[2023-10-08 16:30:28,136][21195] Updated weights for policy 0, policy_version 19850 (0.0007) +[2023-10-08 16:30:28,508][21195] Updated weights for policy 0, policy_version 19860 (0.0008) +[2023-10-08 16:30:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 40501248. Throughput: 0: 1754.6, 1: 1742.9. Samples: 10141874. Policy #0 lag: (min: 29.0, avg: 38.5, max: 61.0) +[2023-10-08 16:30:28,803][19739] Avg episode reward: [(0, '444.990'), (1, '676.990')] +[2023-10-08 16:30:28,876][21195] Updated weights for policy 0, policy_version 19870 (0.0009) +[2023-10-08 16:30:29,400][21194] Updated weights for policy 1, policy_version 19720 (0.0008) +[2023-10-08 16:30:29,769][21194] Updated weights for policy 1, policy_version 19730 (0.0009) +[2023-10-08 16:30:30,139][21194] Updated weights for policy 1, policy_version 19740 (0.0008) +[2023-10-08 16:30:32,872][21195] Updated weights for policy 0, policy_version 19880 (0.0008) +[2023-10-08 16:30:33,249][21195] Updated weights for policy 0, policy_version 19890 (0.0007) +[2023-10-08 16:30:33,627][21195] Updated weights for policy 0, policy_version 19900 (0.0007) +[2023-10-08 16:30:33,803][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 40599552. Throughput: 0: 1725.1, 1: 1706.8. Samples: 10155746. Policy #0 lag: (min: 29.0, avg: 38.5, max: 61.0) +[2023-10-08 16:30:33,803][19739] Avg episode reward: [(0, '444.990'), (1, '676.990')] +[2023-10-08 16:30:34,231][21194] Updated weights for policy 1, policy_version 19750 (0.0009) +[2023-10-08 16:30:34,612][21194] Updated weights for policy 1, policy_version 19760 (0.0009) +[2023-10-08 16:30:34,976][21194] Updated weights for policy 1, policy_version 19770 (0.0007) +[2023-10-08 16:30:37,507][21195] Updated weights for policy 0, policy_version 19910 (0.0007) +[2023-10-08 16:30:37,884][21195] Updated weights for policy 0, policy_version 19920 (0.0008) +[2023-10-08 16:30:38,247][21195] Updated weights for policy 0, policy_version 19930 (0.0010) +[2023-10-08 16:30:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 40665088. Throughput: 0: 1754.8, 1: 1727.9. Samples: 10172258. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:30:38,803][19739] Avg episode reward: [(0, '444.990'), (1, '676.990')] +[2023-10-08 16:30:38,870][21194] Updated weights for policy 1, policy_version 19780 (0.0009) +[2023-10-08 16:30:39,235][21194] Updated weights for policy 1, policy_version 19790 (0.0008) +[2023-10-08 16:30:39,605][21194] Updated weights for policy 1, policy_version 19800 (0.0010) +[2023-10-08 16:30:42,069][21195] Updated weights for policy 0, policy_version 19940 (0.0009) +[2023-10-08 16:30:42,439][21195] Updated weights for policy 0, policy_version 19950 (0.0007) +[2023-10-08 16:30:42,811][21195] Updated weights for policy 0, policy_version 19960 (0.0007) +[2023-10-08 16:30:43,548][21194] Updated weights for policy 1, policy_version 19810 (0.0010) +[2023-10-08 16:30:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 40730624. Throughput: 0: 1731.5, 1: 1739.1. Samples: 10192850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:30:43,803][19739] Avg episode reward: [(0, '429.710'), (1, '676.990')] +[2023-10-08 16:30:43,916][21194] Updated weights for policy 1, policy_version 19820 (0.0009) +[2023-10-08 16:30:44,271][21194] Updated weights for policy 1, policy_version 19830 (0.0008) +[2023-10-08 16:30:44,633][21194] Updated weights for policy 1, policy_version 19840 (0.0009) +[2023-10-08 16:30:46,687][21195] Updated weights for policy 0, policy_version 19970 (0.0007) +[2023-10-08 16:30:47,061][21195] Updated weights for policy 0, policy_version 19980 (0.0007) +[2023-10-08 16:30:47,443][21195] Updated weights for policy 0, policy_version 19990 (0.0009) +[2023-10-08 16:30:47,812][21195] Updated weights for policy 0, policy_version 20000 (0.0008) +[2023-10-08 16:30:48,583][21194] Updated weights for policy 1, policy_version 19850 (0.0011) +[2023-10-08 16:30:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 40796160. Throughput: 0: 1725.7, 1: 1715.7. Samples: 10207988. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:30:48,803][19739] Avg episode reward: [(0, '435.160'), (1, '676.990')] +[2023-10-08 16:30:48,946][21194] Updated weights for policy 1, policy_version 19860 (0.0009) +[2023-10-08 16:30:49,313][21194] Updated weights for policy 1, policy_version 19870 (0.0010) +[2023-10-08 16:30:51,743][21195] Updated weights for policy 0, policy_version 20010 (0.0009) +[2023-10-08 16:30:52,108][21195] Updated weights for policy 0, policy_version 20020 (0.0007) +[2023-10-08 16:30:52,485][21195] Updated weights for policy 0, policy_version 20030 (0.0007) +[2023-10-08 16:30:53,421][21194] Updated weights for policy 1, policy_version 19880 (0.0012) +[2023-10-08 16:30:53,789][21194] Updated weights for policy 1, policy_version 19890 (0.0010) +[2023-10-08 16:30:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 40861696. Throughput: 0: 1749.0, 1: 1730.1. Samples: 10224348. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:30:53,803][19739] Avg episode reward: [(0, '449.670'), (1, '676.990')] +[2023-10-08 16:30:53,804][20740] Saving new best policy, reward=449.670! +[2023-10-08 16:30:54,157][21194] Updated weights for policy 1, policy_version 19900 (0.0009) +[2023-10-08 16:30:56,245][21195] Updated weights for policy 0, policy_version 20040 (0.0011) +[2023-10-08 16:30:56,616][21195] Updated weights for policy 0, policy_version 20050 (0.0009) +[2023-10-08 16:30:56,981][21195] Updated weights for policy 0, policy_version 20060 (0.0008) +[2023-10-08 16:30:58,148][21194] Updated weights for policy 1, policy_version 19910 (0.0009) +[2023-10-08 16:30:58,513][21194] Updated weights for policy 1, policy_version 19920 (0.0008) +[2023-10-08 16:30:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 40927232. Throughput: 0: 1726.0, 1: 1726.9. Samples: 10244790. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:30:58,803][19739] Avg episode reward: [(0, '449.670'), (1, '676.990')] +[2023-10-08 16:30:58,882][21194] Updated weights for policy 1, policy_version 19930 (0.0009) +[2023-10-08 16:31:00,894][21195] Updated weights for policy 0, policy_version 20070 (0.0008) +[2023-10-08 16:31:01,257][21195] Updated weights for policy 0, policy_version 20080 (0.0009) +[2023-10-08 16:31:01,621][21195] Updated weights for policy 0, policy_version 20090 (0.0010) +[2023-10-08 16:31:02,753][21194] Updated weights for policy 1, policy_version 19940 (0.0008) +[2023-10-08 16:31:03,130][21194] Updated weights for policy 1, policy_version 19950 (0.0008) +[2023-10-08 16:31:03,491][21194] Updated weights for policy 1, policy_version 19960 (0.0009) +[2023-10-08 16:31:03,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 41025536. Throughput: 0: 1738.7, 1: 1725.4. Samples: 10260272. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:31:03,803][19739] Avg episode reward: [(0, '449.670'), (1, '676.990')] +[2023-10-08 16:31:05,368][21195] Updated weights for policy 0, policy_version 20100 (0.0009) +[2023-10-08 16:31:05,736][21195] Updated weights for policy 0, policy_version 20110 (0.0007) +[2023-10-08 16:31:06,104][21195] Updated weights for policy 0, policy_version 20120 (0.0008) +[2023-10-08 16:31:07,354][21194] Updated weights for policy 1, policy_version 19970 (0.0008) +[2023-10-08 16:31:07,715][21194] Updated weights for policy 1, policy_version 19980 (0.0008) +[2023-10-08 16:31:08,080][21194] Updated weights for policy 1, policy_version 19990 (0.0008) +[2023-10-08 16:31:08,442][21194] Updated weights for policy 1, policy_version 20000 (0.0007) +[2023-10-08 16:31:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 41091072. Throughput: 0: 1724.1, 1: 1732.8. Samples: 10276142. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:31:08,803][19739] Avg episode reward: [(0, '463.750'), (1, '676.990')] +[2023-10-08 16:31:08,804][20740] Saving new best policy, reward=463.750! +[2023-10-08 16:31:10,010][21195] Updated weights for policy 0, policy_version 20130 (0.0009) +[2023-10-08 16:31:10,382][21195] Updated weights for policy 0, policy_version 20140 (0.0010) +[2023-10-08 16:31:10,746][21195] Updated weights for policy 0, policy_version 20150 (0.0011) +[2023-10-08 16:31:11,115][21195] Updated weights for policy 0, policy_version 20160 (0.0011) +[2023-10-08 16:31:12,141][21194] Updated weights for policy 1, policy_version 20010 (0.0010) +[2023-10-08 16:31:12,511][21194] Updated weights for policy 1, policy_version 20020 (0.0009) +[2023-10-08 16:31:12,878][21194] Updated weights for policy 1, policy_version 20030 (0.0007) +[2023-10-08 16:31:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 41156608. Throughput: 0: 1726.1, 1: 1707.6. Samples: 10296390. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 16:31:13,804][19739] Avg episode reward: [(0, '475.660'), (1, '680.770')] +[2023-10-08 16:31:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000020160_20643840.pth... +[2023-10-08 16:31:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000020032_20512768.pth... +[2023-10-08 16:31:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000018560_19005440.pth +[2023-10-08 16:31:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000018432_18874368.pth +[2023-10-08 16:31:13,855][20740] Saving new best policy, reward=475.660! +[2023-10-08 16:31:15,108][21195] Updated weights for policy 0, policy_version 20170 (0.0007) +[2023-10-08 16:31:15,474][21195] Updated weights for policy 0, policy_version 20180 (0.0008) +[2023-10-08 16:31:15,842][21195] Updated weights for policy 0, policy_version 20190 (0.0008) +[2023-10-08 16:31:16,820][21194] Updated weights for policy 1, policy_version 20040 (0.0010) +[2023-10-08 16:31:17,181][21194] Updated weights for policy 1, policy_version 20050 (0.0009) +[2023-10-08 16:31:17,551][21194] Updated weights for policy 1, policy_version 20060 (0.0008) +[2023-10-08 16:31:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 41222144. Throughput: 0: 1751.3, 1: 1743.3. Samples: 10313006. Policy #0 lag: (min: 10.0, avg: 10.6, max: 24.0) +[2023-10-08 16:31:18,803][19739] Avg episode reward: [(0, '475.660'), (1, '680.770')] +[2023-10-08 16:31:19,802][21195] Updated weights for policy 0, policy_version 20200 (0.0009) +[2023-10-08 16:31:20,180][21195] Updated weights for policy 0, policy_version 20210 (0.0010) +[2023-10-08 16:31:20,546][21195] Updated weights for policy 0, policy_version 20220 (0.0009) +[2023-10-08 16:31:21,433][21194] Updated weights for policy 1, policy_version 20070 (0.0008) +[2023-10-08 16:31:21,804][21194] Updated weights for policy 1, policy_version 20080 (0.0008) +[2023-10-08 16:31:22,171][21194] Updated weights for policy 1, policy_version 20090 (0.0009) +[2023-10-08 16:31:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 41287680. Throughput: 0: 1724.6, 1: 1730.1. Samples: 10327720. Policy #0 lag: (min: 10.0, avg: 10.6, max: 24.0) +[2023-10-08 16:31:23,803][19739] Avg episode reward: [(0, '475.660'), (1, '680.770')] +[2023-10-08 16:31:24,606][21195] Updated weights for policy 0, policy_version 20230 (0.0010) +[2023-10-08 16:31:24,989][21195] Updated weights for policy 0, policy_version 20240 (0.0010) +[2023-10-08 16:31:25,361][21195] Updated weights for policy 0, policy_version 20250 (0.0010) +[2023-10-08 16:31:26,089][21194] Updated weights for policy 1, policy_version 20100 (0.0008) +[2023-10-08 16:31:26,454][21194] Updated weights for policy 1, policy_version 20110 (0.0007) +[2023-10-08 16:31:26,816][21194] Updated weights for policy 1, policy_version 20120 (0.0009) +[2023-10-08 16:31:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 41353216. Throughput: 0: 1747.4, 1: 1717.6. Samples: 10348778. Policy #0 lag: (min: 10.0, avg: 10.6, max: 24.0) +[2023-10-08 16:31:28,803][19739] Avg episode reward: [(0, '479.460'), (1, '680.770')] +[2023-10-08 16:31:28,810][20740] Saving new best policy, reward=479.460! +[2023-10-08 16:31:29,135][21195] Updated weights for policy 0, policy_version 20260 (0.0008) +[2023-10-08 16:31:29,502][21195] Updated weights for policy 0, policy_version 20270 (0.0007) +[2023-10-08 16:31:29,883][21195] Updated weights for policy 0, policy_version 20280 (0.0008) +[2023-10-08 16:31:30,801][21194] Updated weights for policy 1, policy_version 20130 (0.0011) +[2023-10-08 16:31:31,166][21194] Updated weights for policy 1, policy_version 20140 (0.0007) +[2023-10-08 16:31:31,528][21194] Updated weights for policy 1, policy_version 20150 (0.0007) +[2023-10-08 16:31:31,899][21194] Updated weights for policy 1, policy_version 20160 (0.0008) +[2023-10-08 16:31:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 41418752. Throughput: 0: 1745.4, 1: 1740.4. Samples: 10364850. Policy #0 lag: (min: 7.0, avg: 12.9, max: 39.0) +[2023-10-08 16:31:33,804][19739] Avg episode reward: [(0, '474.600'), (1, '680.770')] +[2023-10-08 16:31:33,874][21195] Updated weights for policy 0, policy_version 20290 (0.0008) +[2023-10-08 16:31:34,286][21195] Updated weights for policy 0, policy_version 20300 (0.0008) +[2023-10-08 16:31:34,656][21195] Updated weights for policy 0, policy_version 20310 (0.0008) +[2023-10-08 16:31:35,020][21195] Updated weights for policy 0, policy_version 20320 (0.0007) +[2023-10-08 16:31:35,951][21194] Updated weights for policy 1, policy_version 20170 (0.0008) +[2023-10-08 16:31:36,327][21194] Updated weights for policy 1, policy_version 20180 (0.0008) +[2023-10-08 16:31:36,698][21194] Updated weights for policy 1, policy_version 20190 (0.0007) +[2023-10-08 16:31:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 41484288. Throughput: 0: 1721.6, 1: 1718.5. Samples: 10379150. Policy #0 lag: (min: 7.0, avg: 12.9, max: 39.0) +[2023-10-08 16:31:38,803][19739] Avg episode reward: [(0, '475.300'), (1, '680.770')] +[2023-10-08 16:31:39,050][21195] Updated weights for policy 0, policy_version 20330 (0.0010) +[2023-10-08 16:31:39,420][21195] Updated weights for policy 0, policy_version 20340 (0.0008) +[2023-10-08 16:31:39,786][21195] Updated weights for policy 0, policy_version 20350 (0.0008) +[2023-10-08 16:31:40,628][21194] Updated weights for policy 1, policy_version 20200 (0.0010) +[2023-10-08 16:31:41,002][21194] Updated weights for policy 1, policy_version 20210 (0.0008) +[2023-10-08 16:31:41,365][21194] Updated weights for policy 1, policy_version 20220 (0.0007) +[2023-10-08 16:31:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 41549824. Throughput: 0: 1731.7, 1: 1724.3. Samples: 10400308. Policy #0 lag: (min: 7.0, avg: 12.9, max: 39.0) +[2023-10-08 16:31:43,803][19739] Avg episode reward: [(0, '482.070'), (1, '694.080')] +[2023-10-08 16:31:43,807][21195] Updated weights for policy 0, policy_version 20360 (0.0010) +[2023-10-08 16:31:44,183][21195] Updated weights for policy 0, policy_version 20370 (0.0008) +[2023-10-08 16:31:44,547][21195] Updated weights for policy 0, policy_version 20380 (0.0009) +[2023-10-08 16:31:44,692][20740] Saving new best policy, reward=482.070! +[2023-10-08 16:31:45,146][21194] Updated weights for policy 1, policy_version 20230 (0.0008) +[2023-10-08 16:31:45,512][21194] Updated weights for policy 1, policy_version 20240 (0.0010) +[2023-10-08 16:31:45,880][21194] Updated weights for policy 1, policy_version 20250 (0.0008) +[2023-10-08 16:31:48,569][21195] Updated weights for policy 0, policy_version 20390 (0.0008) +[2023-10-08 16:31:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 41615360. Throughput: 0: 1716.7, 1: 1729.9. Samples: 10415368. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:31:48,803][19739] Avg episode reward: [(0, '482.140'), (1, '709.750')] +[2023-10-08 16:31:48,934][21195] Updated weights for policy 0, policy_version 20400 (0.0009) +[2023-10-08 16:31:49,294][21195] Updated weights for policy 0, policy_version 20410 (0.0007) +[2023-10-08 16:31:49,509][20740] Saving new best policy, reward=482.140! +[2023-10-08 16:31:49,852][21194] Updated weights for policy 1, policy_version 20260 (0.0009) +[2023-10-08 16:31:50,210][21194] Updated weights for policy 1, policy_version 20270 (0.0009) +[2023-10-08 16:31:50,575][21194] Updated weights for policy 1, policy_version 20280 (0.0007) +[2023-10-08 16:31:53,015][21195] Updated weights for policy 0, policy_version 20420 (0.0009) +[2023-10-08 16:31:53,379][21195] Updated weights for policy 0, policy_version 20430 (0.0007) +[2023-10-08 16:31:53,750][21195] Updated weights for policy 0, policy_version 20440 (0.0008) +[2023-10-08 16:31:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 41680896. Throughput: 0: 1730.0, 1: 1717.7. Samples: 10431292. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:31:53,803][19739] Avg episode reward: [(0, '482.140'), (1, '707.660')] +[2023-10-08 16:31:54,477][21194] Updated weights for policy 1, policy_version 20290 (0.0008) +[2023-10-08 16:31:54,847][21194] Updated weights for policy 1, policy_version 20300 (0.0008) +[2023-10-08 16:31:55,207][21194] Updated weights for policy 1, policy_version 20310 (0.0009) +[2023-10-08 16:31:55,576][21194] Updated weights for policy 1, policy_version 20320 (0.0008) +[2023-10-08 16:31:57,321][21195] Updated weights for policy 0, policy_version 20450 (0.0008) +[2023-10-08 16:31:57,686][21195] Updated weights for policy 0, policy_version 20460 (0.0007) +[2023-10-08 16:31:58,058][21195] Updated weights for policy 0, policy_version 20470 (0.0009) +[2023-10-08 16:31:58,422][21195] Updated weights for policy 0, policy_version 20480 (0.0011) +[2023-10-08 16:31:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 41779200. Throughput: 0: 1725.2, 1: 1748.6. Samples: 10452708. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:31:58,803][19739] Avg episode reward: [(0, '482.140'), (1, '722.390')] +[2023-10-08 16:31:59,516][21194] Updated weights for policy 1, policy_version 20330 (0.0007) +[2023-10-08 16:31:59,873][21194] Updated weights for policy 1, policy_version 20340 (0.0009) +[2023-10-08 16:32:00,235][21194] Updated weights for policy 1, policy_version 20350 (0.0007) +[2023-10-08 16:32:02,434][21195] Updated weights for policy 0, policy_version 20490 (0.0007) +[2023-10-08 16:32:02,813][21195] Updated weights for policy 0, policy_version 20500 (0.0010) +[2023-10-08 16:32:03,181][21195] Updated weights for policy 0, policy_version 20510 (0.0010) +[2023-10-08 16:32:03,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 41844736. Throughput: 0: 1713.5, 1: 1717.6. Samples: 10467406. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:32:03,804][19739] Avg episode reward: [(0, '482.140'), (1, '722.390')] +[2023-10-08 16:32:04,165][21194] Updated weights for policy 1, policy_version 20360 (0.0007) +[2023-10-08 16:32:04,532][21194] Updated weights for policy 1, policy_version 20370 (0.0007) +[2023-10-08 16:32:04,906][21194] Updated weights for policy 1, policy_version 20380 (0.0007) +[2023-10-08 16:32:06,991][21195] Updated weights for policy 0, policy_version 20520 (0.0007) +[2023-10-08 16:32:07,356][21195] Updated weights for policy 0, policy_version 20530 (0.0007) +[2023-10-08 16:32:07,728][21195] Updated weights for policy 0, policy_version 20540 (0.0007) +[2023-10-08 16:32:08,730][21194] Updated weights for policy 1, policy_version 20390 (0.0008) +[2023-10-08 16:32:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 41910272. Throughput: 0: 1744.8, 1: 1739.0. Samples: 10484492. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:32:08,803][19739] Avg episode reward: [(0, '482.140'), (1, '722.180')] +[2023-10-08 16:32:09,091][21194] Updated weights for policy 1, policy_version 20400 (0.0009) +[2023-10-08 16:32:09,465][21194] Updated weights for policy 1, policy_version 20410 (0.0007) +[2023-10-08 16:32:11,499][21195] Updated weights for policy 0, policy_version 20550 (0.0007) +[2023-10-08 16:32:11,864][21195] Updated weights for policy 0, policy_version 20560 (0.0007) +[2023-10-08 16:32:12,240][21195] Updated weights for policy 0, policy_version 20570 (0.0008) +[2023-10-08 16:32:13,345][21194] Updated weights for policy 1, policy_version 20420 (0.0009) +[2023-10-08 16:32:13,704][21194] Updated weights for policy 1, policy_version 20430 (0.0007) +[2023-10-08 16:32:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 41975808. Throughput: 0: 1719.9, 1: 1751.7. Samples: 10505000. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:32:13,803][19739] Avg episode reward: [(0, '482.140'), (1, '715.420')] +[2023-10-08 16:32:14,074][21194] Updated weights for policy 1, policy_version 20440 (0.0012) +[2023-10-08 16:32:16,167][21195] Updated weights for policy 0, policy_version 20580 (0.0009) +[2023-10-08 16:32:16,537][21195] Updated weights for policy 0, policy_version 20590 (0.0007) +[2023-10-08 16:32:16,905][21195] Updated weights for policy 0, policy_version 20600 (0.0007) +[2023-10-08 16:32:17,886][21194] Updated weights for policy 1, policy_version 20450 (0.0008) +[2023-10-08 16:32:18,262][21194] Updated weights for policy 1, policy_version 20460 (0.0008) +[2023-10-08 16:32:18,632][21194] Updated weights for policy 1, policy_version 20470 (0.0008) +[2023-10-08 16:32:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 42041344. Throughput: 0: 1727.8, 1: 1735.4. Samples: 10520692. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:32:18,803][19739] Avg episode reward: [(0, '483.280'), (1, '715.420')] +[2023-10-08 16:32:18,804][20740] Saving new best policy, reward=483.280! +[2023-10-08 16:32:19,008][21194] Updated weights for policy 1, policy_version 20480 (0.0008) +[2023-10-08 16:32:21,041][21195] Updated weights for policy 0, policy_version 20610 (0.0008) +[2023-10-08 16:32:21,416][21195] Updated weights for policy 0, policy_version 20620 (0.0008) +[2023-10-08 16:32:21,788][21195] Updated weights for policy 0, policy_version 20630 (0.0007) +[2023-10-08 16:32:22,158][21195] Updated weights for policy 0, policy_version 20640 (0.0009) +[2023-10-08 16:32:23,010][21194] Updated weights for policy 1, policy_version 20490 (0.0007) +[2023-10-08 16:32:23,383][21194] Updated weights for policy 1, policy_version 20500 (0.0007) +[2023-10-08 16:32:23,754][21194] Updated weights for policy 1, policy_version 20510 (0.0010) +[2023-10-08 16:32:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 42106880. Throughput: 0: 1737.1, 1: 1759.3. Samples: 10536490. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:32:23,804][19739] Avg episode reward: [(0, '490.110'), (1, '715.420')] +[2023-10-08 16:32:23,805][20740] Saving new best policy, reward=490.110! +[2023-10-08 16:32:26,325][21195] Updated weights for policy 0, policy_version 20650 (0.0008) +[2023-10-08 16:32:26,704][21195] Updated weights for policy 0, policy_version 20660 (0.0008) +[2023-10-08 16:32:27,074][21195] Updated weights for policy 0, policy_version 20670 (0.0007) +[2023-10-08 16:32:27,705][21194] Updated weights for policy 1, policy_version 20520 (0.0009) +[2023-10-08 16:32:28,088][21194] Updated weights for policy 1, policy_version 20530 (0.0008) +[2023-10-08 16:32:28,449][21194] Updated weights for policy 1, policy_version 20540 (0.0009) +[2023-10-08 16:32:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 42205184. Throughput: 0: 1728.8, 1: 1742.2. Samples: 10556500. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:32:28,803][19739] Avg episode reward: [(0, '490.110'), (1, '715.420')] +[2023-10-08 16:32:30,889][21195] Updated weights for policy 0, policy_version 20680 (0.0010) +[2023-10-08 16:32:31,255][21195] Updated weights for policy 0, policy_version 20690 (0.0011) +[2023-10-08 16:32:31,621][21195] Updated weights for policy 0, policy_version 20700 (0.0010) +[2023-10-08 16:32:32,607][21194] Updated weights for policy 1, policy_version 20550 (0.0010) +[2023-10-08 16:32:32,980][21194] Updated weights for policy 1, policy_version 20560 (0.0007) +[2023-10-08 16:32:33,357][21194] Updated weights for policy 1, policy_version 20570 (0.0007) +[2023-10-08 16:32:33,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 42270720. Throughput: 0: 1747.2, 1: 1745.8. Samples: 10572554. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:32:33,803][19739] Avg episode reward: [(0, '490.110'), (1, '715.370')] +[2023-10-08 16:32:35,401][21195] Updated weights for policy 0, policy_version 20710 (0.0009) +[2023-10-08 16:32:35,767][21195] Updated weights for policy 0, policy_version 20720 (0.0009) +[2023-10-08 16:32:36,145][21195] Updated weights for policy 0, policy_version 20730 (0.0010) +[2023-10-08 16:32:37,180][21194] Updated weights for policy 1, policy_version 20580 (0.0007) +[2023-10-08 16:32:37,552][21194] Updated weights for policy 1, policy_version 20590 (0.0008) +[2023-10-08 16:32:37,930][21194] Updated weights for policy 1, policy_version 20600 (0.0010) +[2023-10-08 16:32:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 42336256. Throughput: 0: 1729.0, 1: 1750.9. Samples: 10587886. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 16:32:38,803][19739] Avg episode reward: [(0, '490.110'), (1, '698.160')] +[2023-10-08 16:32:39,982][21195] Updated weights for policy 0, policy_version 20740 (0.0009) +[2023-10-08 16:32:40,358][21195] Updated weights for policy 0, policy_version 20750 (0.0007) +[2023-10-08 16:32:40,725][21195] Updated weights for policy 0, policy_version 20760 (0.0008) +[2023-10-08 16:32:41,917][21194] Updated weights for policy 1, policy_version 20610 (0.0011) +[2023-10-08 16:32:42,273][21194] Updated weights for policy 1, policy_version 20620 (0.0009) +[2023-10-08 16:32:42,645][21194] Updated weights for policy 1, policy_version 20630 (0.0008) +[2023-10-08 16:32:43,011][21194] Updated weights for policy 1, policy_version 20640 (0.0007) +[2023-10-08 16:32:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 42401792. Throughput: 0: 1741.9, 1: 1714.1. Samples: 10608228. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:32:43,803][19739] Avg episode reward: [(0, '490.190'), (1, '697.580')] +[2023-10-08 16:32:43,812][20740] Saving new best policy, reward=490.190! +[2023-10-08 16:32:44,605][21195] Updated weights for policy 0, policy_version 20770 (0.0007) +[2023-10-08 16:32:44,982][21195] Updated weights for policy 0, policy_version 20780 (0.0007) +[2023-10-08 16:32:45,355][21195] Updated weights for policy 0, policy_version 20790 (0.0008) +[2023-10-08 16:32:45,727][21195] Updated weights for policy 0, policy_version 20800 (0.0010) +[2023-10-08 16:32:46,911][21194] Updated weights for policy 1, policy_version 20650 (0.0010) +[2023-10-08 16:32:47,280][21194] Updated weights for policy 1, policy_version 20660 (0.0009) +[2023-10-08 16:32:47,642][21194] Updated weights for policy 1, policy_version 20670 (0.0008) +[2023-10-08 16:32:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 42467328. Throughput: 0: 1757.2, 1: 1744.9. Samples: 10624996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:32:48,803][19739] Avg episode reward: [(0, '496.040'), (1, '696.370')] +[2023-10-08 16:32:48,804][20740] Saving new best policy, reward=496.040! +[2023-10-08 16:32:49,823][21195] Updated weights for policy 0, policy_version 20810 (0.0010) +[2023-10-08 16:32:50,187][21195] Updated weights for policy 0, policy_version 20820 (0.0010) +[2023-10-08 16:32:50,548][21195] Updated weights for policy 0, policy_version 20830 (0.0009) +[2023-10-08 16:32:51,629][21194] Updated weights for policy 1, policy_version 20680 (0.0008) +[2023-10-08 16:32:52,002][21194] Updated weights for policy 1, policy_version 20690 (0.0010) +[2023-10-08 16:32:52,373][21194] Updated weights for policy 1, policy_version 20700 (0.0010) +[2023-10-08 16:32:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 42532864. Throughput: 0: 1722.2, 1: 1724.4. Samples: 10639592. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:32:53,803][19739] Avg episode reward: [(0, '496.040'), (1, '699.150')] +[2023-10-08 16:32:54,425][21195] Updated weights for policy 0, policy_version 20840 (0.0009) +[2023-10-08 16:32:54,800][21195] Updated weights for policy 0, policy_version 20850 (0.0007) +[2023-10-08 16:32:55,166][21195] Updated weights for policy 0, policy_version 20860 (0.0007) +[2023-10-08 16:32:56,246][21194] Updated weights for policy 1, policy_version 20710 (0.0008) +[2023-10-08 16:32:56,613][21194] Updated weights for policy 1, policy_version 20720 (0.0007) +[2023-10-08 16:32:56,976][21194] Updated weights for policy 1, policy_version 20730 (0.0007) +[2023-10-08 16:32:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 42598400. Throughput: 0: 1748.1, 1: 1706.7. Samples: 10660464. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:32:58,803][19739] Avg episode reward: [(0, '496.040'), (1, '702.930')] +[2023-10-08 16:32:58,947][21195] Updated weights for policy 0, policy_version 20870 (0.0007) +[2023-10-08 16:32:59,320][21195] Updated weights for policy 0, policy_version 20880 (0.0008) +[2023-10-08 16:32:59,684][21195] Updated weights for policy 0, policy_version 20890 (0.0007) +[2023-10-08 16:33:00,876][21194] Updated weights for policy 1, policy_version 20740 (0.0009) +[2023-10-08 16:33:01,241][21194] Updated weights for policy 1, policy_version 20750 (0.0009) +[2023-10-08 16:33:01,609][21194] Updated weights for policy 1, policy_version 20760 (0.0008) +[2023-10-08 16:33:03,610][21195] Updated weights for policy 0, policy_version 20900 (0.0007) +[2023-10-08 16:33:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 42663936. Throughput: 0: 1742.1, 1: 1727.1. Samples: 10676804. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 16:33:03,803][19739] Avg episode reward: [(0, '496.040'), (1, '687.010')] +[2023-10-08 16:33:03,986][21195] Updated weights for policy 0, policy_version 20910 (0.0008) +[2023-10-08 16:33:04,355][21195] Updated weights for policy 0, policy_version 20920 (0.0008) +[2023-10-08 16:33:05,447][21194] Updated weights for policy 1, policy_version 20770 (0.0007) +[2023-10-08 16:33:05,816][21194] Updated weights for policy 1, policy_version 20780 (0.0009) +[2023-10-08 16:33:06,187][21194] Updated weights for policy 1, policy_version 20790 (0.0008) +[2023-10-08 16:33:06,555][21194] Updated weights for policy 1, policy_version 20800 (0.0007) +[2023-10-08 16:33:08,004][21195] Updated weights for policy 0, policy_version 20930 (0.0008) +[2023-10-08 16:33:08,382][21195] Updated weights for policy 0, policy_version 20940 (0.0010) +[2023-10-08 16:33:08,759][21195] Updated weights for policy 0, policy_version 20950 (0.0009) +[2023-10-08 16:33:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 42729472. Throughput: 0: 1745.4, 1: 1703.0. Samples: 10691668. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 16:33:08,803][19739] Avg episode reward: [(0, '496.040'), (1, '673.190')] +[2023-10-08 16:33:09,123][21195] Updated weights for policy 0, policy_version 20960 (0.0010) +[2023-10-08 16:33:10,679][21194] Updated weights for policy 1, policy_version 20810 (0.0009) +[2023-10-08 16:33:11,051][21194] Updated weights for policy 1, policy_version 20820 (0.0008) +[2023-10-08 16:33:11,425][21194] Updated weights for policy 1, policy_version 20830 (0.0007) +[2023-10-08 16:33:13,057][21195] Updated weights for policy 0, policy_version 20970 (0.0007) +[2023-10-08 16:33:13,427][21195] Updated weights for policy 0, policy_version 20980 (0.0010) +[2023-10-08 16:33:13,795][21195] Updated weights for policy 0, policy_version 20990 (0.0007) +[2023-10-08 16:33:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 42795008. Throughput: 0: 1762.0, 1: 1721.7. Samples: 10713270. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 16:33:13,803][19739] Avg episode reward: [(0, '509.570'), (1, '673.190')] +[2023-10-08 16:33:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000020832_21331968.pth... +[2023-10-08 16:33:13,846][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000019232_19693568.pth +[2023-10-08 16:33:13,864][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000020992_21495808.pth... +[2023-10-08 16:33:13,900][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000019360_19824640.pth +[2023-10-08 16:33:13,905][20740] Saving new best policy, reward=509.570! +[2023-10-08 16:33:15,441][21194] Updated weights for policy 1, policy_version 20840 (0.0008) +[2023-10-08 16:33:15,809][21194] Updated weights for policy 1, policy_version 20850 (0.0010) +[2023-10-08 16:33:16,187][21194] Updated weights for policy 1, policy_version 20860 (0.0009) +[2023-10-08 16:33:17,570][21195] Updated weights for policy 0, policy_version 21000 (0.0008) +[2023-10-08 16:33:17,943][21195] Updated weights for policy 0, policy_version 21010 (0.0007) +[2023-10-08 16:33:18,317][21195] Updated weights for policy 0, policy_version 21020 (0.0007) +[2023-10-08 16:33:18,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 42893312. Throughput: 0: 1732.3, 1: 1719.0. Samples: 10727864. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:18,803][19739] Avg episode reward: [(0, '509.570'), (1, '687.070')] +[2023-10-08 16:33:20,050][21194] Updated weights for policy 1, policy_version 20870 (0.0007) +[2023-10-08 16:33:20,424][21194] Updated weights for policy 1, policy_version 20880 (0.0009) +[2023-10-08 16:33:20,793][21194] Updated weights for policy 1, policy_version 20890 (0.0009) +[2023-10-08 16:33:22,308][21195] Updated weights for policy 0, policy_version 21030 (0.0008) +[2023-10-08 16:33:22,672][21195] Updated weights for policy 0, policy_version 21040 (0.0008) +[2023-10-08 16:33:23,039][21195] Updated weights for policy 0, policy_version 21050 (0.0008) +[2023-10-08 16:33:23,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 42958848. Throughput: 0: 1767.4, 1: 1708.1. Samples: 10744282. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:23,803][19739] Avg episode reward: [(0, '509.570'), (1, '687.070')] +[2023-10-08 16:33:24,622][21194] Updated weights for policy 1, policy_version 20900 (0.0008) +[2023-10-08 16:33:24,991][21194] Updated weights for policy 1, policy_version 20910 (0.0009) +[2023-10-08 16:33:25,353][21194] Updated weights for policy 1, policy_version 20920 (0.0008) +[2023-10-08 16:33:26,990][21195] Updated weights for policy 0, policy_version 21060 (0.0008) +[2023-10-08 16:33:27,355][21195] Updated weights for policy 0, policy_version 21070 (0.0009) +[2023-10-08 16:33:27,731][21195] Updated weights for policy 0, policy_version 21080 (0.0010) +[2023-10-08 16:33:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 43024384. Throughput: 0: 1739.0, 1: 1748.8. Samples: 10765180. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:28,803][19739] Avg episode reward: [(0, '509.570'), (1, '673.540')] +[2023-10-08 16:33:29,221][21194] Updated weights for policy 1, policy_version 20930 (0.0009) +[2023-10-08 16:33:29,597][21194] Updated weights for policy 1, policy_version 20940 (0.0007) +[2023-10-08 16:33:29,958][21194] Updated weights for policy 1, policy_version 20950 (0.0009) +[2023-10-08 16:33:30,323][21194] Updated weights for policy 1, policy_version 20960 (0.0008) +[2023-10-08 16:33:31,539][21195] Updated weights for policy 0, policy_version 21090 (0.0009) +[2023-10-08 16:33:31,909][21195] Updated weights for policy 0, policy_version 21100 (0.0008) +[2023-10-08 16:33:32,278][21195] Updated weights for policy 0, policy_version 21110 (0.0009) +[2023-10-08 16:33:32,658][21195] Updated weights for policy 0, policy_version 21120 (0.0008) +[2023-10-08 16:33:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 43089920. Throughput: 0: 1736.9, 1: 1713.2. Samples: 10780254. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:33,803][19739] Avg episode reward: [(0, '515.650'), (1, '673.540')] +[2023-10-08 16:33:33,804][20740] Saving new best policy, reward=515.650! +[2023-10-08 16:33:34,219][21194] Updated weights for policy 1, policy_version 20970 (0.0007) +[2023-10-08 16:33:34,591][21194] Updated weights for policy 1, policy_version 20980 (0.0008) +[2023-10-08 16:33:34,963][21194] Updated weights for policy 1, policy_version 20990 (0.0009) +[2023-10-08 16:33:36,679][21195] Updated weights for policy 0, policy_version 21130 (0.0007) +[2023-10-08 16:33:37,052][21195] Updated weights for policy 0, policy_version 21140 (0.0007) +[2023-10-08 16:33:37,418][21195] Updated weights for policy 0, policy_version 21150 (0.0008) +[2023-10-08 16:33:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 43155456. Throughput: 0: 1758.0, 1: 1730.5. Samples: 10796574. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:38,803][19739] Avg episode reward: [(0, '515.650'), (1, '673.540')] +[2023-10-08 16:33:38,832][21194] Updated weights for policy 1, policy_version 21000 (0.0008) +[2023-10-08 16:33:39,197][21194] Updated weights for policy 1, policy_version 21010 (0.0009) +[2023-10-08 16:33:39,566][21194] Updated weights for policy 1, policy_version 21020 (0.0009) +[2023-10-08 16:33:41,333][21195] Updated weights for policy 0, policy_version 21160 (0.0007) +[2023-10-08 16:33:41,705][21195] Updated weights for policy 0, policy_version 21170 (0.0007) +[2023-10-08 16:33:42,074][21195] Updated weights for policy 0, policy_version 21180 (0.0009) +[2023-10-08 16:33:43,495][21194] Updated weights for policy 1, policy_version 21030 (0.0009) +[2023-10-08 16:33:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 43220992. Throughput: 0: 1737.9, 1: 1747.2. Samples: 10817296. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:43,803][19739] Avg episode reward: [(0, '515.650'), (1, '673.540')] +[2023-10-08 16:33:43,863][21194] Updated weights for policy 1, policy_version 21040 (0.0011) +[2023-10-08 16:33:44,233][21194] Updated weights for policy 1, policy_version 21050 (0.0010) +[2023-10-08 16:33:45,939][21195] Updated weights for policy 0, policy_version 21190 (0.0009) +[2023-10-08 16:33:46,310][21195] Updated weights for policy 0, policy_version 21200 (0.0007) +[2023-10-08 16:33:46,690][21195] Updated weights for policy 0, policy_version 21210 (0.0008) +[2023-10-08 16:33:48,157][21194] Updated weights for policy 1, policy_version 21060 (0.0009) +[2023-10-08 16:33:48,533][21194] Updated weights for policy 1, policy_version 21070 (0.0008) +[2023-10-08 16:33:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 43286528. Throughput: 0: 1738.8, 1: 1724.2. Samples: 10832642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:48,803][19739] Avg episode reward: [(0, '515.650'), (1, '681.640')] +[2023-10-08 16:33:48,897][21194] Updated weights for policy 1, policy_version 21080 (0.0009) +[2023-10-08 16:33:50,531][21195] Updated weights for policy 0, policy_version 21220 (0.0010) +[2023-10-08 16:33:50,898][21195] Updated weights for policy 0, policy_version 21230 (0.0010) +[2023-10-08 16:33:51,262][21195] Updated weights for policy 0, policy_version 21240 (0.0009) +[2023-10-08 16:33:52,874][21194] Updated weights for policy 1, policy_version 21090 (0.0008) +[2023-10-08 16:33:53,243][21194] Updated weights for policy 1, policy_version 21100 (0.0008) +[2023-10-08 16:33:53,600][21194] Updated weights for policy 1, policy_version 21110 (0.0008) +[2023-10-08 16:33:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 43352064. Throughput: 0: 1727.6, 1: 1746.1. Samples: 10847986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:33:53,803][19739] Avg episode reward: [(0, '515.650'), (1, '684.860')] +[2023-10-08 16:33:53,962][21194] Updated weights for policy 1, policy_version 21120 (0.0009) +[2023-10-08 16:33:55,196][21195] Updated weights for policy 0, policy_version 21250 (0.0009) +[2023-10-08 16:33:55,570][21195] Updated weights for policy 0, policy_version 21260 (0.0008) +[2023-10-08 16:33:55,938][21195] Updated weights for policy 0, policy_version 21270 (0.0009) +[2023-10-08 16:33:56,306][21195] Updated weights for policy 0, policy_version 21280 (0.0007) +[2023-10-08 16:33:57,853][21194] Updated weights for policy 1, policy_version 21130 (0.0009) +[2023-10-08 16:33:58,224][21194] Updated weights for policy 1, policy_version 21140 (0.0008) +[2023-10-08 16:33:58,587][21194] Updated weights for policy 1, policy_version 21150 (0.0008) +[2023-10-08 16:33:58,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 43450368. Throughput: 0: 1728.0, 1: 1732.4. Samples: 10868984. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 16:33:58,803][19739] Avg episode reward: [(0, '529.510'), (1, '693.100')] +[2023-10-08 16:33:58,810][20740] Saving new best policy, reward=529.510! +[2023-10-08 16:34:00,410][21195] Updated weights for policy 0, policy_version 21290 (0.0007) +[2023-10-08 16:34:00,775][21195] Updated weights for policy 0, policy_version 21300 (0.0007) +[2023-10-08 16:34:01,148][21195] Updated weights for policy 0, policy_version 21310 (0.0010) +[2023-10-08 16:34:02,611][21194] Updated weights for policy 1, policy_version 21160 (0.0007) +[2023-10-08 16:34:02,993][21194] Updated weights for policy 1, policy_version 21170 (0.0007) +[2023-10-08 16:34:03,349][21194] Updated weights for policy 1, policy_version 21180 (0.0007) +[2023-10-08 16:34:03,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 43515904. Throughput: 0: 1751.2, 1: 1739.2. Samples: 10884932. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 16:34:03,804][19739] Avg episode reward: [(0, '529.510'), (1, '693.100')] +[2023-10-08 16:34:05,174][21195] Updated weights for policy 0, policy_version 21320 (0.0010) +[2023-10-08 16:34:05,559][21195] Updated weights for policy 0, policy_version 21330 (0.0010) +[2023-10-08 16:34:05,928][21195] Updated weights for policy 0, policy_version 21340 (0.0008) +[2023-10-08 16:34:07,280][21194] Updated weights for policy 1, policy_version 21190 (0.0007) +[2023-10-08 16:34:07,646][21194] Updated weights for policy 1, policy_version 21200 (0.0009) +[2023-10-08 16:34:08,011][21194] Updated weights for policy 1, policy_version 21210 (0.0009) +[2023-10-08 16:34:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 43581440. Throughput: 0: 1716.9, 1: 1751.6. Samples: 10900366. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 16:34:08,803][19739] Avg episode reward: [(0, '538.250'), (1, '700.210')] +[2023-10-08 16:34:08,804][20740] Saving new best policy, reward=538.250! +[2023-10-08 16:34:09,640][21195] Updated weights for policy 0, policy_version 21350 (0.0008) +[2023-10-08 16:34:10,004][21195] Updated weights for policy 0, policy_version 21360 (0.0009) +[2023-10-08 16:34:10,375][21195] Updated weights for policy 0, policy_version 21370 (0.0008) +[2023-10-08 16:34:12,102][21194] Updated weights for policy 1, policy_version 21220 (0.0007) +[2023-10-08 16:34:12,465][21194] Updated weights for policy 1, policy_version 21230 (0.0007) +[2023-10-08 16:34:12,828][21194] Updated weights for policy 1, policy_version 21240 (0.0007) +[2023-10-08 16:34:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 43646976. Throughput: 0: 1742.8, 1: 1713.3. Samples: 10920704. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 16:34:13,803][19739] Avg episode reward: [(0, '551.460'), (1, '700.210')] +[2023-10-08 16:34:13,811][20740] Saving new best policy, reward=551.460! +[2023-10-08 16:34:14,279][21195] Updated weights for policy 0, policy_version 21380 (0.0008) +[2023-10-08 16:34:14,649][21195] Updated weights for policy 0, policy_version 21390 (0.0007) +[2023-10-08 16:34:15,024][21195] Updated weights for policy 0, policy_version 21400 (0.0007) +[2023-10-08 16:34:16,718][21194] Updated weights for policy 1, policy_version 21250 (0.0009) +[2023-10-08 16:34:17,081][21194] Updated weights for policy 1, policy_version 21260 (0.0009) +[2023-10-08 16:34:17,444][21194] Updated weights for policy 1, policy_version 21270 (0.0008) +[2023-10-08 16:34:17,808][21194] Updated weights for policy 1, policy_version 21280 (0.0007) +[2023-10-08 16:34:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 43712512. Throughput: 0: 1752.0, 1: 1740.7. Samples: 10937422. Policy #0 lag: (min: 12.0, avg: 12.0, max: 16.0) +[2023-10-08 16:34:18,803][19739] Avg episode reward: [(0, '551.460'), (1, '693.720')] +[2023-10-08 16:34:18,931][21195] Updated weights for policy 0, policy_version 21410 (0.0007) +[2023-10-08 16:34:19,301][21195] Updated weights for policy 0, policy_version 21420 (0.0009) +[2023-10-08 16:34:19,684][21195] Updated weights for policy 0, policy_version 21430 (0.0007) +[2023-10-08 16:34:20,051][21195] Updated weights for policy 0, policy_version 21440 (0.0010) +[2023-10-08 16:34:21,736][21194] Updated weights for policy 1, policy_version 21290 (0.0009) +[2023-10-08 16:34:22,102][21194] Updated weights for policy 1, policy_version 21300 (0.0009) +[2023-10-08 16:34:22,472][21194] Updated weights for policy 1, policy_version 21310 (0.0010) +[2023-10-08 16:34:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 43778048. Throughput: 0: 1732.3, 1: 1720.4. Samples: 10951942. Policy #0 lag: (min: 12.0, avg: 12.0, max: 16.0) +[2023-10-08 16:34:23,803][19739] Avg episode reward: [(0, '551.460'), (1, '693.720')] +[2023-10-08 16:34:23,836][21195] Updated weights for policy 0, policy_version 21450 (0.0009) +[2023-10-08 16:34:24,212][21195] Updated weights for policy 0, policy_version 21460 (0.0007) +[2023-10-08 16:34:24,585][21195] Updated weights for policy 0, policy_version 21470 (0.0008) +[2023-10-08 16:34:26,527][21194] Updated weights for policy 1, policy_version 21320 (0.0008) +[2023-10-08 16:34:26,892][21194] Updated weights for policy 1, policy_version 21330 (0.0009) +[2023-10-08 16:34:27,260][21194] Updated weights for policy 1, policy_version 21340 (0.0009) +[2023-10-08 16:34:28,318][21195] Updated weights for policy 0, policy_version 21480 (0.0010) +[2023-10-08 16:34:28,683][21195] Updated weights for policy 0, policy_version 21490 (0.0011) +[2023-10-08 16:34:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 43843584. Throughput: 0: 1762.3, 1: 1701.9. Samples: 10973184. Policy #0 lag: (min: 12.0, avg: 12.0, max: 16.0) +[2023-10-08 16:34:28,803][19739] Avg episode reward: [(0, '564.980'), (1, '693.720')] +[2023-10-08 16:34:29,055][21195] Updated weights for policy 0, policy_version 21500 (0.0012) +[2023-10-08 16:34:29,207][20740] Saving new best policy, reward=564.980! +[2023-10-08 16:34:31,193][21194] Updated weights for policy 1, policy_version 21350 (0.0009) +[2023-10-08 16:34:31,560][21194] Updated weights for policy 1, policy_version 21360 (0.0008) +[2023-10-08 16:34:31,932][21194] Updated weights for policy 1, policy_version 21370 (0.0008) +[2023-10-08 16:34:32,936][21195] Updated weights for policy 0, policy_version 21510 (0.0009) +[2023-10-08 16:34:33,304][21195] Updated weights for policy 0, policy_version 21520 (0.0008) +[2023-10-08 16:34:33,681][21195] Updated weights for policy 0, policy_version 21530 (0.0009) +[2023-10-08 16:34:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 43909120. Throughput: 0: 1734.3, 1: 1730.5. Samples: 10988560. Policy #0 lag: (min: 12.0, avg: 12.0, max: 16.0) +[2023-10-08 16:34:33,803][19739] Avg episode reward: [(0, '573.910'), (1, '693.720')] +[2023-10-08 16:34:33,904][20740] Saving new best policy, reward=573.910! +[2023-10-08 16:34:35,945][21194] Updated weights for policy 1, policy_version 21380 (0.0010) +[2023-10-08 16:34:36,318][21194] Updated weights for policy 1, policy_version 21390 (0.0008) +[2023-10-08 16:34:36,679][21194] Updated weights for policy 1, policy_version 21400 (0.0007) +[2023-10-08 16:34:37,490][21195] Updated weights for policy 0, policy_version 21540 (0.0007) +[2023-10-08 16:34:37,870][21195] Updated weights for policy 0, policy_version 21550 (0.0008) +[2023-10-08 16:34:38,237][21195] Updated weights for policy 0, policy_version 21560 (0.0008) +[2023-10-08 16:34:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 44007424. Throughput: 0: 1760.4, 1: 1701.9. Samples: 11003786. Policy #0 lag: (min: 10.0, avg: 27.0, max: 42.0) +[2023-10-08 16:34:38,803][19739] Avg episode reward: [(0, '573.910'), (1, '656.970')] +[2023-10-08 16:34:40,456][21194] Updated weights for policy 1, policy_version 21410 (0.0007) +[2023-10-08 16:34:40,826][21194] Updated weights for policy 1, policy_version 21420 (0.0007) +[2023-10-08 16:34:41,183][21194] Updated weights for policy 1, policy_version 21430 (0.0007) +[2023-10-08 16:34:41,557][21194] Updated weights for policy 1, policy_version 21440 (0.0007) +[2023-10-08 16:34:42,211][21195] Updated weights for policy 0, policy_version 21570 (0.0010) +[2023-10-08 16:34:42,589][21195] Updated weights for policy 0, policy_version 21580 (0.0010) +[2023-10-08 16:34:42,961][21195] Updated weights for policy 0, policy_version 21590 (0.0008) +[2023-10-08 16:34:43,328][21195] Updated weights for policy 0, policy_version 21600 (0.0010) +[2023-10-08 16:34:43,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 44072960. Throughput: 0: 1740.2, 1: 1719.8. Samples: 11024684. Policy #0 lag: (min: 10.0, avg: 27.0, max: 42.0) +[2023-10-08 16:34:43,803][19739] Avg episode reward: [(0, '573.910'), (1, '656.970')] +[2023-10-08 16:34:45,587][21194] Updated weights for policy 1, policy_version 21450 (0.0008) +[2023-10-08 16:34:45,954][21194] Updated weights for policy 1, policy_version 21460 (0.0008) +[2023-10-08 16:34:46,325][21194] Updated weights for policy 1, policy_version 21470 (0.0008) +[2023-10-08 16:34:47,456][21195] Updated weights for policy 0, policy_version 21610 (0.0008) +[2023-10-08 16:34:47,833][21195] Updated weights for policy 0, policy_version 21620 (0.0009) +[2023-10-08 16:34:48,203][21195] Updated weights for policy 0, policy_version 21630 (0.0008) +[2023-10-08 16:34:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 44138496. Throughput: 0: 1725.5, 1: 1714.8. Samples: 11039744. Policy #0 lag: (min: 10.0, avg: 27.0, max: 42.0) +[2023-10-08 16:34:48,803][19739] Avg episode reward: [(0, '573.910'), (1, '656.970')] +[2023-10-08 16:34:50,269][21194] Updated weights for policy 1, policy_version 21480 (0.0012) +[2023-10-08 16:34:50,637][21194] Updated weights for policy 1, policy_version 21490 (0.0010) +[2023-10-08 16:34:51,008][21194] Updated weights for policy 1, policy_version 21500 (0.0009) +[2023-10-08 16:34:51,990][21195] Updated weights for policy 0, policy_version 21640 (0.0007) +[2023-10-08 16:34:52,370][21195] Updated weights for policy 0, policy_version 21650 (0.0008) +[2023-10-08 16:34:52,738][21195] Updated weights for policy 0, policy_version 21660 (0.0009) +[2023-10-08 16:34:53,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 44204032. Throughput: 0: 1758.3, 1: 1701.3. Samples: 11056050. Policy #0 lag: (min: 28.0, avg: 32.6, max: 60.0) +[2023-10-08 16:34:53,804][19739] Avg episode reward: [(0, '573.910'), (1, '656.970')] +[2023-10-08 16:34:54,960][21194] Updated weights for policy 1, policy_version 21510 (0.0007) +[2023-10-08 16:34:55,351][21194] Updated weights for policy 1, policy_version 21520 (0.0008) +[2023-10-08 16:34:55,718][21194] Updated weights for policy 1, policy_version 21530 (0.0008) +[2023-10-08 16:34:56,797][21195] Updated weights for policy 0, policy_version 21670 (0.0008) +[2023-10-08 16:34:57,169][21195] Updated weights for policy 0, policy_version 21680 (0.0007) +[2023-10-08 16:34:57,539][21195] Updated weights for policy 0, policy_version 21690 (0.0007) +[2023-10-08 16:34:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44269568. Throughput: 0: 1726.4, 1: 1732.0. Samples: 11076332. Policy #0 lag: (min: 28.0, avg: 32.6, max: 60.0) +[2023-10-08 16:34:58,803][19739] Avg episode reward: [(0, '573.910'), (1, '656.970')] +[2023-10-08 16:34:59,422][21194] Updated weights for policy 1, policy_version 21540 (0.0009) +[2023-10-08 16:34:59,795][21194] Updated weights for policy 1, policy_version 21550 (0.0007) +[2023-10-08 16:35:00,158][21194] Updated weights for policy 1, policy_version 21560 (0.0008) +[2023-10-08 16:35:01,535][21195] Updated weights for policy 0, policy_version 21700 (0.0009) +[2023-10-08 16:35:01,902][21195] Updated weights for policy 0, policy_version 21710 (0.0010) +[2023-10-08 16:35:02,281][21195] Updated weights for policy 0, policy_version 21720 (0.0007) +[2023-10-08 16:35:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 44335104. Throughput: 0: 1714.1, 1: 1707.3. Samples: 11091386. Policy #0 lag: (min: 28.0, avg: 32.6, max: 60.0) +[2023-10-08 16:35:03,803][19739] Avg episode reward: [(0, '587.840'), (1, '656.970')] +[2023-10-08 16:35:03,804][20740] Saving new best policy, reward=587.840! +[2023-10-08 16:35:04,020][21194] Updated weights for policy 1, policy_version 21570 (0.0007) +[2023-10-08 16:35:04,391][21194] Updated weights for policy 1, policy_version 21580 (0.0010) +[2023-10-08 16:35:04,759][21194] Updated weights for policy 1, policy_version 21590 (0.0010) +[2023-10-08 16:35:05,133][21194] Updated weights for policy 1, policy_version 21600 (0.0010) +[2023-10-08 16:35:06,255][21195] Updated weights for policy 0, policy_version 21730 (0.0007) +[2023-10-08 16:35:06,618][21195] Updated weights for policy 0, policy_version 21740 (0.0007) +[2023-10-08 16:35:06,989][21195] Updated weights for policy 0, policy_version 21750 (0.0010) +[2023-10-08 16:35:07,366][21195] Updated weights for policy 0, policy_version 21760 (0.0007) +[2023-10-08 16:35:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44400640. Throughput: 0: 1731.5, 1: 1728.8. Samples: 11107654. Policy #0 lag: (min: 28.0, avg: 32.6, max: 60.0) +[2023-10-08 16:35:08,803][19739] Avg episode reward: [(0, '587.840'), (1, '656.970')] +[2023-10-08 16:35:09,030][21194] Updated weights for policy 1, policy_version 21610 (0.0009) +[2023-10-08 16:35:09,404][21194] Updated weights for policy 1, policy_version 21620 (0.0010) +[2023-10-08 16:35:09,777][21194] Updated weights for policy 1, policy_version 21630 (0.0009) +[2023-10-08 16:35:11,171][21195] Updated weights for policy 0, policy_version 21770 (0.0009) +[2023-10-08 16:35:11,539][21195] Updated weights for policy 0, policy_version 21780 (0.0007) +[2023-10-08 16:35:11,905][21195] Updated weights for policy 0, policy_version 21790 (0.0010) +[2023-10-08 16:35:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44466176. Throughput: 0: 1705.5, 1: 1742.4. Samples: 11128340. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:35:13,804][19739] Avg episode reward: [(0, '587.840'), (1, '656.970')] +[2023-10-08 16:35:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000021792_22315008.pth... +[2023-10-08 16:35:13,845][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000020160_20643840.pth +[2023-10-08 16:35:13,889][21194] Updated weights for policy 1, policy_version 21640 (0.0007) +[2023-10-08 16:35:14,261][21194] Updated weights for policy 1, policy_version 21650 (0.0011) +[2023-10-08 16:35:14,630][21194] Updated weights for policy 1, policy_version 21660 (0.0010) +[2023-10-08 16:35:14,774][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000021664_22183936.pth... +[2023-10-08 16:35:14,803][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000020032_20512768.pth +[2023-10-08 16:35:15,895][21195] Updated weights for policy 0, policy_version 21800 (0.0007) +[2023-10-08 16:35:16,269][21195] Updated weights for policy 0, policy_version 21810 (0.0008) +[2023-10-08 16:35:16,636][21195] Updated weights for policy 0, policy_version 21820 (0.0011) +[2023-10-08 16:35:18,571][21194] Updated weights for policy 1, policy_version 21670 (0.0008) +[2023-10-08 16:35:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 44531712. Throughput: 0: 1739.7, 1: 1709.2. Samples: 11143760. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:35:18,803][19739] Avg episode reward: [(0, '602.520'), (1, '656.970')] +[2023-10-08 16:35:18,804][20740] Saving new best policy, reward=602.520! +[2023-10-08 16:35:18,935][21194] Updated weights for policy 1, policy_version 21680 (0.0007) +[2023-10-08 16:35:19,302][21194] Updated weights for policy 1, policy_version 21690 (0.0007) +[2023-10-08 16:35:20,491][21195] Updated weights for policy 0, policy_version 21830 (0.0010) +[2023-10-08 16:35:20,857][21195] Updated weights for policy 0, policy_version 21840 (0.0008) +[2023-10-08 16:35:21,228][21195] Updated weights for policy 0, policy_version 21850 (0.0007) +[2023-10-08 16:35:23,120][21194] Updated weights for policy 1, policy_version 21700 (0.0007) +[2023-10-08 16:35:23,497][21194] Updated weights for policy 1, policy_version 21710 (0.0008) +[2023-10-08 16:35:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44597248. Throughput: 0: 1713.7, 1: 1741.2. Samples: 11159258. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:35:23,803][19739] Avg episode reward: [(0, '602.520'), (1, '656.970')] +[2023-10-08 16:35:23,855][21194] Updated weights for policy 1, policy_version 21720 (0.0010) +[2023-10-08 16:35:25,211][21195] Updated weights for policy 0, policy_version 21860 (0.0008) +[2023-10-08 16:35:25,584][21195] Updated weights for policy 0, policy_version 21870 (0.0007) +[2023-10-08 16:35:25,951][21195] Updated weights for policy 0, policy_version 21880 (0.0007) +[2023-10-08 16:35:27,945][21194] Updated weights for policy 1, policy_version 21730 (0.0009) +[2023-10-08 16:35:28,316][21194] Updated weights for policy 1, policy_version 21740 (0.0008) +[2023-10-08 16:35:28,682][21194] Updated weights for policy 1, policy_version 21750 (0.0008) +[2023-10-08 16:35:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 44662784. Throughput: 0: 1735.1, 1: 1728.2. Samples: 11180530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:35:28,803][19739] Avg episode reward: [(0, '602.520'), (1, '670.310')] +[2023-10-08 16:35:29,053][21194] Updated weights for policy 1, policy_version 21760 (0.0010) +[2023-10-08 16:35:29,760][21195] Updated weights for policy 0, policy_version 21890 (0.0007) +[2023-10-08 16:35:30,129][21195] Updated weights for policy 0, policy_version 21900 (0.0008) +[2023-10-08 16:35:30,495][21195] Updated weights for policy 0, policy_version 21910 (0.0008) +[2023-10-08 16:35:30,873][21195] Updated weights for policy 0, policy_version 21920 (0.0008) +[2023-10-08 16:35:32,894][21194] Updated weights for policy 1, policy_version 21770 (0.0008) +[2023-10-08 16:35:33,257][21194] Updated weights for policy 1, policy_version 21780 (0.0009) +[2023-10-08 16:35:33,625][21194] Updated weights for policy 1, policy_version 21790 (0.0010) +[2023-10-08 16:35:33,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 44761088. Throughput: 0: 1750.3, 1: 1728.9. Samples: 11196308. Policy #0 lag: (min: 6.0, avg: 6.0, max: 10.0) +[2023-10-08 16:35:33,803][19739] Avg episode reward: [(0, '602.520'), (1, '670.310')] +[2023-10-08 16:35:34,701][21195] Updated weights for policy 0, policy_version 21930 (0.0008) +[2023-10-08 16:35:35,079][21195] Updated weights for policy 0, policy_version 21940 (0.0008) +[2023-10-08 16:35:35,446][21195] Updated weights for policy 0, policy_version 21950 (0.0009) +[2023-10-08 16:35:37,486][21194] Updated weights for policy 1, policy_version 21800 (0.0009) +[2023-10-08 16:35:37,840][21194] Updated weights for policy 1, policy_version 21810 (0.0010) +[2023-10-08 16:35:38,201][21194] Updated weights for policy 1, policy_version 21820 (0.0008) +[2023-10-08 16:35:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44826624. Throughput: 0: 1716.3, 1: 1739.7. Samples: 11211568. Policy #0 lag: (min: 6.0, avg: 6.0, max: 10.0) +[2023-10-08 16:35:38,803][19739] Avg episode reward: [(0, '617.050'), (1, '670.310')] +[2023-10-08 16:35:38,804][20740] Saving new best policy, reward=617.050! +[2023-10-08 16:35:39,359][21195] Updated weights for policy 0, policy_version 21960 (0.0008) +[2023-10-08 16:35:39,736][21195] Updated weights for policy 0, policy_version 21970 (0.0010) +[2023-10-08 16:35:40,109][21195] Updated weights for policy 0, policy_version 21980 (0.0010) +[2023-10-08 16:35:42,287][21194] Updated weights for policy 1, policy_version 21830 (0.0008) +[2023-10-08 16:35:42,675][21194] Updated weights for policy 1, policy_version 21840 (0.0009) +[2023-10-08 16:35:43,055][21194] Updated weights for policy 1, policy_version 21850 (0.0009) +[2023-10-08 16:35:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44892160. Throughput: 0: 1754.3, 1: 1709.4. Samples: 11232196. Policy #0 lag: (min: 6.0, avg: 6.0, max: 10.0) +[2023-10-08 16:35:43,803][19739] Avg episode reward: [(0, '614.840'), (1, '670.310')] +[2023-10-08 16:35:43,929][21195] Updated weights for policy 0, policy_version 21990 (0.0008) +[2023-10-08 16:35:44,297][21195] Updated weights for policy 0, policy_version 22000 (0.0007) +[2023-10-08 16:35:44,679][21195] Updated weights for policy 0, policy_version 22010 (0.0008) +[2023-10-08 16:35:46,906][21194] Updated weights for policy 1, policy_version 21860 (0.0008) +[2023-10-08 16:35:47,282][21194] Updated weights for policy 1, policy_version 21870 (0.0009) +[2023-10-08 16:35:47,649][21194] Updated weights for policy 1, policy_version 21880 (0.0009) +[2023-10-08 16:35:48,531][21195] Updated weights for policy 0, policy_version 22020 (0.0008) +[2023-10-08 16:35:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 44957696. Throughput: 0: 1748.4, 1: 1734.0. Samples: 11248096. Policy #0 lag: (min: 6.0, avg: 6.0, max: 10.0) +[2023-10-08 16:35:48,803][19739] Avg episode reward: [(0, '636.100'), (1, '671.130')] +[2023-10-08 16:35:48,895][21195] Updated weights for policy 0, policy_version 22030 (0.0007) +[2023-10-08 16:35:49,267][21195] Updated weights for policy 0, policy_version 22040 (0.0007) +[2023-10-08 16:35:49,560][20740] Saving new best policy, reward=636.100! +[2023-10-08 16:35:51,677][21194] Updated weights for policy 1, policy_version 21890 (0.0009) +[2023-10-08 16:35:52,047][21194] Updated weights for policy 1, policy_version 21900 (0.0009) +[2023-10-08 16:35:52,411][21194] Updated weights for policy 1, policy_version 21910 (0.0007) +[2023-10-08 16:35:52,780][21194] Updated weights for policy 1, policy_version 21920 (0.0007) +[2023-10-08 16:35:53,245][21195] Updated weights for policy 0, policy_version 22050 (0.0007) +[2023-10-08 16:35:53,614][21195] Updated weights for policy 0, policy_version 22060 (0.0010) +[2023-10-08 16:35:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 45023232. Throughput: 0: 1743.9, 1: 1718.9. Samples: 11263478. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 16:35:53,803][19739] Avg episode reward: [(0, '636.100'), (1, '681.550')] +[2023-10-08 16:35:53,983][21195] Updated weights for policy 0, policy_version 22070 (0.0012) +[2023-10-08 16:35:54,353][21195] Updated weights for policy 0, policy_version 22080 (0.0010) +[2023-10-08 16:35:56,756][21194] Updated weights for policy 1, policy_version 21930 (0.0009) +[2023-10-08 16:35:57,120][21194] Updated weights for policy 1, policy_version 21940 (0.0007) +[2023-10-08 16:35:57,499][21194] Updated weights for policy 1, policy_version 21950 (0.0008) +[2023-10-08 16:35:58,261][21195] Updated weights for policy 0, policy_version 22090 (0.0007) +[2023-10-08 16:35:58,631][21195] Updated weights for policy 0, policy_version 22100 (0.0009) +[2023-10-08 16:35:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 45088768. Throughput: 0: 1757.4, 1: 1706.4. Samples: 11284210. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 16:35:58,803][19739] Avg episode reward: [(0, '648.390'), (1, '680.550')] +[2023-10-08 16:35:59,009][21195] Updated weights for policy 0, policy_version 22110 (0.0009) +[2023-10-08 16:35:59,074][20740] Saving new best policy, reward=648.390! +[2023-10-08 16:36:01,432][21194] Updated weights for policy 1, policy_version 21960 (0.0007) +[2023-10-08 16:36:01,798][21194] Updated weights for policy 1, policy_version 21970 (0.0007) +[2023-10-08 16:36:02,161][21194] Updated weights for policy 1, policy_version 21980 (0.0008) +[2023-10-08 16:36:02,850][21195] Updated weights for policy 0, policy_version 22120 (0.0007) +[2023-10-08 16:36:03,218][21195] Updated weights for policy 0, policy_version 22130 (0.0008) +[2023-10-08 16:36:03,593][21195] Updated weights for policy 0, policy_version 22140 (0.0008) +[2023-10-08 16:36:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 45187072. Throughput: 0: 1725.2, 1: 1741.0. Samples: 11299742. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 16:36:03,803][19739] Avg episode reward: [(0, '617.280'), (1, '681.300')] +[2023-10-08 16:36:06,107][21194] Updated weights for policy 1, policy_version 21990 (0.0007) +[2023-10-08 16:36:06,477][21194] Updated weights for policy 1, policy_version 22000 (0.0007) +[2023-10-08 16:36:06,843][21194] Updated weights for policy 1, policy_version 22010 (0.0007) +[2023-10-08 16:36:07,524][21195] Updated weights for policy 0, policy_version 22150 (0.0008) +[2023-10-08 16:36:07,892][21195] Updated weights for policy 0, policy_version 22160 (0.0009) +[2023-10-08 16:36:08,269][21195] Updated weights for policy 0, policy_version 22170 (0.0011) +[2023-10-08 16:36:08,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 45252608. Throughput: 0: 1754.5, 1: 1711.4. Samples: 11315224. Policy #0 lag: (min: 31.0, avg: 31.8, max: 48.0) +[2023-10-08 16:36:08,803][19739] Avg episode reward: [(0, '617.280'), (1, '681.300')] +[2023-10-08 16:36:10,761][21194] Updated weights for policy 1, policy_version 22020 (0.0008) +[2023-10-08 16:36:11,124][21194] Updated weights for policy 1, policy_version 22030 (0.0008) +[2023-10-08 16:36:11,489][21194] Updated weights for policy 1, policy_version 22040 (0.0009) +[2023-10-08 16:36:12,177][21195] Updated weights for policy 0, policy_version 22180 (0.0010) +[2023-10-08 16:36:12,547][21195] Updated weights for policy 0, policy_version 22190 (0.0010) +[2023-10-08 16:36:12,917][21195] Updated weights for policy 0, policy_version 22200 (0.0008) +[2023-10-08 16:36:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 45318144. Throughput: 0: 1733.6, 1: 1718.8. Samples: 11335888. Policy #0 lag: (min: 31.0, avg: 31.8, max: 48.0) +[2023-10-08 16:36:13,803][19739] Avg episode reward: [(0, '609.310'), (1, '652.810')] +[2023-10-08 16:36:15,476][21194] Updated weights for policy 1, policy_version 22050 (0.0010) +[2023-10-08 16:36:15,838][21194] Updated weights for policy 1, policy_version 22060 (0.0011) +[2023-10-08 16:36:16,205][21194] Updated weights for policy 1, policy_version 22070 (0.0007) +[2023-10-08 16:36:16,572][21194] Updated weights for policy 1, policy_version 22080 (0.0007) +[2023-10-08 16:36:16,747][21195] Updated weights for policy 0, policy_version 22210 (0.0008) +[2023-10-08 16:36:17,116][21195] Updated weights for policy 0, policy_version 22220 (0.0010) +[2023-10-08 16:36:17,493][21195] Updated weights for policy 0, policy_version 22230 (0.0009) +[2023-10-08 16:36:17,860][21195] Updated weights for policy 0, policy_version 22240 (0.0010) +[2023-10-08 16:36:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 45383680. Throughput: 0: 1727.9, 1: 1721.9. Samples: 11351548. Policy #0 lag: (min: 31.0, avg: 31.8, max: 48.0) +[2023-10-08 16:36:18,803][19739] Avg episode reward: [(0, '609.310'), (1, '653.580')] +[2023-10-08 16:36:20,617][21194] Updated weights for policy 1, policy_version 22090 (0.0008) +[2023-10-08 16:36:20,988][21194] Updated weights for policy 1, policy_version 22100 (0.0010) +[2023-10-08 16:36:21,367][21194] Updated weights for policy 1, policy_version 22110 (0.0009) +[2023-10-08 16:36:21,851][21195] Updated weights for policy 0, policy_version 22250 (0.0008) +[2023-10-08 16:36:22,219][21195] Updated weights for policy 0, policy_version 22260 (0.0008) +[2023-10-08 16:36:22,599][21195] Updated weights for policy 0, policy_version 22270 (0.0008) +[2023-10-08 16:36:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 45449216. Throughput: 0: 1747.6, 1: 1705.2. Samples: 11366948. Policy #0 lag: (min: 31.0, avg: 31.8, max: 48.0) +[2023-10-08 16:36:23,803][19739] Avg episode reward: [(0, '609.310'), (1, '653.580')] +[2023-10-08 16:36:25,346][21194] Updated weights for policy 1, policy_version 22120 (0.0009) +[2023-10-08 16:36:25,720][21194] Updated weights for policy 1, policy_version 22130 (0.0008) +[2023-10-08 16:36:26,078][21194] Updated weights for policy 1, policy_version 22140 (0.0007) +[2023-10-08 16:36:26,382][21195] Updated weights for policy 0, policy_version 22280 (0.0008) +[2023-10-08 16:36:26,753][21195] Updated weights for policy 0, policy_version 22290 (0.0009) +[2023-10-08 16:36:27,113][21195] Updated weights for policy 0, policy_version 22300 (0.0007) +[2023-10-08 16:36:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 45514752. Throughput: 0: 1722.4, 1: 1734.7. Samples: 11387762. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:36:28,803][19739] Avg episode reward: [(0, '609.310'), (1, '639.500')] +[2023-10-08 16:36:30,200][21194] Updated weights for policy 1, policy_version 22150 (0.0008) +[2023-10-08 16:36:30,584][21194] Updated weights for policy 1, policy_version 22160 (0.0008) +[2023-10-08 16:36:30,950][21194] Updated weights for policy 1, policy_version 22170 (0.0008) +[2023-10-08 16:36:31,060][21195] Updated weights for policy 0, policy_version 22310 (0.0008) +[2023-10-08 16:36:31,428][21195] Updated weights for policy 0, policy_version 22320 (0.0009) +[2023-10-08 16:36:31,799][21195] Updated weights for policy 0, policy_version 22330 (0.0009) +[2023-10-08 16:36:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 45580288. Throughput: 0: 1732.7, 1: 1712.8. Samples: 11403142. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:36:33,803][19739] Avg episode reward: [(0, '616.150'), (1, '639.500')] +[2023-10-08 16:36:34,656][21194] Updated weights for policy 1, policy_version 22180 (0.0008) +[2023-10-08 16:36:35,021][21194] Updated weights for policy 1, policy_version 22190 (0.0009) +[2023-10-08 16:36:35,385][21194] Updated weights for policy 1, policy_version 22200 (0.0009) +[2023-10-08 16:36:35,733][21195] Updated weights for policy 0, policy_version 22340 (0.0008) +[2023-10-08 16:36:36,109][21195] Updated weights for policy 0, policy_version 22350 (0.0008) +[2023-10-08 16:36:36,478][21195] Updated weights for policy 0, policy_version 22360 (0.0009) +[2023-10-08 16:36:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 45645824. Throughput: 0: 1722.0, 1: 1724.3. Samples: 11418558. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:36:38,803][19739] Avg episode reward: [(0, '616.150'), (1, '640.000')] +[2023-10-08 16:36:39,160][21194] Updated weights for policy 1, policy_version 22210 (0.0009) +[2023-10-08 16:36:39,522][21194] Updated weights for policy 1, policy_version 22220 (0.0009) +[2023-10-08 16:36:39,887][21194] Updated weights for policy 1, policy_version 22230 (0.0008) +[2023-10-08 16:36:40,250][21194] Updated weights for policy 1, policy_version 22240 (0.0009) +[2023-10-08 16:36:40,323][21195] Updated weights for policy 0, policy_version 22370 (0.0008) +[2023-10-08 16:36:40,690][21195] Updated weights for policy 0, policy_version 22380 (0.0008) +[2023-10-08 16:36:41,067][21195] Updated weights for policy 0, policy_version 22390 (0.0010) +[2023-10-08 16:36:41,436][21195] Updated weights for policy 0, policy_version 22400 (0.0007) +[2023-10-08 16:36:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 45711360. Throughput: 0: 1723.4, 1: 1739.8. Samples: 11440056. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:36:43,804][19739] Avg episode reward: [(0, '616.150'), (1, '641.560')] +[2023-10-08 16:36:44,174][21194] Updated weights for policy 1, policy_version 22250 (0.0010) +[2023-10-08 16:36:44,534][21194] Updated weights for policy 1, policy_version 22260 (0.0011) +[2023-10-08 16:36:44,911][21194] Updated weights for policy 1, policy_version 22270 (0.0008) +[2023-10-08 16:36:45,355][21195] Updated weights for policy 0, policy_version 22410 (0.0008) +[2023-10-08 16:36:45,724][21195] Updated weights for policy 0, policy_version 22420 (0.0008) +[2023-10-08 16:36:46,098][21195] Updated weights for policy 0, policy_version 22430 (0.0007) +[2023-10-08 16:36:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 45776896. Throughput: 0: 1754.4, 1: 1710.3. Samples: 11455654. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 16:36:48,803][19739] Avg episode reward: [(0, '624.050'), (1, '637.200')] +[2023-10-08 16:36:48,998][21194] Updated weights for policy 1, policy_version 22280 (0.0007) +[2023-10-08 16:36:49,366][21194] Updated weights for policy 1, policy_version 22290 (0.0008) +[2023-10-08 16:36:49,733][21194] Updated weights for policy 1, policy_version 22300 (0.0007) +[2023-10-08 16:36:49,947][21195] Updated weights for policy 0, policy_version 22440 (0.0008) +[2023-10-08 16:36:50,321][21195] Updated weights for policy 0, policy_version 22450 (0.0009) +[2023-10-08 16:36:50,681][21195] Updated weights for policy 0, policy_version 22460 (0.0007) +[2023-10-08 16:36:53,686][21194] Updated weights for policy 1, policy_version 22310 (0.0009) +[2023-10-08 16:36:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 45842432. Throughput: 0: 1728.8, 1: 1732.1. Samples: 11470966. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 16:36:53,803][19739] Avg episode reward: [(0, '638.750'), (1, '651.210')] +[2023-10-08 16:36:54,045][21194] Updated weights for policy 1, policy_version 22320 (0.0010) +[2023-10-08 16:36:54,407][21194] Updated weights for policy 1, policy_version 22330 (0.0008) +[2023-10-08 16:36:54,555][21195] Updated weights for policy 0, policy_version 22470 (0.0008) +[2023-10-08 16:36:54,943][21195] Updated weights for policy 0, policy_version 22480 (0.0010) +[2023-10-08 16:36:55,310][21195] Updated weights for policy 0, policy_version 22490 (0.0008) +[2023-10-08 16:36:58,361][21194] Updated weights for policy 1, policy_version 22340 (0.0008) +[2023-10-08 16:36:58,742][21194] Updated weights for policy 1, policy_version 22350 (0.0009) +[2023-10-08 16:36:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 45907968. Throughput: 0: 1749.8, 1: 1731.5. Samples: 11492546. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 16:36:58,803][19739] Avg episode reward: [(0, '638.920'), (1, '651.210')] +[2023-10-08 16:36:59,104][21194] Updated weights for policy 1, policy_version 22360 (0.0009) +[2023-10-08 16:36:59,121][21195] Updated weights for policy 0, policy_version 22500 (0.0009) +[2023-10-08 16:36:59,493][21195] Updated weights for policy 0, policy_version 22510 (0.0007) +[2023-10-08 16:36:59,862][21195] Updated weights for policy 0, policy_version 22520 (0.0008) +[2023-10-08 16:37:03,284][21194] Updated weights for policy 1, policy_version 22370 (0.0009) +[2023-10-08 16:37:03,654][21194] Updated weights for policy 1, policy_version 22380 (0.0009) +[2023-10-08 16:37:03,754][21195] Updated weights for policy 0, policy_version 22530 (0.0009) +[2023-10-08 16:37:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 45973504. Throughput: 0: 1751.3, 1: 1717.5. Samples: 11507642. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 16:37:03,803][19739] Avg episode reward: [(0, '638.920'), (1, '656.670')] +[2023-10-08 16:37:04,021][21194] Updated weights for policy 1, policy_version 22390 (0.0008) +[2023-10-08 16:37:04,127][21195] Updated weights for policy 0, policy_version 22540 (0.0007) +[2023-10-08 16:37:04,388][21194] Updated weights for policy 1, policy_version 22400 (0.0009) +[2023-10-08 16:37:04,487][21195] Updated weights for policy 0, policy_version 22550 (0.0009) +[2023-10-08 16:37:04,855][21195] Updated weights for policy 0, policy_version 22560 (0.0010) +[2023-10-08 16:37:08,324][21194] Updated weights for policy 1, policy_version 22410 (0.0010) +[2023-10-08 16:37:08,680][21194] Updated weights for policy 1, policy_version 22420 (0.0008) +[2023-10-08 16:37:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 46039040. Throughput: 0: 1735.6, 1: 1728.8. Samples: 11522846. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:08,803][19739] Avg episode reward: [(0, '628.590'), (1, '669.630')] +[2023-10-08 16:37:08,954][21195] Updated weights for policy 0, policy_version 22570 (0.0008) +[2023-10-08 16:37:09,044][21194] Updated weights for policy 1, policy_version 22430 (0.0008) +[2023-10-08 16:37:09,320][21195] Updated weights for policy 0, policy_version 22580 (0.0010) +[2023-10-08 16:37:09,693][21195] Updated weights for policy 0, policy_version 22590 (0.0007) +[2023-10-08 16:37:13,038][21194] Updated weights for policy 1, policy_version 22440 (0.0009) +[2023-10-08 16:37:13,407][21194] Updated weights for policy 1, policy_version 22450 (0.0008) +[2023-10-08 16:37:13,455][21195] Updated weights for policy 0, policy_version 22600 (0.0007) +[2023-10-08 16:37:13,772][21194] Updated weights for policy 1, policy_version 22460 (0.0008) +[2023-10-08 16:37:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 46104576. Throughput: 0: 1756.4, 1: 1720.1. Samples: 11544206. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:13,803][19739] Avg episode reward: [(0, '628.590'), (1, '669.630')] +[2023-10-08 16:37:13,816][21195] Updated weights for policy 0, policy_version 22610 (0.0008) +[2023-10-08 16:37:13,919][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000022464_23003136.pth... +[2023-10-08 16:37:13,956][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000020832_21331968.pth +[2023-10-08 16:37:14,185][21195] Updated weights for policy 0, policy_version 22620 (0.0009) +[2023-10-08 16:37:14,330][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000022624_23166976.pth... +[2023-10-08 16:37:14,359][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000020992_21495808.pth +[2023-10-08 16:37:17,743][21194] Updated weights for policy 1, policy_version 22470 (0.0007) +[2023-10-08 16:37:18,079][21195] Updated weights for policy 0, policy_version 22630 (0.0009) +[2023-10-08 16:37:18,122][21194] Updated weights for policy 1, policy_version 22480 (0.0008) +[2023-10-08 16:37:18,444][21195] Updated weights for policy 0, policy_version 22640 (0.0007) +[2023-10-08 16:37:18,500][21194] Updated weights for policy 1, policy_version 22490 (0.0009) +[2023-10-08 16:37:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 46202880. Throughput: 0: 1738.3, 1: 1722.8. Samples: 11558892. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:18,803][19739] Avg episode reward: [(0, '628.590'), (1, '669.630')] +[2023-10-08 16:37:18,816][21195] Updated weights for policy 0, policy_version 22650 (0.0007) +[2023-10-08 16:37:22,189][21194] Updated weights for policy 1, policy_version 22500 (0.0008) +[2023-10-08 16:37:22,561][21194] Updated weights for policy 1, policy_version 22510 (0.0008) +[2023-10-08 16:37:22,924][21194] Updated weights for policy 1, policy_version 22520 (0.0008) +[2023-10-08 16:37:22,953][21195] Updated weights for policy 0, policy_version 22660 (0.0009) +[2023-10-08 16:37:23,321][21195] Updated weights for policy 0, policy_version 22670 (0.0009) +[2023-10-08 16:37:23,692][21195] Updated weights for policy 0, policy_version 22680 (0.0008) +[2023-10-08 16:37:23,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 46268416. Throughput: 0: 1753.9, 1: 1728.4. Samples: 11575264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:23,803][19739] Avg episode reward: [(0, '635.050'), (1, '669.630')] +[2023-10-08 16:37:26,868][21194] Updated weights for policy 1, policy_version 22530 (0.0007) +[2023-10-08 16:37:27,240][21194] Updated weights for policy 1, policy_version 22540 (0.0007) +[2023-10-08 16:37:27,510][21195] Updated weights for policy 0, policy_version 22690 (0.0009) +[2023-10-08 16:37:27,601][21194] Updated weights for policy 1, policy_version 22550 (0.0007) +[2023-10-08 16:37:27,870][21195] Updated weights for policy 0, policy_version 22700 (0.0009) +[2023-10-08 16:37:27,965][21194] Updated weights for policy 1, policy_version 22560 (0.0008) +[2023-10-08 16:37:28,245][21195] Updated weights for policy 0, policy_version 22710 (0.0010) +[2023-10-08 16:37:28,613][21195] Updated weights for policy 0, policy_version 22720 (0.0011) +[2023-10-08 16:37:28,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46366720. Throughput: 0: 1747.0, 1: 1700.1. Samples: 11595174. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:28,803][19739] Avg episode reward: [(0, '635.050'), (1, '670.110')] +[2023-10-08 16:37:32,024][21194] Updated weights for policy 1, policy_version 22570 (0.0009) +[2023-10-08 16:37:32,395][21194] Updated weights for policy 1, policy_version 22580 (0.0008) +[2023-10-08 16:37:32,588][21195] Updated weights for policy 0, policy_version 22730 (0.0007) +[2023-10-08 16:37:32,770][21194] Updated weights for policy 1, policy_version 22590 (0.0008) +[2023-10-08 16:37:32,954][21195] Updated weights for policy 0, policy_version 22740 (0.0008) +[2023-10-08 16:37:33,324][21195] Updated weights for policy 0, policy_version 22750 (0.0007) +[2023-10-08 16:37:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46432256. Throughput: 0: 1719.4, 1: 1727.8. Samples: 11610778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:33,803][19739] Avg episode reward: [(0, '635.050'), (1, '679.830')] +[2023-10-08 16:37:36,676][21194] Updated weights for policy 1, policy_version 22600 (0.0009) +[2023-10-08 16:37:37,046][21194] Updated weights for policy 1, policy_version 22610 (0.0010) +[2023-10-08 16:37:37,204][21195] Updated weights for policy 0, policy_version 22760 (0.0010) +[2023-10-08 16:37:37,402][21194] Updated weights for policy 1, policy_version 22620 (0.0007) +[2023-10-08 16:37:37,564][21195] Updated weights for policy 0, policy_version 22770 (0.0009) +[2023-10-08 16:37:37,935][21195] Updated weights for policy 0, policy_version 22780 (0.0011) +[2023-10-08 16:37:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46497792. Throughput: 0: 1745.5, 1: 1718.1. Samples: 11626830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:37:38,803][19739] Avg episode reward: [(0, '635.050'), (1, '660.340')] +[2023-10-08 16:37:41,378][21194] Updated weights for policy 1, policy_version 22630 (0.0009) +[2023-10-08 16:37:41,749][21194] Updated weights for policy 1, policy_version 22640 (0.0008) +[2023-10-08 16:37:41,961][21195] Updated weights for policy 0, policy_version 22790 (0.0008) +[2023-10-08 16:37:42,110][21194] Updated weights for policy 1, policy_version 22650 (0.0008) +[2023-10-08 16:37:42,334][21195] Updated weights for policy 0, policy_version 22800 (0.0007) +[2023-10-08 16:37:42,712][21195] Updated weights for policy 0, policy_version 22810 (0.0008) +[2023-10-08 16:37:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46563328. Throughput: 0: 1717.2, 1: 1701.8. Samples: 11646404. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 16:37:43,803][19739] Avg episode reward: [(0, '636.460'), (1, '660.340')] +[2023-10-08 16:37:46,075][21194] Updated weights for policy 1, policy_version 22660 (0.0008) +[2023-10-08 16:37:46,441][21194] Updated weights for policy 1, policy_version 22670 (0.0008) +[2023-10-08 16:37:46,515][21195] Updated weights for policy 0, policy_version 22820 (0.0009) +[2023-10-08 16:37:46,801][21194] Updated weights for policy 1, policy_version 22680 (0.0007) +[2023-10-08 16:37:46,886][21195] Updated weights for policy 0, policy_version 22830 (0.0008) +[2023-10-08 16:37:47,260][21195] Updated weights for policy 0, policy_version 22840 (0.0008) +[2023-10-08 16:37:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46628864. Throughput: 0: 1717.3, 1: 1727.7. Samples: 11662668. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 16:37:48,803][19739] Avg episode reward: [(0, '636.460'), (1, '659.050')] +[2023-10-08 16:37:50,870][21194] Updated weights for policy 1, policy_version 22690 (0.0007) +[2023-10-08 16:37:51,145][21195] Updated weights for policy 0, policy_version 22850 (0.0008) +[2023-10-08 16:37:51,238][21194] Updated weights for policy 1, policy_version 22700 (0.0009) +[2023-10-08 16:37:51,521][21195] Updated weights for policy 0, policy_version 22860 (0.0009) +[2023-10-08 16:37:51,594][21194] Updated weights for policy 1, policy_version 22710 (0.0010) +[2023-10-08 16:37:51,893][21195] Updated weights for policy 0, policy_version 22870 (0.0008) +[2023-10-08 16:37:51,962][21194] Updated weights for policy 1, policy_version 22720 (0.0010) +[2023-10-08 16:37:52,255][21195] Updated weights for policy 0, policy_version 22880 (0.0007) +[2023-10-08 16:37:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46694400. Throughput: 0: 1729.2, 1: 1701.9. Samples: 11677244. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 16:37:53,803][19739] Avg episode reward: [(0, '636.460'), (1, '659.050')] +[2023-10-08 16:37:55,870][21194] Updated weights for policy 1, policy_version 22730 (0.0010) +[2023-10-08 16:37:56,137][21195] Updated weights for policy 0, policy_version 22890 (0.0009) +[2023-10-08 16:37:56,231][21194] Updated weights for policy 1, policy_version 22740 (0.0007) +[2023-10-08 16:37:56,499][21195] Updated weights for policy 0, policy_version 22900 (0.0008) +[2023-10-08 16:37:56,599][21194] Updated weights for policy 1, policy_version 22750 (0.0009) +[2023-10-08 16:37:56,869][21195] Updated weights for policy 0, policy_version 22910 (0.0008) +[2023-10-08 16:37:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46759936. Throughput: 0: 1710.1, 1: 1713.6. Samples: 11698272. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 16:37:58,803][19739] Avg episode reward: [(0, '636.460'), (1, '659.050')] +[2023-10-08 16:38:00,697][21194] Updated weights for policy 1, policy_version 22760 (0.0008) +[2023-10-08 16:38:00,730][21195] Updated weights for policy 0, policy_version 22920 (0.0009) +[2023-10-08 16:38:01,066][21194] Updated weights for policy 1, policy_version 22770 (0.0009) +[2023-10-08 16:38:01,100][21195] Updated weights for policy 0, policy_version 22930 (0.0009) +[2023-10-08 16:38:01,429][21194] Updated weights for policy 1, policy_version 22780 (0.0007) +[2023-10-08 16:38:01,463][21195] Updated weights for policy 0, policy_version 22940 (0.0007) +[2023-10-08 16:38:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 46825472. Throughput: 0: 1730.5, 1: 1718.9. Samples: 11714114. Policy #0 lag: (min: 13.0, avg: 20.2, max: 45.0) +[2023-10-08 16:38:03,803][19739] Avg episode reward: [(0, '641.320'), (1, '668.680')] +[2023-10-08 16:38:05,467][21194] Updated weights for policy 1, policy_version 22790 (0.0007) +[2023-10-08 16:38:05,539][21195] Updated weights for policy 0, policy_version 22950 (0.0009) +[2023-10-08 16:38:05,851][21194] Updated weights for policy 1, policy_version 22800 (0.0009) +[2023-10-08 16:38:05,905][21195] Updated weights for policy 0, policy_version 22960 (0.0007) +[2023-10-08 16:38:06,218][21194] Updated weights for policy 1, policy_version 22810 (0.0009) +[2023-10-08 16:38:06,276][21195] Updated weights for policy 0, policy_version 22970 (0.0008) +[2023-10-08 16:38:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 46891008. Throughput: 0: 1715.1, 1: 1700.1. Samples: 11728948. Policy #0 lag: (min: 13.0, avg: 20.2, max: 45.0) +[2023-10-08 16:38:08,803][19739] Avg episode reward: [(0, '641.320'), (1, '668.680')] +[2023-10-08 16:38:09,984][21194] Updated weights for policy 1, policy_version 22820 (0.0008) +[2023-10-08 16:38:10,204][21195] Updated weights for policy 0, policy_version 22980 (0.0008) +[2023-10-08 16:38:10,349][21194] Updated weights for policy 1, policy_version 22830 (0.0008) +[2023-10-08 16:38:10,573][21195] Updated weights for policy 0, policy_version 22990 (0.0009) +[2023-10-08 16:38:10,711][21194] Updated weights for policy 1, policy_version 22840 (0.0008) +[2023-10-08 16:38:10,944][21195] Updated weights for policy 0, policy_version 23000 (0.0007) +[2023-10-08 16:38:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 46956544. Throughput: 0: 1718.8, 1: 1728.2. Samples: 11750292. Policy #0 lag: (min: 13.0, avg: 20.2, max: 45.0) +[2023-10-08 16:38:13,803][19739] Avg episode reward: [(0, '641.320'), (1, '678.500')] +[2023-10-08 16:38:14,679][21194] Updated weights for policy 1, policy_version 22850 (0.0008) +[2023-10-08 16:38:14,990][21195] Updated weights for policy 0, policy_version 23010 (0.0008) +[2023-10-08 16:38:15,044][21194] Updated weights for policy 1, policy_version 22860 (0.0007) +[2023-10-08 16:38:15,358][21195] Updated weights for policy 0, policy_version 23020 (0.0007) +[2023-10-08 16:38:15,415][21194] Updated weights for policy 1, policy_version 22870 (0.0010) +[2023-10-08 16:38:15,726][21195] Updated weights for policy 0, policy_version 23030 (0.0008) +[2023-10-08 16:38:15,777][21194] Updated weights for policy 1, policy_version 22880 (0.0009) +[2023-10-08 16:38:16,099][21195] Updated weights for policy 0, policy_version 23040 (0.0009) +[2023-10-08 16:38:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 47022080. Throughput: 0: 1742.0, 1: 1698.0. Samples: 11765580. Policy #0 lag: (min: 13.0, avg: 20.2, max: 45.0) +[2023-10-08 16:38:18,803][19739] Avg episode reward: [(0, '641.320'), (1, '678.500')] +[2023-10-08 16:38:19,836][21195] Updated weights for policy 0, policy_version 23050 (0.0009) +[2023-10-08 16:38:20,027][21194] Updated weights for policy 1, policy_version 22890 (0.0007) +[2023-10-08 16:38:20,203][21195] Updated weights for policy 0, policy_version 23060 (0.0009) +[2023-10-08 16:38:20,385][21194] Updated weights for policy 1, policy_version 22900 (0.0007) +[2023-10-08 16:38:20,576][21195] Updated weights for policy 0, policy_version 23070 (0.0007) +[2023-10-08 16:38:20,747][21194] Updated weights for policy 1, policy_version 22910 (0.0007) +[2023-10-08 16:38:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 47087616. Throughput: 0: 1716.3, 1: 1706.4. Samples: 11780852. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 16:38:23,803][19739] Avg episode reward: [(0, '636.580'), (1, '678.280')] +[2023-10-08 16:38:24,534][21195] Updated weights for policy 0, policy_version 23080 (0.0007) +[2023-10-08 16:38:24,785][21194] Updated weights for policy 1, policy_version 22920 (0.0010) +[2023-10-08 16:38:24,900][21195] Updated weights for policy 0, policy_version 23090 (0.0008) +[2023-10-08 16:38:25,162][21194] Updated weights for policy 1, policy_version 22930 (0.0007) +[2023-10-08 16:38:25,265][21195] Updated weights for policy 0, policy_version 23100 (0.0008) +[2023-10-08 16:38:25,519][21194] Updated weights for policy 1, policy_version 22940 (0.0008) +[2023-10-08 16:38:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 47153152. Throughput: 0: 1741.6, 1: 1722.0. Samples: 11802270. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 16:38:28,804][19739] Avg episode reward: [(0, '643.220'), (1, '678.280')] +[2023-10-08 16:38:29,222][21195] Updated weights for policy 0, policy_version 23110 (0.0008) +[2023-10-08 16:38:29,347][21194] Updated weights for policy 1, policy_version 22950 (0.0009) +[2023-10-08 16:38:29,591][21195] Updated weights for policy 0, policy_version 23120 (0.0007) +[2023-10-08 16:38:29,706][21194] Updated weights for policy 1, policy_version 22960 (0.0007) +[2023-10-08 16:38:29,957][21195] Updated weights for policy 0, policy_version 23130 (0.0009) +[2023-10-08 16:38:30,072][21194] Updated weights for policy 1, policy_version 22970 (0.0007) +[2023-10-08 16:38:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 47218688. Throughput: 0: 1743.3, 1: 1698.7. Samples: 11817558. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 16:38:33,803][19739] Avg episode reward: [(0, '653.210'), (1, '678.280')] +[2023-10-08 16:38:33,809][21195] Updated weights for policy 0, policy_version 23140 (0.0009) +[2023-10-08 16:38:33,942][21194] Updated weights for policy 1, policy_version 22980 (0.0008) +[2023-10-08 16:38:34,168][21195] Updated weights for policy 0, policy_version 23150 (0.0007) +[2023-10-08 16:38:34,306][21194] Updated weights for policy 1, policy_version 22990 (0.0008) +[2023-10-08 16:38:34,538][21195] Updated weights for policy 0, policy_version 23160 (0.0008) +[2023-10-08 16:38:34,681][21194] Updated weights for policy 1, policy_version 23000 (0.0008) +[2023-10-08 16:38:34,826][20740] Saving new best policy, reward=653.210! +[2023-10-08 16:38:38,553][21195] Updated weights for policy 0, policy_version 23170 (0.0009) +[2023-10-08 16:38:38,621][21194] Updated weights for policy 1, policy_version 23010 (0.0008) +[2023-10-08 16:38:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 47284224. Throughput: 0: 1735.4, 1: 1730.3. Samples: 11833202. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 16:38:38,803][19739] Avg episode reward: [(0, '653.210'), (1, '678.280')] +[2023-10-08 16:38:38,918][21195] Updated weights for policy 0, policy_version 23180 (0.0007) +[2023-10-08 16:38:38,990][21194] Updated weights for policy 1, policy_version 23020 (0.0008) +[2023-10-08 16:38:39,297][21195] Updated weights for policy 0, policy_version 23190 (0.0007) +[2023-10-08 16:38:39,354][21194] Updated weights for policy 1, policy_version 23030 (0.0009) +[2023-10-08 16:38:39,671][21195] Updated weights for policy 0, policy_version 23200 (0.0007) +[2023-10-08 16:38:39,724][21194] Updated weights for policy 1, policy_version 23040 (0.0008) +[2023-10-08 16:38:43,557][21195] Updated weights for policy 0, policy_version 23210 (0.0007) +[2023-10-08 16:38:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 47349760. Throughput: 0: 1747.6, 1: 1723.4. Samples: 11854464. Policy #0 lag: (min: 27.0, avg: 30.5, max: 59.0) +[2023-10-08 16:38:43,803][19739] Avg episode reward: [(0, '664.420'), (1, '678.280')] +[2023-10-08 16:38:43,819][21194] Updated weights for policy 1, policy_version 23050 (0.0009) +[2023-10-08 16:38:43,931][21195] Updated weights for policy 0, policy_version 23220 (0.0008) +[2023-10-08 16:38:44,189][21194] Updated weights for policy 1, policy_version 23060 (0.0007) +[2023-10-08 16:38:44,290][21195] Updated weights for policy 0, policy_version 23230 (0.0007) +[2023-10-08 16:38:44,360][20740] Saving new best policy, reward=664.420! +[2023-10-08 16:38:44,543][21194] Updated weights for policy 1, policy_version 23070 (0.0010) +[2023-10-08 16:38:48,137][21195] Updated weights for policy 0, policy_version 23240 (0.0008) +[2023-10-08 16:38:48,497][21194] Updated weights for policy 1, policy_version 23080 (0.0008) +[2023-10-08 16:38:48,505][21195] Updated weights for policy 0, policy_version 23250 (0.0010) +[2023-10-08 16:38:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 47415296. Throughput: 0: 1726.6, 1: 1711.1. Samples: 11868808. Policy #0 lag: (min: 27.0, avg: 30.5, max: 59.0) +[2023-10-08 16:38:48,803][19739] Avg episode reward: [(0, '664.420'), (1, '678.280')] +[2023-10-08 16:38:48,859][21194] Updated weights for policy 1, policy_version 23090 (0.0007) +[2023-10-08 16:38:48,873][21195] Updated weights for policy 0, policy_version 23260 (0.0008) +[2023-10-08 16:38:49,219][21194] Updated weights for policy 1, policy_version 23100 (0.0009) +[2023-10-08 16:38:52,833][21195] Updated weights for policy 0, policy_version 23270 (0.0007) +[2023-10-08 16:38:53,200][21195] Updated weights for policy 0, policy_version 23280 (0.0007) +[2023-10-08 16:38:53,323][21194] Updated weights for policy 1, policy_version 23110 (0.0007) +[2023-10-08 16:38:53,564][21195] Updated weights for policy 0, policy_version 23290 (0.0009) +[2023-10-08 16:38:53,687][21194] Updated weights for policy 1, policy_version 23120 (0.0007) +[2023-10-08 16:38:53,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 47513600. Throughput: 0: 1748.7, 1: 1725.2. Samples: 11885274. Policy #0 lag: (min: 27.0, avg: 30.5, max: 59.0) +[2023-10-08 16:38:53,803][19739] Avg episode reward: [(0, '664.420'), (1, '665.210')] +[2023-10-08 16:38:54,047][21194] Updated weights for policy 1, policy_version 23130 (0.0009) +[2023-10-08 16:38:57,375][21195] Updated weights for policy 0, policy_version 23300 (0.0010) +[2023-10-08 16:38:57,745][21195] Updated weights for policy 0, policy_version 23310 (0.0009) +[2023-10-08 16:38:57,845][21194] Updated weights for policy 1, policy_version 23140 (0.0009) +[2023-10-08 16:38:58,113][21195] Updated weights for policy 0, policy_version 23320 (0.0009) +[2023-10-08 16:38:58,213][21194] Updated weights for policy 1, policy_version 23150 (0.0008) +[2023-10-08 16:38:58,573][21194] Updated weights for policy 1, policy_version 23160 (0.0008) +[2023-10-08 16:38:58,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 47579136. Throughput: 0: 1743.9, 1: 1718.1. Samples: 11906082. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 16:38:58,803][19739] Avg episode reward: [(0, '664.420'), (1, '665.210')] +[2023-10-08 16:39:01,963][21195] Updated weights for policy 0, policy_version 23330 (0.0008) +[2023-10-08 16:39:02,333][21195] Updated weights for policy 0, policy_version 23340 (0.0008) +[2023-10-08 16:39:02,600][21194] Updated weights for policy 1, policy_version 23170 (0.0009) +[2023-10-08 16:39:02,712][21195] Updated weights for policy 0, policy_version 23350 (0.0009) +[2023-10-08 16:39:02,969][21194] Updated weights for policy 1, policy_version 23180 (0.0008) +[2023-10-08 16:39:03,083][21195] Updated weights for policy 0, policy_version 23360 (0.0009) +[2023-10-08 16:39:03,345][21194] Updated weights for policy 1, policy_version 23190 (0.0009) +[2023-10-08 16:39:03,705][21194] Updated weights for policy 1, policy_version 23200 (0.0008) +[2023-10-08 16:39:03,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 47677440. Throughput: 0: 1725.5, 1: 1728.2. Samples: 11920996. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 16:39:03,804][19739] Avg episode reward: [(0, '664.420'), (1, '665.210')] +[2023-10-08 16:39:07,026][21195] Updated weights for policy 0, policy_version 23370 (0.0010) +[2023-10-08 16:39:07,399][21195] Updated weights for policy 0, policy_version 23380 (0.0009) +[2023-10-08 16:39:07,760][21195] Updated weights for policy 0, policy_version 23390 (0.0008) +[2023-10-08 16:39:07,792][21194] Updated weights for policy 1, policy_version 23210 (0.0010) +[2023-10-08 16:39:08,155][21194] Updated weights for policy 1, policy_version 23220 (0.0007) +[2023-10-08 16:39:08,524][21194] Updated weights for policy 1, policy_version 23230 (0.0008) +[2023-10-08 16:39:08,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 47742976. Throughput: 0: 1747.6, 1: 1728.3. Samples: 11937266. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 16:39:08,803][19739] Avg episode reward: [(0, '671.780'), (1, '665.210')] +[2023-10-08 16:39:08,804][20740] Saving new best policy, reward=671.780! +[2023-10-08 16:39:11,775][21195] Updated weights for policy 0, policy_version 23400 (0.0010) +[2023-10-08 16:39:12,151][21195] Updated weights for policy 0, policy_version 23410 (0.0008) +[2023-10-08 16:39:12,476][21194] Updated weights for policy 1, policy_version 23240 (0.0009) +[2023-10-08 16:39:12,518][21195] Updated weights for policy 0, policy_version 23420 (0.0008) +[2023-10-08 16:39:12,837][21194] Updated weights for policy 1, policy_version 23250 (0.0009) +[2023-10-08 16:39:13,202][21194] Updated weights for policy 1, policy_version 23260 (0.0010) +[2023-10-08 16:39:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 47808512. Throughput: 0: 1718.7, 1: 1705.8. Samples: 11956374. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 16:39:13,804][19739] Avg episode reward: [(0, '665.850'), (1, '665.210')] +[2023-10-08 16:39:13,816][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000023264_23822336.pth... +[2023-10-08 16:39:13,816][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000023424_23986176.pth... +[2023-10-08 16:39:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000021664_22183936.pth +[2023-10-08 16:39:13,860][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000021792_22315008.pth +[2023-10-08 16:39:16,350][21195] Updated weights for policy 0, policy_version 23430 (0.0007) +[2023-10-08 16:39:16,720][21195] Updated weights for policy 0, policy_version 23440 (0.0009) +[2023-10-08 16:39:17,090][21195] Updated weights for policy 0, policy_version 23450 (0.0008) +[2023-10-08 16:39:17,319][21194] Updated weights for policy 1, policy_version 23270 (0.0007) +[2023-10-08 16:39:17,686][21194] Updated weights for policy 1, policy_version 23280 (0.0007) +[2023-10-08 16:39:18,047][21194] Updated weights for policy 1, policy_version 23290 (0.0008) +[2023-10-08 16:39:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 47874048. Throughput: 0: 1722.8, 1: 1725.0. Samples: 11972708. Policy #0 lag: (min: 20.0, avg: 22.7, max: 52.0) +[2023-10-08 16:39:18,803][19739] Avg episode reward: [(0, '665.850'), (1, '665.210')] +[2023-10-08 16:39:20,952][21195] Updated weights for policy 0, policy_version 23460 (0.0009) +[2023-10-08 16:39:21,317][21195] Updated weights for policy 0, policy_version 23470 (0.0008) +[2023-10-08 16:39:21,699][21195] Updated weights for policy 0, policy_version 23480 (0.0008) +[2023-10-08 16:39:21,846][21194] Updated weights for policy 1, policy_version 23300 (0.0007) +[2023-10-08 16:39:22,217][21194] Updated weights for policy 1, policy_version 23310 (0.0009) +[2023-10-08 16:39:22,587][21194] Updated weights for policy 1, policy_version 23320 (0.0007) +[2023-10-08 16:39:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 47939584. Throughput: 0: 1724.7, 1: 1714.6. Samples: 11987970. Policy #0 lag: (min: 20.0, avg: 22.7, max: 52.0) +[2023-10-08 16:39:23,804][19739] Avg episode reward: [(0, '665.850'), (1, '665.210')] +[2023-10-08 16:39:25,745][21195] Updated weights for policy 0, policy_version 23490 (0.0008) +[2023-10-08 16:39:26,121][21195] Updated weights for policy 0, policy_version 23500 (0.0008) +[2023-10-08 16:39:26,328][21194] Updated weights for policy 1, policy_version 23330 (0.0007) +[2023-10-08 16:39:26,487][21195] Updated weights for policy 0, policy_version 23510 (0.0009) +[2023-10-08 16:39:26,694][21194] Updated weights for policy 1, policy_version 23340 (0.0007) +[2023-10-08 16:39:26,869][21195] Updated weights for policy 0, policy_version 23520 (0.0010) +[2023-10-08 16:39:27,056][21194] Updated weights for policy 1, policy_version 23350 (0.0007) +[2023-10-08 16:39:27,430][21194] Updated weights for policy 1, policy_version 23360 (0.0007) +[2023-10-08 16:39:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 48005120. Throughput: 0: 1718.5, 1: 1699.3. Samples: 12008264. Policy #0 lag: (min: 20.0, avg: 22.7, max: 52.0) +[2023-10-08 16:39:28,803][19739] Avg episode reward: [(0, '657.980'), (1, '665.210')] +[2023-10-08 16:39:30,877][21195] Updated weights for policy 0, policy_version 23530 (0.0009) +[2023-10-08 16:39:31,252][21195] Updated weights for policy 0, policy_version 23540 (0.0009) +[2023-10-08 16:39:31,418][21194] Updated weights for policy 1, policy_version 23370 (0.0007) +[2023-10-08 16:39:31,625][21195] Updated weights for policy 0, policy_version 23550 (0.0008) +[2023-10-08 16:39:31,774][21194] Updated weights for policy 1, policy_version 23380 (0.0007) +[2023-10-08 16:39:32,149][21194] Updated weights for policy 1, policy_version 23390 (0.0008) +[2023-10-08 16:39:33,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 48070656. Throughput: 0: 1733.9, 1: 1728.7. Samples: 12024624. Policy #0 lag: (min: 20.0, avg: 22.7, max: 52.0) +[2023-10-08 16:39:33,803][19739] Avg episode reward: [(0, '657.980'), (1, '665.210')] +[2023-10-08 16:39:35,467][21195] Updated weights for policy 0, policy_version 23560 (0.0008) +[2023-10-08 16:39:35,828][21195] Updated weights for policy 0, policy_version 23570 (0.0008) +[2023-10-08 16:39:36,134][21194] Updated weights for policy 1, policy_version 23400 (0.0008) +[2023-10-08 16:39:36,205][21195] Updated weights for policy 0, policy_version 23580 (0.0007) +[2023-10-08 16:39:36,510][21194] Updated weights for policy 1, policy_version 23410 (0.0007) +[2023-10-08 16:39:36,875][21194] Updated weights for policy 1, policy_version 23420 (0.0007) +[2023-10-08 16:39:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 48136192. Throughput: 0: 1709.3, 1: 1696.4. Samples: 12038534. Policy #0 lag: (min: 26.0, avg: 30.4, max: 58.0) +[2023-10-08 16:39:38,803][19739] Avg episode reward: [(0, '657.980'), (1, '659.250')] +[2023-10-08 16:39:40,130][21195] Updated weights for policy 0, policy_version 23590 (0.0010) +[2023-10-08 16:39:40,496][21195] Updated weights for policy 0, policy_version 23600 (0.0007) +[2023-10-08 16:39:40,870][21195] Updated weights for policy 0, policy_version 23610 (0.0008) +[2023-10-08 16:39:40,896][21194] Updated weights for policy 1, policy_version 23430 (0.0008) +[2023-10-08 16:39:41,275][21194] Updated weights for policy 1, policy_version 23440 (0.0010) +[2023-10-08 16:39:41,645][21194] Updated weights for policy 1, policy_version 23450 (0.0008) +[2023-10-08 16:39:43,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 48201728. Throughput: 0: 1718.8, 1: 1697.2. Samples: 12059804. Policy #0 lag: (min: 26.0, avg: 30.4, max: 58.0) +[2023-10-08 16:39:43,803][19739] Avg episode reward: [(0, '663.440'), (1, '659.250')] +[2023-10-08 16:39:44,749][21195] Updated weights for policy 0, policy_version 23620 (0.0009) +[2023-10-08 16:39:45,116][21195] Updated weights for policy 0, policy_version 23630 (0.0007) +[2023-10-08 16:39:45,476][21195] Updated weights for policy 0, policy_version 23640 (0.0009) +[2023-10-08 16:39:45,695][21194] Updated weights for policy 1, policy_version 23460 (0.0008) +[2023-10-08 16:39:46,067][21194] Updated weights for policy 1, policy_version 23470 (0.0009) +[2023-10-08 16:39:46,430][21194] Updated weights for policy 1, policy_version 23480 (0.0009) +[2023-10-08 16:39:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 48267264. Throughput: 0: 1738.5, 1: 1706.4. Samples: 12076014. Policy #0 lag: (min: 26.0, avg: 30.4, max: 58.0) +[2023-10-08 16:39:48,803][19739] Avg episode reward: [(0, '663.440'), (1, '659.250')] +[2023-10-08 16:39:49,488][21195] Updated weights for policy 0, policy_version 23650 (0.0008) +[2023-10-08 16:39:49,853][21195] Updated weights for policy 0, policy_version 23660 (0.0008) +[2023-10-08 16:39:50,234][21195] Updated weights for policy 0, policy_version 23670 (0.0007) +[2023-10-08 16:39:50,490][21194] Updated weights for policy 1, policy_version 23490 (0.0008) +[2023-10-08 16:39:50,599][21195] Updated weights for policy 0, policy_version 23680 (0.0009) +[2023-10-08 16:39:50,850][21194] Updated weights for policy 1, policy_version 23500 (0.0008) +[2023-10-08 16:39:51,221][21194] Updated weights for policy 1, policy_version 23510 (0.0007) +[2023-10-08 16:39:51,587][21194] Updated weights for policy 1, policy_version 23520 (0.0009) +[2023-10-08 16:39:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 48332800. Throughput: 0: 1713.0, 1: 1690.5. Samples: 12090426. Policy #0 lag: (min: 26.0, avg: 30.4, max: 58.0) +[2023-10-08 16:39:53,803][19739] Avg episode reward: [(0, '648.150'), (1, '659.250')] +[2023-10-08 16:39:54,476][21195] Updated weights for policy 0, policy_version 23690 (0.0008) +[2023-10-08 16:39:54,851][21195] Updated weights for policy 0, policy_version 23700 (0.0007) +[2023-10-08 16:39:55,233][21195] Updated weights for policy 0, policy_version 23710 (0.0009) +[2023-10-08 16:39:55,398][21194] Updated weights for policy 1, policy_version 23530 (0.0008) +[2023-10-08 16:39:55,774][21194] Updated weights for policy 1, policy_version 23540 (0.0007) +[2023-10-08 16:39:56,137][21194] Updated weights for policy 1, policy_version 23550 (0.0007) +[2023-10-08 16:39:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 48398336. Throughput: 0: 1745.9, 1: 1720.9. Samples: 12112376. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:39:58,803][19739] Avg episode reward: [(0, '638.080'), (1, '665.590')] +[2023-10-08 16:39:59,158][21195] Updated weights for policy 0, policy_version 23720 (0.0008) +[2023-10-08 16:39:59,528][21195] Updated weights for policy 0, policy_version 23730 (0.0008) +[2023-10-08 16:39:59,901][21195] Updated weights for policy 0, policy_version 23740 (0.0008) +[2023-10-08 16:40:00,056][21194] Updated weights for policy 1, policy_version 23560 (0.0008) +[2023-10-08 16:40:00,421][21194] Updated weights for policy 1, policy_version 23570 (0.0010) +[2023-10-08 16:40:00,788][21194] Updated weights for policy 1, policy_version 23580 (0.0007) +[2023-10-08 16:40:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 48463872. Throughput: 0: 1736.7, 1: 1700.7. Samples: 12127390. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:40:03,803][19739] Avg episode reward: [(0, '624.510'), (1, '664.680')] +[2023-10-08 16:40:03,828][21195] Updated weights for policy 0, policy_version 23750 (0.0007) +[2023-10-08 16:40:04,195][21195] Updated weights for policy 0, policy_version 23760 (0.0008) +[2023-10-08 16:40:04,570][21195] Updated weights for policy 0, policy_version 23770 (0.0008) +[2023-10-08 16:40:04,608][21194] Updated weights for policy 1, policy_version 23590 (0.0008) +[2023-10-08 16:40:04,982][21194] Updated weights for policy 1, policy_version 23600 (0.0009) +[2023-10-08 16:40:05,351][21194] Updated weights for policy 1, policy_version 23610 (0.0008) +[2023-10-08 16:40:08,523][21195] Updated weights for policy 0, policy_version 23780 (0.0008) +[2023-10-08 16:40:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 48529408. Throughput: 0: 1736.6, 1: 1711.5. Samples: 12143134. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:40:08,803][19739] Avg episode reward: [(0, '641.140'), (1, '673.400')] +[2023-10-08 16:40:08,889][21195] Updated weights for policy 0, policy_version 23790 (0.0008) +[2023-10-08 16:40:09,255][21195] Updated weights for policy 0, policy_version 23800 (0.0007) +[2023-10-08 16:40:09,376][21194] Updated weights for policy 1, policy_version 23620 (0.0007) +[2023-10-08 16:40:09,742][21194] Updated weights for policy 1, policy_version 23630 (0.0009) +[2023-10-08 16:40:10,111][21194] Updated weights for policy 1, policy_version 23640 (0.0009) +[2023-10-08 16:40:13,088][21195] Updated weights for policy 0, policy_version 23810 (0.0007) +[2023-10-08 16:40:13,468][21195] Updated weights for policy 0, policy_version 23820 (0.0008) +[2023-10-08 16:40:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 48594944. Throughput: 0: 1746.8, 1: 1728.0. Samples: 12164628. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:40:13,803][19739] Avg episode reward: [(0, '641.140'), (1, '681.690')] +[2023-10-08 16:40:13,828][21195] Updated weights for policy 0, policy_version 23830 (0.0008) +[2023-10-08 16:40:14,026][21194] Updated weights for policy 1, policy_version 23650 (0.0008) +[2023-10-08 16:40:14,204][21195] Updated weights for policy 0, policy_version 23840 (0.0007) +[2023-10-08 16:40:14,387][21194] Updated weights for policy 1, policy_version 23660 (0.0009) +[2023-10-08 16:40:14,751][21194] Updated weights for policy 1, policy_version 23670 (0.0008) +[2023-10-08 16:40:15,120][21194] Updated weights for policy 1, policy_version 23680 (0.0009) +[2023-10-08 16:40:18,156][21195] Updated weights for policy 0, policy_version 23850 (0.0010) +[2023-10-08 16:40:18,525][21195] Updated weights for policy 0, policy_version 23860 (0.0008) +[2023-10-08 16:40:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 48660480. Throughput: 0: 1728.8, 1: 1698.2. Samples: 12178840. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:40:18,803][19739] Avg episode reward: [(0, '641.140'), (1, '628.410')] +[2023-10-08 16:40:18,894][21195] Updated weights for policy 0, policy_version 23870 (0.0007) +[2023-10-08 16:40:19,117][21194] Updated weights for policy 1, policy_version 23690 (0.0009) +[2023-10-08 16:40:19,496][21194] Updated weights for policy 1, policy_version 23700 (0.0010) +[2023-10-08 16:40:19,867][21194] Updated weights for policy 1, policy_version 23710 (0.0008) +[2023-10-08 16:40:22,724][21195] Updated weights for policy 0, policy_version 23880 (0.0010) +[2023-10-08 16:40:23,088][21195] Updated weights for policy 0, policy_version 23890 (0.0007) +[2023-10-08 16:40:23,455][21195] Updated weights for policy 0, policy_version 23900 (0.0008) +[2023-10-08 16:40:23,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 48758784. Throughput: 0: 1754.8, 1: 1723.7. Samples: 12195066. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:40:23,803][19739] Avg episode reward: [(0, '641.140'), (1, '625.310')] +[2023-10-08 16:40:23,905][21194] Updated weights for policy 1, policy_version 23720 (0.0009) +[2023-10-08 16:40:24,266][21194] Updated weights for policy 1, policy_version 23730 (0.0010) +[2023-10-08 16:40:24,623][21194] Updated weights for policy 1, policy_version 23740 (0.0007) +[2023-10-08 16:40:27,536][21195] Updated weights for policy 0, policy_version 23910 (0.0008) +[2023-10-08 16:40:27,911][21195] Updated weights for policy 0, policy_version 23920 (0.0008) +[2023-10-08 16:40:28,276][21195] Updated weights for policy 0, policy_version 23930 (0.0008) +[2023-10-08 16:40:28,711][21194] Updated weights for policy 1, policy_version 23750 (0.0008) +[2023-10-08 16:40:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 48824320. Throughput: 0: 1738.3, 1: 1730.1. Samples: 12215882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:40:28,803][19739] Avg episode reward: [(0, '641.310'), (1, '625.540')] +[2023-10-08 16:40:29,093][21194] Updated weights for policy 1, policy_version 23760 (0.0010) +[2023-10-08 16:40:29,451][21194] Updated weights for policy 1, policy_version 23770 (0.0008) +[2023-10-08 16:40:32,124][21195] Updated weights for policy 0, policy_version 23940 (0.0008) +[2023-10-08 16:40:32,493][21195] Updated weights for policy 0, policy_version 23950 (0.0008) +[2023-10-08 16:40:32,863][21195] Updated weights for policy 0, policy_version 23960 (0.0008) +[2023-10-08 16:40:33,578][21194] Updated weights for policy 1, policy_version 23780 (0.0007) +[2023-10-08 16:40:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 48889856. Throughput: 0: 1722.1, 1: 1707.2. Samples: 12230334. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:40:33,803][19739] Avg episode reward: [(0, '641.310'), (1, '625.540')] +[2023-10-08 16:40:33,950][21194] Updated weights for policy 1, policy_version 23790 (0.0008) +[2023-10-08 16:40:34,306][21194] Updated weights for policy 1, policy_version 23800 (0.0010) +[2023-10-08 16:40:36,753][21195] Updated weights for policy 0, policy_version 23970 (0.0008) +[2023-10-08 16:40:37,123][21195] Updated weights for policy 0, policy_version 23980 (0.0009) +[2023-10-08 16:40:37,496][21195] Updated weights for policy 0, policy_version 23990 (0.0010) +[2023-10-08 16:40:37,863][21195] Updated weights for policy 0, policy_version 24000 (0.0009) +[2023-10-08 16:40:38,269][21194] Updated weights for policy 1, policy_version 23810 (0.0010) +[2023-10-08 16:40:38,635][21194] Updated weights for policy 1, policy_version 23820 (0.0007) +[2023-10-08 16:40:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 48955392. Throughput: 0: 1750.2, 1: 1724.5. Samples: 12246786. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:40:38,803][19739] Avg episode reward: [(0, '633.970'), (1, '637.280')] +[2023-10-08 16:40:39,002][21194] Updated weights for policy 1, policy_version 23830 (0.0008) +[2023-10-08 16:40:39,365][21194] Updated weights for policy 1, policy_version 23840 (0.0007) +[2023-10-08 16:40:41,794][21195] Updated weights for policy 0, policy_version 24010 (0.0008) +[2023-10-08 16:40:42,166][21195] Updated weights for policy 0, policy_version 24020 (0.0009) +[2023-10-08 16:40:42,524][21195] Updated weights for policy 0, policy_version 24030 (0.0007) +[2023-10-08 16:40:43,290][21194] Updated weights for policy 1, policy_version 23850 (0.0007) +[2023-10-08 16:40:43,657][21194] Updated weights for policy 1, policy_version 23860 (0.0008) +[2023-10-08 16:40:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 49020928. Throughput: 0: 1719.3, 1: 1719.4. Samples: 12267118. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:40:43,803][19739] Avg episode reward: [(0, '636.180'), (1, '637.280')] +[2023-10-08 16:40:44,022][21194] Updated weights for policy 1, policy_version 23870 (0.0008) +[2023-10-08 16:40:46,249][21195] Updated weights for policy 0, policy_version 24040 (0.0007) +[2023-10-08 16:40:46,616][21195] Updated weights for policy 0, policy_version 24050 (0.0007) +[2023-10-08 16:40:46,981][21195] Updated weights for policy 0, policy_version 24060 (0.0007) +[2023-10-08 16:40:47,877][21194] Updated weights for policy 1, policy_version 23880 (0.0009) +[2023-10-08 16:40:48,239][21194] Updated weights for policy 1, policy_version 23890 (0.0011) +[2023-10-08 16:40:48,619][21194] Updated weights for policy 1, policy_version 23900 (0.0011) +[2023-10-08 16:40:48,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 49119232. Throughput: 0: 1731.5, 1: 1721.3. Samples: 12282766. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 16:40:48,803][19739] Avg episode reward: [(0, '636.180'), (1, '666.380')] +[2023-10-08 16:40:50,867][21195] Updated weights for policy 0, policy_version 24070 (0.0008) +[2023-10-08 16:40:51,238][21195] Updated weights for policy 0, policy_version 24080 (0.0008) +[2023-10-08 16:40:51,609][21195] Updated weights for policy 0, policy_version 24090 (0.0007) +[2023-10-08 16:40:52,495][21194] Updated weights for policy 1, policy_version 23910 (0.0009) +[2023-10-08 16:40:52,865][21194] Updated weights for policy 1, policy_version 23920 (0.0007) +[2023-10-08 16:40:53,225][21194] Updated weights for policy 1, policy_version 23930 (0.0008) +[2023-10-08 16:40:53,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 49184768. Throughput: 0: 1727.2, 1: 1720.8. Samples: 12298298. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 16:40:53,804][19739] Avg episode reward: [(0, '636.180'), (1, '666.380')] +[2023-10-08 16:40:55,431][21195] Updated weights for policy 0, policy_version 24100 (0.0008) +[2023-10-08 16:40:55,806][21195] Updated weights for policy 0, policy_version 24110 (0.0008) +[2023-10-08 16:40:56,178][21195] Updated weights for policy 0, policy_version 24120 (0.0009) +[2023-10-08 16:40:57,266][21194] Updated weights for policy 1, policy_version 23940 (0.0008) +[2023-10-08 16:40:57,637][21194] Updated weights for policy 1, policy_version 23950 (0.0008) +[2023-10-08 16:40:58,002][21194] Updated weights for policy 1, policy_version 23960 (0.0007) +[2023-10-08 16:40:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 49250304. Throughput: 0: 1730.0, 1: 1699.3. Samples: 12318948. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 16:40:58,803][19739] Avg episode reward: [(0, '636.180'), (1, '666.380')] +[2023-10-08 16:41:00,016][21195] Updated weights for policy 0, policy_version 24130 (0.0007) +[2023-10-08 16:41:00,387][21195] Updated weights for policy 0, policy_version 24140 (0.0008) +[2023-10-08 16:41:00,760][21195] Updated weights for policy 0, policy_version 24150 (0.0008) +[2023-10-08 16:41:01,122][21195] Updated weights for policy 0, policy_version 24160 (0.0008) +[2023-10-08 16:41:01,929][21194] Updated weights for policy 1, policy_version 23970 (0.0008) +[2023-10-08 16:41:02,286][21194] Updated weights for policy 1, policy_version 23980 (0.0008) +[2023-10-08 16:41:02,654][21194] Updated weights for policy 1, policy_version 23990 (0.0007) +[2023-10-08 16:41:03,031][21194] Updated weights for policy 1, policy_version 24000 (0.0009) +[2023-10-08 16:41:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 49315840. Throughput: 0: 1756.1, 1: 1725.3. Samples: 12335504. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 16:41:03,803][19739] Avg episode reward: [(0, '644.990'), (1, '659.840')] +[2023-10-08 16:41:05,138][21195] Updated weights for policy 0, policy_version 24170 (0.0011) +[2023-10-08 16:41:05,508][21195] Updated weights for policy 0, policy_version 24180 (0.0010) +[2023-10-08 16:41:05,882][21195] Updated weights for policy 0, policy_version 24190 (0.0007) +[2023-10-08 16:41:07,049][21194] Updated weights for policy 1, policy_version 24010 (0.0011) +[2023-10-08 16:41:07,410][21194] Updated weights for policy 1, policy_version 24020 (0.0011) +[2023-10-08 16:41:07,784][21194] Updated weights for policy 1, policy_version 24030 (0.0008) +[2023-10-08 16:41:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 49381376. Throughput: 0: 1725.4, 1: 1720.1. Samples: 12350116. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 16:41:08,803][19739] Avg episode reward: [(0, '646.660'), (1, '673.560')] +[2023-10-08 16:41:09,828][21195] Updated weights for policy 0, policy_version 24200 (0.0009) +[2023-10-08 16:41:10,201][21195] Updated weights for policy 0, policy_version 24210 (0.0010) +[2023-10-08 16:41:10,566][21195] Updated weights for policy 0, policy_version 24220 (0.0010) +[2023-10-08 16:41:11,755][21194] Updated weights for policy 1, policy_version 24040 (0.0008) +[2023-10-08 16:41:12,134][21194] Updated weights for policy 1, policy_version 24050 (0.0008) +[2023-10-08 16:41:12,505][21194] Updated weights for policy 1, policy_version 24060 (0.0007) +[2023-10-08 16:41:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 49446912. Throughput: 0: 1739.4, 1: 1700.3. Samples: 12370666. Policy #0 lag: (min: 5.0, avg: 28.1, max: 32.0) +[2023-10-08 16:41:13,804][19739] Avg episode reward: [(0, '646.660'), (1, '685.750')] +[2023-10-08 16:41:13,816][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000024224_24805376.pth... +[2023-10-08 16:41:13,816][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000024064_24641536.pth... +[2023-10-08 16:41:13,849][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000022464_23003136.pth +[2023-10-08 16:41:13,850][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000022624_23166976.pth +[2023-10-08 16:41:13,853][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000024064_24641536.pth +[2023-10-08 16:41:13,854][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000024224_24805376.pth +[2023-10-08 16:41:14,552][21195] Updated weights for policy 0, policy_version 24230 (0.0009) +[2023-10-08 16:41:14,924][21195] Updated weights for policy 0, policy_version 24240 (0.0007) +[2023-10-08 16:41:15,290][21195] Updated weights for policy 0, policy_version 24250 (0.0008) +[2023-10-08 16:41:16,492][21194] Updated weights for policy 1, policy_version 24070 (0.0008) +[2023-10-08 16:41:16,857][21194] Updated weights for policy 1, policy_version 24080 (0.0007) +[2023-10-08 16:41:17,228][21194] Updated weights for policy 1, policy_version 24090 (0.0009) +[2023-10-08 16:41:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 49512448. Throughput: 0: 1758.2, 1: 1736.3. Samples: 12387584. Policy #0 lag: (min: 5.0, avg: 28.1, max: 32.0) +[2023-10-08 16:41:18,803][19739] Avg episode reward: [(0, '646.660'), (1, '706.510')] +[2023-10-08 16:41:19,160][21195] Updated weights for policy 0, policy_version 24260 (0.0009) +[2023-10-08 16:41:19,524][21195] Updated weights for policy 0, policy_version 24270 (0.0010) +[2023-10-08 16:41:19,901][21195] Updated weights for policy 0, policy_version 24280 (0.0007) +[2023-10-08 16:41:21,304][21194] Updated weights for policy 1, policy_version 24100 (0.0009) +[2023-10-08 16:41:21,658][21194] Updated weights for policy 1, policy_version 24110 (0.0009) +[2023-10-08 16:41:22,030][21194] Updated weights for policy 1, policy_version 24120 (0.0007) +[2023-10-08 16:41:23,659][21195] Updated weights for policy 0, policy_version 24290 (0.0008) +[2023-10-08 16:41:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 49577984. Throughput: 0: 1728.9, 1: 1716.4. Samples: 12401822. Policy #0 lag: (min: 5.0, avg: 28.1, max: 32.0) +[2023-10-08 16:41:23,803][19739] Avg episode reward: [(0, '646.660'), (1, '684.190')] +[2023-10-08 16:41:24,035][21195] Updated weights for policy 0, policy_version 24300 (0.0010) +[2023-10-08 16:41:24,398][21195] Updated weights for policy 0, policy_version 24310 (0.0007) +[2023-10-08 16:41:24,757][21195] Updated weights for policy 0, policy_version 24320 (0.0009) +[2023-10-08 16:41:25,915][21194] Updated weights for policy 1, policy_version 24130 (0.0008) +[2023-10-08 16:41:26,287][21194] Updated weights for policy 1, policy_version 24140 (0.0007) +[2023-10-08 16:41:26,641][21194] Updated weights for policy 1, policy_version 24150 (0.0007) +[2023-10-08 16:41:27,010][21194] Updated weights for policy 1, policy_version 24160 (0.0008) +[2023-10-08 16:41:28,764][21195] Updated weights for policy 0, policy_version 24330 (0.0009) +[2023-10-08 16:41:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 49643520. Throughput: 0: 1757.0, 1: 1706.8. Samples: 12422992. Policy #0 lag: (min: 5.0, avg: 28.1, max: 32.0) +[2023-10-08 16:41:28,803][19739] Avg episode reward: [(0, '640.500'), (1, '650.140')] +[2023-10-08 16:41:29,127][21195] Updated weights for policy 0, policy_version 24340 (0.0007) +[2023-10-08 16:41:29,502][21195] Updated weights for policy 0, policy_version 24350 (0.0008) +[2023-10-08 16:41:30,897][21194] Updated weights for policy 1, policy_version 24170 (0.0007) +[2023-10-08 16:41:31,263][21194] Updated weights for policy 1, policy_version 24180 (0.0007) +[2023-10-08 16:41:31,636][21194] Updated weights for policy 1, policy_version 24190 (0.0008) +[2023-10-08 16:41:33,442][21195] Updated weights for policy 0, policy_version 24360 (0.0010) +[2023-10-08 16:41:33,798][21195] Updated weights for policy 0, policy_version 24370 (0.0010) +[2023-10-08 16:41:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 49709056. Throughput: 0: 1734.6, 1: 1726.0. Samples: 12438494. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 16:41:33,803][19739] Avg episode reward: [(0, '640.500'), (1, '650.140')] +[2023-10-08 16:41:34,173][21195] Updated weights for policy 0, policy_version 24380 (0.0011) +[2023-10-08 16:41:35,509][21194] Updated weights for policy 1, policy_version 24200 (0.0009) +[2023-10-08 16:41:35,865][21194] Updated weights for policy 1, policy_version 24210 (0.0009) +[2023-10-08 16:41:36,234][21194] Updated weights for policy 1, policy_version 24220 (0.0008) +[2023-10-08 16:41:38,137][21195] Updated weights for policy 0, policy_version 24390 (0.0009) +[2023-10-08 16:41:38,504][21195] Updated weights for policy 0, policy_version 24400 (0.0009) +[2023-10-08 16:41:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 49774592. Throughput: 0: 1748.0, 1: 1713.6. Samples: 12454068. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 16:41:38,803][19739] Avg episode reward: [(0, '646.530'), (1, '650.140')] +[2023-10-08 16:41:38,868][21195] Updated weights for policy 0, policy_version 24410 (0.0010) +[2023-10-08 16:41:40,024][21194] Updated weights for policy 1, policy_version 24230 (0.0009) +[2023-10-08 16:41:40,395][21194] Updated weights for policy 1, policy_version 24240 (0.0007) +[2023-10-08 16:41:40,757][21194] Updated weights for policy 1, policy_version 24250 (0.0008) +[2023-10-08 16:41:42,817][21195] Updated weights for policy 0, policy_version 24420 (0.0011) +[2023-10-08 16:41:43,192][21195] Updated weights for policy 0, policy_version 24430 (0.0010) +[2023-10-08 16:41:43,572][21195] Updated weights for policy 0, policy_version 24440 (0.0008) +[2023-10-08 16:41:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 49840128. Throughput: 0: 1739.8, 1: 1739.5. Samples: 12475516. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 16:41:43,804][19739] Avg episode reward: [(0, '646.530'), (1, '641.020')] +[2023-10-08 16:41:44,723][21194] Updated weights for policy 1, policy_version 24260 (0.0007) +[2023-10-08 16:41:45,089][21194] Updated weights for policy 1, policy_version 24270 (0.0009) +[2023-10-08 16:41:45,452][21194] Updated weights for policy 1, policy_version 24280 (0.0009) +[2023-10-08 16:41:47,471][21195] Updated weights for policy 0, policy_version 24450 (0.0009) +[2023-10-08 16:41:47,835][21195] Updated weights for policy 0, policy_version 24460 (0.0009) +[2023-10-08 16:41:48,206][21195] Updated weights for policy 0, policy_version 24470 (0.0007) +[2023-10-08 16:41:48,579][21195] Updated weights for policy 0, policy_version 24480 (0.0008) +[2023-10-08 16:41:48,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 49938432. Throughput: 0: 1713.2, 1: 1713.5. Samples: 12489708. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 16:41:48,803][19739] Avg episode reward: [(0, '646.530'), (1, '641.200')] +[2023-10-08 16:41:49,482][21194] Updated weights for policy 1, policy_version 24290 (0.0009) +[2023-10-08 16:41:49,846][21194] Updated weights for policy 1, policy_version 24300 (0.0011) +[2023-10-08 16:41:50,222][21194] Updated weights for policy 1, policy_version 24310 (0.0008) +[2023-10-08 16:41:50,590][21194] Updated weights for policy 1, policy_version 24320 (0.0009) +[2023-10-08 16:41:52,567][21195] Updated weights for policy 0, policy_version 24490 (0.0008) +[2023-10-08 16:41:52,944][21195] Updated weights for policy 0, policy_version 24500 (0.0007) +[2023-10-08 16:41:53,322][21195] Updated weights for policy 0, policy_version 24510 (0.0007) +[2023-10-08 16:41:53,802][19739] Fps is (10 sec: 16384.4, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 50003968. Throughput: 0: 1749.3, 1: 1719.6. Samples: 12506216. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 16:41:53,803][19739] Avg episode reward: [(0, '646.530'), (1, '616.580')] +[2023-10-08 16:41:54,438][21194] Updated weights for policy 1, policy_version 24330 (0.0008) +[2023-10-08 16:41:54,809][21194] Updated weights for policy 1, policy_version 24340 (0.0011) +[2023-10-08 16:41:55,173][21194] Updated weights for policy 1, policy_version 24350 (0.0008) +[2023-10-08 16:41:57,233][21195] Updated weights for policy 0, policy_version 24520 (0.0007) +[2023-10-08 16:41:57,604][21195] Updated weights for policy 0, policy_version 24530 (0.0007) +[2023-10-08 16:41:57,967][21195] Updated weights for policy 0, policy_version 24540 (0.0008) +[2023-10-08 16:41:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 50069504. Throughput: 0: 1724.9, 1: 1747.5. Samples: 12526922. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 16:41:58,803][19739] Avg episode reward: [(0, '647.870'), (1, '616.580')] +[2023-10-08 16:41:59,079][21194] Updated weights for policy 1, policy_version 24360 (0.0008) +[2023-10-08 16:41:59,450][21194] Updated weights for policy 1, policy_version 24370 (0.0008) +[2023-10-08 16:41:59,819][21194] Updated weights for policy 1, policy_version 24380 (0.0007) +[2023-10-08 16:42:01,989][21195] Updated weights for policy 0, policy_version 24550 (0.0010) +[2023-10-08 16:42:02,353][21195] Updated weights for policy 0, policy_version 24560 (0.0008) +[2023-10-08 16:42:02,723][21195] Updated weights for policy 0, policy_version 24570 (0.0008) +[2023-10-08 16:42:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 50135040. Throughput: 0: 1710.0, 1: 1717.5. Samples: 12541818. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 16:42:03,803][19739] Avg episode reward: [(0, '647.870'), (1, '608.990')] +[2023-10-08 16:42:03,896][21194] Updated weights for policy 1, policy_version 24390 (0.0009) +[2023-10-08 16:42:04,258][21194] Updated weights for policy 1, policy_version 24400 (0.0010) +[2023-10-08 16:42:04,615][21194] Updated weights for policy 1, policy_version 24410 (0.0009) +[2023-10-08 16:42:06,593][21195] Updated weights for policy 0, policy_version 24580 (0.0009) +[2023-10-08 16:42:06,963][21195] Updated weights for policy 0, policy_version 24590 (0.0007) +[2023-10-08 16:42:07,341][21195] Updated weights for policy 0, policy_version 24600 (0.0007) +[2023-10-08 16:42:08,482][21194] Updated weights for policy 1, policy_version 24420 (0.0008) +[2023-10-08 16:42:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 50200576. Throughput: 0: 1732.8, 1: 1742.8. Samples: 12558222. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 16:42:08,803][19739] Avg episode reward: [(0, '649.950'), (1, '608.990')] +[2023-10-08 16:42:08,847][21194] Updated weights for policy 1, policy_version 24430 (0.0009) +[2023-10-08 16:42:09,209][21194] Updated weights for policy 1, policy_version 24440 (0.0009) +[2023-10-08 16:42:11,406][21195] Updated weights for policy 0, policy_version 24610 (0.0008) +[2023-10-08 16:42:11,783][21195] Updated weights for policy 0, policy_version 24620 (0.0008) +[2023-10-08 16:42:12,147][21195] Updated weights for policy 0, policy_version 24630 (0.0010) +[2023-10-08 16:42:12,519][21195] Updated weights for policy 0, policy_version 24640 (0.0009) +[2023-10-08 16:42:13,148][21194] Updated weights for policy 1, policy_version 24450 (0.0007) +[2023-10-08 16:42:13,510][21194] Updated weights for policy 1, policy_version 24460 (0.0007) +[2023-10-08 16:42:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 50266112. Throughput: 0: 1707.1, 1: 1754.2. Samples: 12578750. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 16:42:13,803][19739] Avg episode reward: [(0, '649.950'), (1, '602.650')] +[2023-10-08 16:42:13,874][21194] Updated weights for policy 1, policy_version 24470 (0.0008) +[2023-10-08 16:42:14,243][21194] Updated weights for policy 1, policy_version 24480 (0.0007) +[2023-10-08 16:42:16,299][21195] Updated weights for policy 0, policy_version 24650 (0.0009) +[2023-10-08 16:42:16,673][21195] Updated weights for policy 0, policy_version 24660 (0.0008) +[2023-10-08 16:42:17,037][21195] Updated weights for policy 0, policy_version 24670 (0.0009) +[2023-10-08 16:42:18,228][21194] Updated weights for policy 1, policy_version 24490 (0.0007) +[2023-10-08 16:42:18,595][21194] Updated weights for policy 1, policy_version 24500 (0.0007) +[2023-10-08 16:42:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 50331648. Throughput: 0: 1728.6, 1: 1730.2. Samples: 12594142. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 16:42:18,803][19739] Avg episode reward: [(0, '649.950'), (1, '602.650')] +[2023-10-08 16:42:18,962][21194] Updated weights for policy 1, policy_version 24510 (0.0009) +[2023-10-08 16:42:21,057][21195] Updated weights for policy 0, policy_version 24680 (0.0009) +[2023-10-08 16:42:21,437][21195] Updated weights for policy 0, policy_version 24690 (0.0007) +[2023-10-08 16:42:21,804][21195] Updated weights for policy 0, policy_version 24700 (0.0008) +[2023-10-08 16:42:22,803][21194] Updated weights for policy 1, policy_version 24520 (0.0010) +[2023-10-08 16:42:23,165][21194] Updated weights for policy 1, policy_version 24530 (0.0009) +[2023-10-08 16:42:23,535][21194] Updated weights for policy 1, policy_version 24540 (0.0008) +[2023-10-08 16:42:23,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 50429952. Throughput: 0: 1716.1, 1: 1743.6. Samples: 12609754. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 16:42:23,804][19739] Avg episode reward: [(0, '649.950'), (1, '602.650')] +[2023-10-08 16:42:25,451][21195] Updated weights for policy 0, policy_version 24710 (0.0011) +[2023-10-08 16:42:25,813][21195] Updated weights for policy 0, policy_version 24720 (0.0009) +[2023-10-08 16:42:26,188][21195] Updated weights for policy 0, policy_version 24730 (0.0009) +[2023-10-08 16:42:27,391][21194] Updated weights for policy 1, policy_version 24550 (0.0008) +[2023-10-08 16:42:27,763][21194] Updated weights for policy 1, policy_version 24560 (0.0009) +[2023-10-08 16:42:28,117][21194] Updated weights for policy 1, policy_version 24570 (0.0009) +[2023-10-08 16:42:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 50495488. Throughput: 0: 1724.8, 1: 1724.5. Samples: 12630734. Policy #0 lag: (min: 3.0, avg: 17.0, max: 35.0) +[2023-10-08 16:42:28,803][19739] Avg episode reward: [(0, '656.870'), (1, '608.450')] +[2023-10-08 16:42:29,894][21195] Updated weights for policy 0, policy_version 24740 (0.0008) +[2023-10-08 16:42:30,270][21195] Updated weights for policy 0, policy_version 24750 (0.0007) +[2023-10-08 16:42:30,642][21195] Updated weights for policy 0, policy_version 24760 (0.0009) +[2023-10-08 16:42:31,934][21194] Updated weights for policy 1, policy_version 24580 (0.0009) +[2023-10-08 16:42:32,298][21194] Updated weights for policy 1, policy_version 24590 (0.0007) +[2023-10-08 16:42:32,668][21194] Updated weights for policy 1, policy_version 24600 (0.0007) +[2023-10-08 16:42:33,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 50561024. Throughput: 0: 1750.8, 1: 1750.2. Samples: 12647254. Policy #0 lag: (min: 3.0, avg: 17.0, max: 35.0) +[2023-10-08 16:42:33,803][19739] Avg episode reward: [(0, '657.140'), (1, '608.450')] +[2023-10-08 16:42:34,537][21195] Updated weights for policy 0, policy_version 24770 (0.0010) +[2023-10-08 16:42:34,908][21195] Updated weights for policy 0, policy_version 24780 (0.0011) +[2023-10-08 16:42:35,270][21195] Updated weights for policy 0, policy_version 24790 (0.0007) +[2023-10-08 16:42:35,635][21195] Updated weights for policy 0, policy_version 24800 (0.0007) +[2023-10-08 16:42:36,700][21194] Updated weights for policy 1, policy_version 24610 (0.0008) +[2023-10-08 16:42:37,066][21194] Updated weights for policy 1, policy_version 24620 (0.0007) +[2023-10-08 16:42:37,434][21194] Updated weights for policy 1, policy_version 24630 (0.0009) +[2023-10-08 16:42:37,802][21194] Updated weights for policy 1, policy_version 24640 (0.0008) +[2023-10-08 16:42:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 50626560. Throughput: 0: 1724.4, 1: 1743.6. Samples: 12662272. Policy #0 lag: (min: 3.0, avg: 17.0, max: 35.0) +[2023-10-08 16:42:38,803][19739] Avg episode reward: [(0, '657.140'), (1, '609.700')] +[2023-10-08 16:42:39,605][21195] Updated weights for policy 0, policy_version 24810 (0.0007) +[2023-10-08 16:42:39,979][21195] Updated weights for policy 0, policy_version 24820 (0.0008) +[2023-10-08 16:42:40,350][21195] Updated weights for policy 0, policy_version 24830 (0.0007) +[2023-10-08 16:42:41,889][21194] Updated weights for policy 1, policy_version 24650 (0.0008) +[2023-10-08 16:42:42,253][21194] Updated weights for policy 1, policy_version 24660 (0.0008) +[2023-10-08 16:42:42,621][21194] Updated weights for policy 1, policy_version 24670 (0.0008) +[2023-10-08 16:42:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 50692096. Throughput: 0: 1747.5, 1: 1712.5. Samples: 12682622. Policy #0 lag: (min: 3.0, avg: 17.0, max: 35.0) +[2023-10-08 16:42:43,803][19739] Avg episode reward: [(0, '657.150'), (1, '596.190')] +[2023-10-08 16:42:44,231][21195] Updated weights for policy 0, policy_version 24840 (0.0007) +[2023-10-08 16:42:44,600][21195] Updated weights for policy 0, policy_version 24850 (0.0008) +[2023-10-08 16:42:44,960][21195] Updated weights for policy 0, policy_version 24860 (0.0007) +[2023-10-08 16:42:46,566][21194] Updated weights for policy 1, policy_version 24680 (0.0011) +[2023-10-08 16:42:46,935][21194] Updated weights for policy 1, policy_version 24690 (0.0008) +[2023-10-08 16:42:47,301][21194] Updated weights for policy 1, policy_version 24700 (0.0010) +[2023-10-08 16:42:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 50757632. Throughput: 0: 1758.4, 1: 1744.4. Samples: 12699442. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:42:48,803][19739] Avg episode reward: [(0, '657.150'), (1, '596.190')] +[2023-10-08 16:42:48,972][21195] Updated weights for policy 0, policy_version 24870 (0.0008) +[2023-10-08 16:42:49,343][21195] Updated weights for policy 0, policy_version 24880 (0.0009) +[2023-10-08 16:42:49,716][21195] Updated weights for policy 0, policy_version 24890 (0.0007) +[2023-10-08 16:42:51,424][21194] Updated weights for policy 1, policy_version 24710 (0.0009) +[2023-10-08 16:42:51,807][21194] Updated weights for policy 1, policy_version 24720 (0.0008) +[2023-10-08 16:42:52,181][21194] Updated weights for policy 1, policy_version 24730 (0.0007) +[2023-10-08 16:42:53,537][21195] Updated weights for policy 0, policy_version 24900 (0.0007) +[2023-10-08 16:42:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 50823168. Throughput: 0: 1739.7, 1: 1719.5. Samples: 12713884. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:42:53,803][19739] Avg episode reward: [(0, '643.690'), (1, '596.190')] +[2023-10-08 16:42:53,911][21195] Updated weights for policy 0, policy_version 24910 (0.0009) +[2023-10-08 16:42:54,283][21195] Updated weights for policy 0, policy_version 24920 (0.0008) +[2023-10-08 16:42:56,106][21194] Updated weights for policy 1, policy_version 24740 (0.0009) +[2023-10-08 16:42:56,479][21194] Updated weights for policy 1, policy_version 24750 (0.0010) +[2023-10-08 16:42:56,830][21194] Updated weights for policy 1, policy_version 24760 (0.0007) +[2023-10-08 16:42:58,271][21195] Updated weights for policy 0, policy_version 24930 (0.0009) +[2023-10-08 16:42:58,646][21195] Updated weights for policy 0, policy_version 24940 (0.0007) +[2023-10-08 16:42:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 50888704. Throughput: 0: 1763.7, 1: 1708.8. Samples: 12735012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:42:58,803][19739] Avg episode reward: [(0, '645.910'), (1, '589.380')] +[2023-10-08 16:42:59,011][21195] Updated weights for policy 0, policy_version 24950 (0.0007) +[2023-10-08 16:42:59,370][21195] Updated weights for policy 0, policy_version 24960 (0.0009) +[2023-10-08 16:43:00,442][21194] Updated weights for policy 1, policy_version 24770 (0.0008) +[2023-10-08 16:43:00,805][21194] Updated weights for policy 1, policy_version 24780 (0.0008) +[2023-10-08 16:43:01,172][21194] Updated weights for policy 1, policy_version 24790 (0.0008) +[2023-10-08 16:43:01,539][21194] Updated weights for policy 1, policy_version 24800 (0.0007) +[2023-10-08 16:43:03,262][21195] Updated weights for policy 0, policy_version 24970 (0.0009) +[2023-10-08 16:43:03,640][21195] Updated weights for policy 0, policy_version 24980 (0.0007) +[2023-10-08 16:43:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 50954240. Throughput: 0: 1740.0, 1: 1731.5. Samples: 12750356. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:43:03,803][19739] Avg episode reward: [(0, '645.910'), (1, '581.990')] +[2023-10-08 16:43:04,008][21195] Updated weights for policy 0, policy_version 24990 (0.0007) +[2023-10-08 16:43:05,424][21194] Updated weights for policy 1, policy_version 24810 (0.0009) +[2023-10-08 16:43:05,794][21194] Updated weights for policy 1, policy_version 24820 (0.0009) +[2023-10-08 16:43:06,161][21194] Updated weights for policy 1, policy_version 24830 (0.0008) +[2023-10-08 16:43:07,761][21195] Updated weights for policy 0, policy_version 25000 (0.0009) +[2023-10-08 16:43:08,127][21195] Updated weights for policy 0, policy_version 25010 (0.0008) +[2023-10-08 16:43:08,507][21195] Updated weights for policy 0, policy_version 25020 (0.0011) +[2023-10-08 16:43:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 51052544. Throughput: 0: 1764.3, 1: 1719.6. Samples: 12766530. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 16:43:08,803][19739] Avg episode reward: [(0, '645.910'), (1, '581.990')] +[2023-10-08 16:43:10,166][21194] Updated weights for policy 1, policy_version 24840 (0.0010) +[2023-10-08 16:43:10,534][21194] Updated weights for policy 1, policy_version 24850 (0.0010) +[2023-10-08 16:43:10,895][21194] Updated weights for policy 1, policy_version 24860 (0.0008) +[2023-10-08 16:43:12,446][21195] Updated weights for policy 0, policy_version 25030 (0.0009) +[2023-10-08 16:43:12,820][21195] Updated weights for policy 0, policy_version 25040 (0.0007) +[2023-10-08 16:43:13,199][21195] Updated weights for policy 0, policy_version 25050 (0.0007) +[2023-10-08 16:43:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 51118080. Throughput: 0: 1746.7, 1: 1731.3. Samples: 12787244. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 16:43:13,803][19739] Avg episode reward: [(0, '645.910'), (1, '581.990')] +[2023-10-08 16:43:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000025056_25657344.pth... +[2023-10-08 16:43:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000024864_25460736.pth... +[2023-10-08 16:43:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000023264_23822336.pth +[2023-10-08 16:43:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000023424_23986176.pth +[2023-10-08 16:43:14,742][21194] Updated weights for policy 1, policy_version 24870 (0.0009) +[2023-10-08 16:43:15,108][21194] Updated weights for policy 1, policy_version 24880 (0.0007) +[2023-10-08 16:43:15,475][21194] Updated weights for policy 1, policy_version 24890 (0.0008) +[2023-10-08 16:43:17,066][21195] Updated weights for policy 0, policy_version 25060 (0.0011) +[2023-10-08 16:43:17,440][21195] Updated weights for policy 0, policy_version 25070 (0.0009) +[2023-10-08 16:43:17,819][21195] Updated weights for policy 0, policy_version 25080 (0.0011) +[2023-10-08 16:43:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 51183616. Throughput: 0: 1726.9, 1: 1709.5. Samples: 12801894. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 16:43:18,803][19739] Avg episode reward: [(0, '660.500'), (1, '581.990')] +[2023-10-08 16:43:19,293][21194] Updated weights for policy 1, policy_version 24900 (0.0008) +[2023-10-08 16:43:19,669][21194] Updated weights for policy 1, policy_version 24910 (0.0009) +[2023-10-08 16:43:20,035][21194] Updated weights for policy 1, policy_version 24920 (0.0010) +[2023-10-08 16:43:21,713][21195] Updated weights for policy 0, policy_version 25090 (0.0010) +[2023-10-08 16:43:22,083][21195] Updated weights for policy 0, policy_version 25100 (0.0009) +[2023-10-08 16:43:22,451][21195] Updated weights for policy 0, policy_version 25110 (0.0007) +[2023-10-08 16:43:22,814][21195] Updated weights for policy 0, policy_version 25120 (0.0008) +[2023-10-08 16:43:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 51249152. Throughput: 0: 1749.6, 1: 1718.5. Samples: 12818336. Policy #0 lag: (min: 10.0, avg: 10.1, max: 17.0) +[2023-10-08 16:43:23,803][19739] Avg episode reward: [(0, '660.500'), (1, '581.990')] +[2023-10-08 16:43:24,107][21194] Updated weights for policy 1, policy_version 24930 (0.0008) +[2023-10-08 16:43:24,480][21194] Updated weights for policy 1, policy_version 24940 (0.0008) +[2023-10-08 16:43:24,852][21194] Updated weights for policy 1, policy_version 24950 (0.0009) +[2023-10-08 16:43:25,217][21194] Updated weights for policy 1, policy_version 24960 (0.0007) +[2023-10-08 16:43:26,711][21195] Updated weights for policy 0, policy_version 25130 (0.0007) +[2023-10-08 16:43:27,084][21195] Updated weights for policy 0, policy_version 25140 (0.0009) +[2023-10-08 16:43:27,467][21195] Updated weights for policy 0, policy_version 25150 (0.0008) +[2023-10-08 16:43:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 51314688. Throughput: 0: 1726.1, 1: 1745.3. Samples: 12838836. Policy #0 lag: (min: 10.0, avg: 10.1, max: 17.0) +[2023-10-08 16:43:28,803][19739] Avg episode reward: [(0, '654.540'), (1, '581.990')] +[2023-10-08 16:43:29,015][21194] Updated weights for policy 1, policy_version 24970 (0.0009) +[2023-10-08 16:43:29,378][21194] Updated weights for policy 1, policy_version 24980 (0.0008) +[2023-10-08 16:43:29,750][21194] Updated weights for policy 1, policy_version 24990 (0.0009) +[2023-10-08 16:43:31,399][21195] Updated weights for policy 0, policy_version 25160 (0.0008) +[2023-10-08 16:43:31,777][21195] Updated weights for policy 0, policy_version 25170 (0.0010) +[2023-10-08 16:43:32,143][21195] Updated weights for policy 0, policy_version 25180 (0.0009) +[2023-10-08 16:43:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 51380224. Throughput: 0: 1726.3, 1: 1711.8. Samples: 12854156. Policy #0 lag: (min: 10.0, avg: 10.1, max: 17.0) +[2023-10-08 16:43:33,804][19739] Avg episode reward: [(0, '654.540'), (1, '581.990')] +[2023-10-08 16:43:33,813][21194] Updated weights for policy 1, policy_version 25000 (0.0008) +[2023-10-08 16:43:34,187][21194] Updated weights for policy 1, policy_version 25010 (0.0007) +[2023-10-08 16:43:34,544][21194] Updated weights for policy 1, policy_version 25020 (0.0007) +[2023-10-08 16:43:36,062][21195] Updated weights for policy 0, policy_version 25190 (0.0008) +[2023-10-08 16:43:36,435][21195] Updated weights for policy 0, policy_version 25200 (0.0010) +[2023-10-08 16:43:36,809][21195] Updated weights for policy 0, policy_version 25210 (0.0008) +[2023-10-08 16:43:38,565][21194] Updated weights for policy 1, policy_version 25030 (0.0007) +[2023-10-08 16:43:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 51445760. Throughput: 0: 1731.2, 1: 1737.9. Samples: 12869992. Policy #0 lag: (min: 10.0, avg: 10.1, max: 17.0) +[2023-10-08 16:43:38,803][19739] Avg episode reward: [(0, '653.650'), (1, '581.990')] +[2023-10-08 16:43:38,928][21194] Updated weights for policy 1, policy_version 25040 (0.0008) +[2023-10-08 16:43:39,294][21194] Updated weights for policy 1, policy_version 25050 (0.0011) +[2023-10-08 16:43:40,813][21195] Updated weights for policy 0, policy_version 25220 (0.0009) +[2023-10-08 16:43:41,188][21195] Updated weights for policy 0, policy_version 25230 (0.0009) +[2023-10-08 16:43:41,556][21195] Updated weights for policy 0, policy_version 25240 (0.0008) +[2023-10-08 16:43:43,293][21194] Updated weights for policy 1, policy_version 25060 (0.0009) +[2023-10-08 16:43:43,662][21194] Updated weights for policy 1, policy_version 25070 (0.0009) +[2023-10-08 16:43:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 51511296. Throughput: 0: 1724.4, 1: 1744.2. Samples: 12891096. Policy #0 lag: (min: 25.0, avg: 28.1, max: 57.0) +[2023-10-08 16:43:43,803][19739] Avg episode reward: [(0, '650.950'), (1, '581.990')] +[2023-10-08 16:43:44,023][21194] Updated weights for policy 1, policy_version 25080 (0.0010) +[2023-10-08 16:43:45,115][21195] Updated weights for policy 0, policy_version 25250 (0.0010) +[2023-10-08 16:43:45,491][21195] Updated weights for policy 0, policy_version 25260 (0.0009) +[2023-10-08 16:43:45,857][21195] Updated weights for policy 0, policy_version 25270 (0.0010) +[2023-10-08 16:43:46,221][21195] Updated weights for policy 0, policy_version 25280 (0.0009) +[2023-10-08 16:43:47,970][21194] Updated weights for policy 1, policy_version 25090 (0.0010) +[2023-10-08 16:43:48,336][21194] Updated weights for policy 1, policy_version 25100 (0.0010) +[2023-10-08 16:43:48,705][21194] Updated weights for policy 1, policy_version 25110 (0.0009) +[2023-10-08 16:43:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 51576832. Throughput: 0: 1751.5, 1: 1725.1. Samples: 12906802. Policy #0 lag: (min: 25.0, avg: 28.1, max: 57.0) +[2023-10-08 16:43:48,803][19739] Avg episode reward: [(0, '662.410'), (1, '581.990')] +[2023-10-08 16:43:49,076][21194] Updated weights for policy 1, policy_version 25120 (0.0008) +[2023-10-08 16:43:50,124][21195] Updated weights for policy 0, policy_version 25290 (0.0009) +[2023-10-08 16:43:50,494][21195] Updated weights for policy 0, policy_version 25300 (0.0011) +[2023-10-08 16:43:50,858][21195] Updated weights for policy 0, policy_version 25310 (0.0010) +[2023-10-08 16:43:53,095][21194] Updated weights for policy 1, policy_version 25130 (0.0011) +[2023-10-08 16:43:53,457][21194] Updated weights for policy 1, policy_version 25140 (0.0009) +[2023-10-08 16:43:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 51642368. Throughput: 0: 1722.8, 1: 1733.3. Samples: 12922056. Policy #0 lag: (min: 25.0, avg: 28.1, max: 57.0) +[2023-10-08 16:43:53,803][19739] Avg episode reward: [(0, '662.410'), (1, '590.990')] +[2023-10-08 16:43:53,833][21194] Updated weights for policy 1, policy_version 25150 (0.0007) +[2023-10-08 16:43:54,808][21195] Updated weights for policy 0, policy_version 25320 (0.0009) +[2023-10-08 16:43:55,172][21195] Updated weights for policy 0, policy_version 25330 (0.0009) +[2023-10-08 16:43:55,540][21195] Updated weights for policy 0, policy_version 25340 (0.0009) +[2023-10-08 16:43:57,844][21194] Updated weights for policy 1, policy_version 25160 (0.0007) +[2023-10-08 16:43:58,218][21194] Updated weights for policy 1, policy_version 25170 (0.0008) +[2023-10-08 16:43:58,581][21194] Updated weights for policy 1, policy_version 25180 (0.0009) +[2023-10-08 16:43:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 51740672. Throughput: 0: 1738.0, 1: 1723.5. Samples: 12943008. Policy #0 lag: (min: 25.0, avg: 28.1, max: 57.0) +[2023-10-08 16:43:58,803][19739] Avg episode reward: [(0, '662.410'), (1, '590.990')] +[2023-10-08 16:43:59,426][21195] Updated weights for policy 0, policy_version 25350 (0.0008) +[2023-10-08 16:43:59,793][21195] Updated weights for policy 0, policy_version 25360 (0.0008) +[2023-10-08 16:44:00,161][21195] Updated weights for policy 0, policy_version 25370 (0.0009) +[2023-10-08 16:44:02,501][21194] Updated weights for policy 1, policy_version 25190 (0.0007) +[2023-10-08 16:44:02,860][21194] Updated weights for policy 1, policy_version 25200 (0.0010) +[2023-10-08 16:44:03,226][21194] Updated weights for policy 1, policy_version 25210 (0.0011) +[2023-10-08 16:44:03,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 51806208. Throughput: 0: 1754.5, 1: 1734.0. Samples: 12958876. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:44:03,803][19739] Avg episode reward: [(0, '676.790'), (1, '596.950')] +[2023-10-08 16:44:03,804][20740] Saving new best policy, reward=676.790! +[2023-10-08 16:44:04,161][21195] Updated weights for policy 0, policy_version 25380 (0.0007) +[2023-10-08 16:44:04,538][21195] Updated weights for policy 0, policy_version 25390 (0.0008) +[2023-10-08 16:44:04,908][21195] Updated weights for policy 0, policy_version 25400 (0.0009) +[2023-10-08 16:44:07,160][21194] Updated weights for policy 1, policy_version 25220 (0.0009) +[2023-10-08 16:44:07,530][21194] Updated weights for policy 1, policy_version 25230 (0.0007) +[2023-10-08 16:44:07,890][21194] Updated weights for policy 1, policy_version 25240 (0.0008) +[2023-10-08 16:44:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 51871744. Throughput: 0: 1724.4, 1: 1740.1. Samples: 12974240. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:44:08,803][19739] Avg episode reward: [(0, '692.890'), (1, '596.950')] +[2023-10-08 16:44:08,875][21195] Updated weights for policy 0, policy_version 25410 (0.0008) +[2023-10-08 16:44:09,251][21195] Updated weights for policy 0, policy_version 25420 (0.0010) +[2023-10-08 16:44:09,622][21195] Updated weights for policy 0, policy_version 25430 (0.0009) +[2023-10-08 16:44:09,989][20740] Saving new best policy, reward=692.890! +[2023-10-08 16:44:09,991][21195] Updated weights for policy 0, policy_version 25440 (0.0009) +[2023-10-08 16:44:11,905][21194] Updated weights for policy 1, policy_version 25250 (0.0009) +[2023-10-08 16:44:12,276][21194] Updated weights for policy 1, policy_version 25260 (0.0009) +[2023-10-08 16:44:12,646][21194] Updated weights for policy 1, policy_version 25270 (0.0008) +[2023-10-08 16:44:13,011][21194] Updated weights for policy 1, policy_version 25280 (0.0008) +[2023-10-08 16:44:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 51937280. Throughput: 0: 1751.0, 1: 1707.5. Samples: 12994470. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:44:13,804][19739] Avg episode reward: [(0, '678.390'), (1, '602.870')] +[2023-10-08 16:44:14,011][21195] Updated weights for policy 0, policy_version 25450 (0.0007) +[2023-10-08 16:44:14,375][21195] Updated weights for policy 0, policy_version 25460 (0.0009) +[2023-10-08 16:44:14,744][21195] Updated weights for policy 0, policy_version 25470 (0.0011) +[2023-10-08 16:44:16,895][21194] Updated weights for policy 1, policy_version 25290 (0.0007) +[2023-10-08 16:44:17,262][21194] Updated weights for policy 1, policy_version 25300 (0.0009) +[2023-10-08 16:44:17,626][21194] Updated weights for policy 1, policy_version 25310 (0.0008) +[2023-10-08 16:44:18,717][21195] Updated weights for policy 0, policy_version 25480 (0.0008) +[2023-10-08 16:44:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 52002816. Throughput: 0: 1738.5, 1: 1739.2. Samples: 13010652. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:44:18,804][19739] Avg episode reward: [(0, '670.970'), (1, '602.690')] +[2023-10-08 16:44:19,083][21195] Updated weights for policy 0, policy_version 25490 (0.0008) +[2023-10-08 16:44:19,451][21195] Updated weights for policy 0, policy_version 25500 (0.0009) +[2023-10-08 16:44:21,606][21194] Updated weights for policy 1, policy_version 25320 (0.0007) +[2023-10-08 16:44:21,975][21194] Updated weights for policy 1, policy_version 25330 (0.0008) +[2023-10-08 16:44:22,334][21194] Updated weights for policy 1, policy_version 25340 (0.0008) +[2023-10-08 16:44:23,534][21195] Updated weights for policy 0, policy_version 25510 (0.0008) +[2023-10-08 16:44:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 52068352. Throughput: 0: 1736.1, 1: 1720.1. Samples: 13025522. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:44:23,803][19739] Avg episode reward: [(0, '653.300'), (1, '602.690')] +[2023-10-08 16:44:23,899][21195] Updated weights for policy 0, policy_version 25520 (0.0009) +[2023-10-08 16:44:24,265][21195] Updated weights for policy 0, policy_version 25530 (0.0007) +[2023-10-08 16:44:26,342][21194] Updated weights for policy 1, policy_version 25350 (0.0009) +[2023-10-08 16:44:26,717][21194] Updated weights for policy 1, policy_version 25360 (0.0007) +[2023-10-08 16:44:27,081][21194] Updated weights for policy 1, policy_version 25370 (0.0007) +[2023-10-08 16:44:28,207][21195] Updated weights for policy 0, policy_version 25540 (0.0008) +[2023-10-08 16:44:28,581][21195] Updated weights for policy 0, policy_version 25550 (0.0007) +[2023-10-08 16:44:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 52133888. Throughput: 0: 1743.3, 1: 1704.7. Samples: 13046258. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:44:28,803][19739] Avg episode reward: [(0, '653.300'), (1, '602.690')] +[2023-10-08 16:44:28,954][21195] Updated weights for policy 0, policy_version 25560 (0.0007) +[2023-10-08 16:44:31,048][21194] Updated weights for policy 1, policy_version 25380 (0.0009) +[2023-10-08 16:44:31,417][21194] Updated weights for policy 1, policy_version 25390 (0.0009) +[2023-10-08 16:44:31,781][21194] Updated weights for policy 1, policy_version 25400 (0.0007) +[2023-10-08 16:44:32,834][21195] Updated weights for policy 0, policy_version 25570 (0.0008) +[2023-10-08 16:44:33,191][21195] Updated weights for policy 0, policy_version 25580 (0.0010) +[2023-10-08 16:44:33,564][21195] Updated weights for policy 0, policy_version 25590 (0.0010) +[2023-10-08 16:44:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 52199424. Throughput: 0: 1711.6, 1: 1730.4. Samples: 13061692. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 16:44:33,803][19739] Avg episode reward: [(0, '635.380'), (1, '614.030')] +[2023-10-08 16:44:33,933][21195] Updated weights for policy 0, policy_version 25600 (0.0010) +[2023-10-08 16:44:35,639][21194] Updated weights for policy 1, policy_version 25410 (0.0010) +[2023-10-08 16:44:36,014][21194] Updated weights for policy 1, policy_version 25420 (0.0007) +[2023-10-08 16:44:36,373][21194] Updated weights for policy 1, policy_version 25430 (0.0008) +[2023-10-08 16:44:36,733][21194] Updated weights for policy 1, policy_version 25440 (0.0008) +[2023-10-08 16:44:37,486][21195] Updated weights for policy 0, policy_version 25610 (0.0007) +[2023-10-08 16:44:37,853][21195] Updated weights for policy 0, policy_version 25620 (0.0008) +[2023-10-08 16:44:38,224][21195] Updated weights for policy 0, policy_version 25630 (0.0007) +[2023-10-08 16:44:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 52297728. Throughput: 0: 1743.6, 1: 1704.1. Samples: 13077204. Policy #0 lag: (min: 17.0, avg: 27.2, max: 49.0) +[2023-10-08 16:44:38,803][19739] Avg episode reward: [(0, '635.380'), (1, '614.030')] +[2023-10-08 16:44:40,585][21194] Updated weights for policy 1, policy_version 25450 (0.0010) +[2023-10-08 16:44:40,952][21194] Updated weights for policy 1, policy_version 25460 (0.0010) +[2023-10-08 16:44:41,318][21194] Updated weights for policy 1, policy_version 25470 (0.0009) +[2023-10-08 16:44:42,257][21195] Updated weights for policy 0, policy_version 25640 (0.0008) +[2023-10-08 16:44:42,629][21195] Updated weights for policy 0, policy_version 25650 (0.0007) +[2023-10-08 16:44:43,004][21195] Updated weights for policy 0, policy_version 25660 (0.0008) +[2023-10-08 16:44:43,803][19739] Fps is (10 sec: 16383.4, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 52363264. Throughput: 0: 1721.0, 1: 1717.6. Samples: 13097746. Policy #0 lag: (min: 17.0, avg: 27.2, max: 49.0) +[2023-10-08 16:44:43,804][19739] Avg episode reward: [(0, '635.380'), (1, '614.030')] +[2023-10-08 16:44:45,329][21194] Updated weights for policy 1, policy_version 25480 (0.0009) +[2023-10-08 16:44:45,691][21194] Updated weights for policy 1, policy_version 25490 (0.0010) +[2023-10-08 16:44:46,065][21194] Updated weights for policy 1, policy_version 25500 (0.0008) +[2023-10-08 16:44:46,944][21195] Updated weights for policy 0, policy_version 25670 (0.0007) +[2023-10-08 16:44:47,314][21195] Updated weights for policy 0, policy_version 25680 (0.0007) +[2023-10-08 16:44:47,694][21195] Updated weights for policy 0, policy_version 25690 (0.0007) +[2023-10-08 16:44:48,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 52428800. Throughput: 0: 1716.3, 1: 1710.8. Samples: 13113096. Policy #0 lag: (min: 17.0, avg: 27.2, max: 49.0) +[2023-10-08 16:44:48,803][19739] Avg episode reward: [(0, '641.180'), (1, '614.030')] +[2023-10-08 16:44:50,068][21194] Updated weights for policy 1, policy_version 25510 (0.0008) +[2023-10-08 16:44:50,429][21194] Updated weights for policy 1, policy_version 25520 (0.0011) +[2023-10-08 16:44:50,797][21194] Updated weights for policy 1, policy_version 25530 (0.0009) +[2023-10-08 16:44:51,549][21195] Updated weights for policy 0, policy_version 25700 (0.0007) +[2023-10-08 16:44:51,908][21195] Updated weights for policy 0, policy_version 25710 (0.0010) +[2023-10-08 16:44:52,280][21195] Updated weights for policy 0, policy_version 25720 (0.0008) +[2023-10-08 16:44:53,803][19739] Fps is (10 sec: 13107.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 52494336. Throughput: 0: 1741.6, 1: 1701.5. Samples: 13129180. Policy #0 lag: (min: 17.0, avg: 27.2, max: 49.0) +[2023-10-08 16:44:53,803][19739] Avg episode reward: [(0, '641.180'), (1, '625.150')] +[2023-10-08 16:44:54,598][21194] Updated weights for policy 1, policy_version 25540 (0.0010) +[2023-10-08 16:44:54,955][21194] Updated weights for policy 1, policy_version 25550 (0.0010) +[2023-10-08 16:44:55,320][21194] Updated weights for policy 1, policy_version 25560 (0.0009) +[2023-10-08 16:44:56,276][21195] Updated weights for policy 0, policy_version 25730 (0.0007) +[2023-10-08 16:44:56,658][21195] Updated weights for policy 0, policy_version 25740 (0.0007) +[2023-10-08 16:44:57,037][21195] Updated weights for policy 0, policy_version 25750 (0.0008) +[2023-10-08 16:44:57,400][21195] Updated weights for policy 0, policy_version 25760 (0.0008) +[2023-10-08 16:44:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 52559872. Throughput: 0: 1717.6, 1: 1736.0. Samples: 13149880. Policy #0 lag: (min: 17.0, avg: 24.3, max: 49.0) +[2023-10-08 16:44:58,803][19739] Avg episode reward: [(0, '641.180'), (1, '646.500')] +[2023-10-08 16:44:59,090][21194] Updated weights for policy 1, policy_version 25570 (0.0009) +[2023-10-08 16:44:59,454][21194] Updated weights for policy 1, policy_version 25580 (0.0011) +[2023-10-08 16:44:59,821][21194] Updated weights for policy 1, policy_version 25590 (0.0009) +[2023-10-08 16:45:00,184][21194] Updated weights for policy 1, policy_version 25600 (0.0008) +[2023-10-08 16:45:01,428][21195] Updated weights for policy 0, policy_version 25770 (0.0010) +[2023-10-08 16:45:01,801][21195] Updated weights for policy 0, policy_version 25780 (0.0009) +[2023-10-08 16:45:02,166][21195] Updated weights for policy 0, policy_version 25790 (0.0007) +[2023-10-08 16:45:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 52625408. Throughput: 0: 1731.6, 1: 1704.7. Samples: 13165282. Policy #0 lag: (min: 17.0, avg: 24.3, max: 49.0) +[2023-10-08 16:45:03,803][19739] Avg episode reward: [(0, '641.180'), (1, '646.820')] +[2023-10-08 16:45:04,221][21194] Updated weights for policy 1, policy_version 25610 (0.0008) +[2023-10-08 16:45:04,594][21194] Updated weights for policy 1, policy_version 25620 (0.0009) +[2023-10-08 16:45:04,957][21194] Updated weights for policy 1, policy_version 25630 (0.0009) +[2023-10-08 16:45:06,035][21195] Updated weights for policy 0, policy_version 25800 (0.0008) +[2023-10-08 16:45:06,409][21195] Updated weights for policy 0, policy_version 25810 (0.0007) +[2023-10-08 16:45:06,776][21195] Updated weights for policy 0, policy_version 25820 (0.0008) +[2023-10-08 16:45:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 52690944. Throughput: 0: 1732.6, 1: 1726.7. Samples: 13181190. Policy #0 lag: (min: 17.0, avg: 24.3, max: 49.0) +[2023-10-08 16:45:08,804][19739] Avg episode reward: [(0, '641.180'), (1, '647.390')] +[2023-10-08 16:45:09,023][21194] Updated weights for policy 1, policy_version 25640 (0.0009) +[2023-10-08 16:45:09,391][21194] Updated weights for policy 1, policy_version 25650 (0.0007) +[2023-10-08 16:45:09,765][21194] Updated weights for policy 1, policy_version 25660 (0.0007) +[2023-10-08 16:45:10,499][21195] Updated weights for policy 0, policy_version 25830 (0.0008) +[2023-10-08 16:45:10,866][21195] Updated weights for policy 0, policy_version 25840 (0.0010) +[2023-10-08 16:45:11,232][21195] Updated weights for policy 0, policy_version 25850 (0.0010) +[2023-10-08 16:45:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 52756480. Throughput: 0: 1729.7, 1: 1738.7. Samples: 13202336. Policy #0 lag: (min: 17.0, avg: 24.3, max: 49.0) +[2023-10-08 16:45:13,803][19739] Avg episode reward: [(0, '641.110'), (1, '647.630')] +[2023-10-08 16:45:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000025856_26476544.pth... +[2023-10-08 16:45:13,855][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000024224_24805376.pth +[2023-10-08 16:45:13,868][21194] Updated weights for policy 1, policy_version 25670 (0.0009) +[2023-10-08 16:45:14,253][21194] Updated weights for policy 1, policy_version 25680 (0.0009) +[2023-10-08 16:45:14,615][21194] Updated weights for policy 1, policy_version 25690 (0.0007) +[2023-10-08 16:45:14,835][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000025696_26312704.pth... +[2023-10-08 16:45:14,873][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000024064_24641536.pth +[2023-10-08 16:45:15,089][21195] Updated weights for policy 0, policy_version 25860 (0.0008) +[2023-10-08 16:45:15,464][21195] Updated weights for policy 0, policy_version 25870 (0.0009) +[2023-10-08 16:45:15,831][21195] Updated weights for policy 0, policy_version 25880 (0.0007) +[2023-10-08 16:45:18,487][21194] Updated weights for policy 1, policy_version 25700 (0.0007) +[2023-10-08 16:45:18,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 52822016. Throughput: 0: 1764.3, 1: 1710.1. Samples: 13218040. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:45:18,803][19739] Avg episode reward: [(0, '641.110'), (1, '647.630')] +[2023-10-08 16:45:18,862][21194] Updated weights for policy 1, policy_version 25710 (0.0007) +[2023-10-08 16:45:19,219][21194] Updated weights for policy 1, policy_version 25720 (0.0007) +[2023-10-08 16:45:19,600][21195] Updated weights for policy 0, policy_version 25890 (0.0008) +[2023-10-08 16:45:19,973][21195] Updated weights for policy 0, policy_version 25900 (0.0007) +[2023-10-08 16:45:20,351][21195] Updated weights for policy 0, policy_version 25910 (0.0009) +[2023-10-08 16:45:20,718][21195] Updated weights for policy 0, policy_version 25920 (0.0008) +[2023-10-08 16:45:23,085][21194] Updated weights for policy 1, policy_version 25730 (0.0009) +[2023-10-08 16:45:23,447][21194] Updated weights for policy 1, policy_version 25740 (0.0008) +[2023-10-08 16:45:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 52887552. Throughput: 0: 1732.2, 1: 1737.2. Samples: 13233326. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:45:23,804][19739] Avg episode reward: [(0, '631.140'), (1, '641.240')] +[2023-10-08 16:45:23,816][21194] Updated weights for policy 1, policy_version 25750 (0.0009) +[2023-10-08 16:45:24,180][21194] Updated weights for policy 1, policy_version 25760 (0.0011) +[2023-10-08 16:45:24,708][21195] Updated weights for policy 0, policy_version 25930 (0.0011) +[2023-10-08 16:45:25,077][21195] Updated weights for policy 0, policy_version 25940 (0.0007) +[2023-10-08 16:45:25,445][21195] Updated weights for policy 0, policy_version 25950 (0.0009) +[2023-10-08 16:45:28,237][21194] Updated weights for policy 1, policy_version 25770 (0.0010) +[2023-10-08 16:45:28,606][21194] Updated weights for policy 1, policy_version 25780 (0.0008) +[2023-10-08 16:45:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 52953088. Throughput: 0: 1750.5, 1: 1732.8. Samples: 13254490. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:45:28,803][19739] Avg episode reward: [(0, '631.140'), (1, '652.800')] +[2023-10-08 16:45:28,964][21194] Updated weights for policy 1, policy_version 25790 (0.0008) +[2023-10-08 16:45:29,385][21195] Updated weights for policy 0, policy_version 25960 (0.0008) +[2023-10-08 16:45:29,754][21195] Updated weights for policy 0, policy_version 25970 (0.0011) +[2023-10-08 16:45:30,124][21195] Updated weights for policy 0, policy_version 25980 (0.0007) +[2023-10-08 16:45:32,855][21194] Updated weights for policy 1, policy_version 25800 (0.0008) +[2023-10-08 16:45:33,223][21194] Updated weights for policy 1, policy_version 25810 (0.0008) +[2023-10-08 16:45:33,589][21194] Updated weights for policy 1, policy_version 25820 (0.0009) +[2023-10-08 16:45:33,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 53051392. Throughput: 0: 1756.7, 1: 1733.2. Samples: 13270138. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 16:45:33,803][19739] Avg episode reward: [(0, '629.870'), (1, '644.000')] +[2023-10-08 16:45:34,017][21195] Updated weights for policy 0, policy_version 25990 (0.0008) +[2023-10-08 16:45:34,387][21195] Updated weights for policy 0, policy_version 26000 (0.0008) +[2023-10-08 16:45:34,762][21195] Updated weights for policy 0, policy_version 26010 (0.0009) +[2023-10-08 16:45:37,513][21194] Updated weights for policy 1, policy_version 25830 (0.0009) +[2023-10-08 16:45:37,881][21194] Updated weights for policy 1, policy_version 25840 (0.0007) +[2023-10-08 16:45:38,249][21194] Updated weights for policy 1, policy_version 25850 (0.0010) +[2023-10-08 16:45:38,645][21195] Updated weights for policy 0, policy_version 26020 (0.0009) +[2023-10-08 16:45:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 53116928. Throughput: 0: 1734.0, 1: 1740.0. Samples: 13285512. Policy #0 lag: (min: 1.0, avg: 15.5, max: 33.0) +[2023-10-08 16:45:38,805][19739] Avg episode reward: [(0, '629.870'), (1, '644.000')] +[2023-10-08 16:45:39,017][21195] Updated weights for policy 0, policy_version 26030 (0.0009) +[2023-10-08 16:45:39,395][21195] Updated weights for policy 0, policy_version 26040 (0.0008) +[2023-10-08 16:45:42,069][21194] Updated weights for policy 1, policy_version 25860 (0.0008) +[2023-10-08 16:45:42,431][21194] Updated weights for policy 1, policy_version 25870 (0.0007) +[2023-10-08 16:45:42,798][21194] Updated weights for policy 1, policy_version 25880 (0.0009) +[2023-10-08 16:45:43,325][21195] Updated weights for policy 0, policy_version 26050 (0.0009) +[2023-10-08 16:45:43,696][21195] Updated weights for policy 0, policy_version 26060 (0.0007) +[2023-10-08 16:45:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 53182464. Throughput: 0: 1758.3, 1: 1709.3. Samples: 13305922. Policy #0 lag: (min: 1.0, avg: 15.5, max: 33.0) +[2023-10-08 16:45:43,803][19739] Avg episode reward: [(0, '627.790'), (1, '644.000')] +[2023-10-08 16:45:44,073][21195] Updated weights for policy 0, policy_version 26070 (0.0010) +[2023-10-08 16:45:44,436][21195] Updated weights for policy 0, policy_version 26080 (0.0010) +[2023-10-08 16:45:46,811][21194] Updated weights for policy 1, policy_version 25890 (0.0009) +[2023-10-08 16:45:47,178][21194] Updated weights for policy 1, policy_version 25900 (0.0009) +[2023-10-08 16:45:47,555][21194] Updated weights for policy 1, policy_version 25910 (0.0011) +[2023-10-08 16:45:47,919][21194] Updated weights for policy 1, policy_version 25920 (0.0007) +[2023-10-08 16:45:48,236][21195] Updated weights for policy 0, policy_version 26090 (0.0008) +[2023-10-08 16:45:48,605][21195] Updated weights for policy 0, policy_version 26100 (0.0007) +[2023-10-08 16:45:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 53248000. Throughput: 0: 1734.6, 1: 1738.4. Samples: 13321564. Policy #0 lag: (min: 1.0, avg: 15.5, max: 33.0) +[2023-10-08 16:45:48,803][19739] Avg episode reward: [(0, '627.790'), (1, '644.000')] +[2023-10-08 16:45:48,976][21195] Updated weights for policy 0, policy_version 26110 (0.0007) +[2023-10-08 16:45:51,947][21194] Updated weights for policy 1, policy_version 25930 (0.0010) +[2023-10-08 16:45:52,310][21194] Updated weights for policy 1, policy_version 25940 (0.0008) +[2023-10-08 16:45:52,674][21194] Updated weights for policy 1, policy_version 25950 (0.0009) +[2023-10-08 16:45:52,897][21195] Updated weights for policy 0, policy_version 26120 (0.0008) +[2023-10-08 16:45:53,274][21195] Updated weights for policy 0, policy_version 26130 (0.0008) +[2023-10-08 16:45:53,643][21195] Updated weights for policy 0, policy_version 26140 (0.0009) +[2023-10-08 16:45:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 53346304. Throughput: 0: 1749.8, 1: 1716.9. Samples: 13337192. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:45:53,803][19739] Avg episode reward: [(0, '627.790'), (1, '644.940')] +[2023-10-08 16:45:56,608][21194] Updated weights for policy 1, policy_version 25960 (0.0008) +[2023-10-08 16:45:56,980][21194] Updated weights for policy 1, policy_version 25970 (0.0007) +[2023-10-08 16:45:57,340][21194] Updated weights for policy 1, policy_version 25980 (0.0008) +[2023-10-08 16:45:57,410][21195] Updated weights for policy 0, policy_version 26150 (0.0009) +[2023-10-08 16:45:57,785][21195] Updated weights for policy 0, policy_version 26160 (0.0009) +[2023-10-08 16:45:58,152][21195] Updated weights for policy 0, policy_version 26170 (0.0008) +[2023-10-08 16:45:58,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 53411840. Throughput: 0: 1748.3, 1: 1703.7. Samples: 13357676. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:45:58,803][19739] Avg episode reward: [(0, '627.790'), (1, '659.780')] +[2023-10-08 16:46:01,436][21194] Updated weights for policy 1, policy_version 25990 (0.0009) +[2023-10-08 16:46:01,820][21194] Updated weights for policy 1, policy_version 26000 (0.0010) +[2023-10-08 16:46:02,056][21195] Updated weights for policy 0, policy_version 26180 (0.0008) +[2023-10-08 16:46:02,186][21194] Updated weights for policy 1, policy_version 26010 (0.0008) +[2023-10-08 16:46:02,432][21195] Updated weights for policy 0, policy_version 26190 (0.0008) +[2023-10-08 16:46:02,797][21195] Updated weights for policy 0, policy_version 26200 (0.0007) +[2023-10-08 16:46:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 53477376. Throughput: 0: 1726.3, 1: 1732.2. Samples: 13373670. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:46:03,804][19739] Avg episode reward: [(0, '627.790'), (1, '659.780')] +[2023-10-08 16:46:06,277][21194] Updated weights for policy 1, policy_version 26020 (0.0007) +[2023-10-08 16:46:06,644][21194] Updated weights for policy 1, policy_version 26030 (0.0008) +[2023-10-08 16:46:06,671][21195] Updated weights for policy 0, policy_version 26210 (0.0007) +[2023-10-08 16:46:07,003][21194] Updated weights for policy 1, policy_version 26040 (0.0008) +[2023-10-08 16:46:07,035][21195] Updated weights for policy 0, policy_version 26220 (0.0008) +[2023-10-08 16:46:07,410][21195] Updated weights for policy 0, policy_version 26230 (0.0007) +[2023-10-08 16:46:07,784][21195] Updated weights for policy 0, policy_version 26240 (0.0007) +[2023-10-08 16:46:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 53542912. Throughput: 0: 1754.8, 1: 1701.7. Samples: 13388868. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:46:08,803][19739] Avg episode reward: [(0, '627.790'), (1, '659.780')] +[2023-10-08 16:46:11,077][21194] Updated weights for policy 1, policy_version 26050 (0.0007) +[2023-10-08 16:46:11,441][21194] Updated weights for policy 1, policy_version 26060 (0.0007) +[2023-10-08 16:46:11,802][21194] Updated weights for policy 1, policy_version 26070 (0.0007) +[2023-10-08 16:46:11,851][21195] Updated weights for policy 0, policy_version 26250 (0.0008) +[2023-10-08 16:46:12,170][21194] Updated weights for policy 1, policy_version 26080 (0.0007) +[2023-10-08 16:46:12,212][21195] Updated weights for policy 0, policy_version 26260 (0.0009) +[2023-10-08 16:46:12,591][21195] Updated weights for policy 0, policy_version 26270 (0.0008) +[2023-10-08 16:46:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 53608448. Throughput: 0: 1723.5, 1: 1698.6. Samples: 13408484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:13,804][19739] Avg episode reward: [(0, '627.790'), (1, '659.780')] +[2023-10-08 16:46:16,192][21194] Updated weights for policy 1, policy_version 26090 (0.0007) +[2023-10-08 16:46:16,465][21195] Updated weights for policy 0, policy_version 26280 (0.0008) +[2023-10-08 16:46:16,557][21194] Updated weights for policy 1, policy_version 26100 (0.0009) +[2023-10-08 16:46:16,838][21195] Updated weights for policy 0, policy_version 26290 (0.0008) +[2023-10-08 16:46:16,917][21194] Updated weights for policy 1, policy_version 26110 (0.0009) +[2023-10-08 16:46:17,211][21195] Updated weights for policy 0, policy_version 26300 (0.0008) +[2023-10-08 16:46:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 53673984. Throughput: 0: 1726.8, 1: 1713.9. Samples: 13424972. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:18,803][19739] Avg episode reward: [(0, '615.100'), (1, '659.780')] +[2023-10-08 16:46:20,927][21194] Updated weights for policy 1, policy_version 26120 (0.0010) +[2023-10-08 16:46:21,058][21195] Updated weights for policy 0, policy_version 26310 (0.0008) +[2023-10-08 16:46:21,290][21194] Updated weights for policy 1, policy_version 26130 (0.0009) +[2023-10-08 16:46:21,425][21195] Updated weights for policy 0, policy_version 26320 (0.0007) +[2023-10-08 16:46:21,654][21194] Updated weights for policy 1, policy_version 26140 (0.0008) +[2023-10-08 16:46:21,794][21195] Updated weights for policy 0, policy_version 26330 (0.0008) +[2023-10-08 16:46:23,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 53739520. Throughput: 0: 1733.6, 1: 1685.1. Samples: 13439350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:23,803][19739] Avg episode reward: [(0, '615.100'), (1, '659.780')] +[2023-10-08 16:46:25,412][21194] Updated weights for policy 1, policy_version 26150 (0.0010) +[2023-10-08 16:46:25,769][21194] Updated weights for policy 1, policy_version 26160 (0.0011) +[2023-10-08 16:46:25,911][21195] Updated weights for policy 0, policy_version 26340 (0.0010) +[2023-10-08 16:46:26,132][21194] Updated weights for policy 1, policy_version 26170 (0.0008) +[2023-10-08 16:46:26,280][21195] Updated weights for policy 0, policy_version 26350 (0.0008) +[2023-10-08 16:46:26,654][21195] Updated weights for policy 0, policy_version 26360 (0.0010) +[2023-10-08 16:46:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 53805056. Throughput: 0: 1717.8, 1: 1715.6. Samples: 13460424. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:28,803][19739] Avg episode reward: [(0, '615.100'), (1, '658.270')] +[2023-10-08 16:46:30,196][21194] Updated weights for policy 1, policy_version 26180 (0.0008) +[2023-10-08 16:46:30,538][21195] Updated weights for policy 0, policy_version 26370 (0.0010) +[2023-10-08 16:46:30,569][21194] Updated weights for policy 1, policy_version 26190 (0.0008) +[2023-10-08 16:46:30,909][21195] Updated weights for policy 0, policy_version 26380 (0.0009) +[2023-10-08 16:46:30,931][21194] Updated weights for policy 1, policy_version 26200 (0.0008) +[2023-10-08 16:46:31,283][21195] Updated weights for policy 0, policy_version 26390 (0.0008) +[2023-10-08 16:46:31,652][21195] Updated weights for policy 0, policy_version 26400 (0.0008) +[2023-10-08 16:46:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 53870592. Throughput: 0: 1738.2, 1: 1692.1. Samples: 13475928. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:33,803][19739] Avg episode reward: [(0, '613.950'), (1, '652.770')] +[2023-10-08 16:46:34,935][21194] Updated weights for policy 1, policy_version 26210 (0.0008) +[2023-10-08 16:46:35,300][21194] Updated weights for policy 1, policy_version 26220 (0.0008) +[2023-10-08 16:46:35,671][21194] Updated weights for policy 1, policy_version 26230 (0.0008) +[2023-10-08 16:46:35,702][21195] Updated weights for policy 0, policy_version 26410 (0.0008) +[2023-10-08 16:46:36,031][21194] Updated weights for policy 1, policy_version 26240 (0.0007) +[2023-10-08 16:46:36,067][21195] Updated weights for policy 0, policy_version 26420 (0.0008) +[2023-10-08 16:46:36,445][21195] Updated weights for policy 0, policy_version 26430 (0.0007) +[2023-10-08 16:46:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 53936128. Throughput: 0: 1714.4, 1: 1700.6. Samples: 13490864. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:38,803][19739] Avg episode reward: [(0, '613.950'), (1, '667.050')] +[2023-10-08 16:46:39,977][21194] Updated weights for policy 1, policy_version 26250 (0.0007) +[2023-10-08 16:46:40,320][21195] Updated weights for policy 0, policy_version 26440 (0.0007) +[2023-10-08 16:46:40,354][21194] Updated weights for policy 1, policy_version 26260 (0.0008) +[2023-10-08 16:46:40,679][21195] Updated weights for policy 0, policy_version 26450 (0.0009) +[2023-10-08 16:46:40,720][21194] Updated weights for policy 1, policy_version 26270 (0.0008) +[2023-10-08 16:46:41,050][21195] Updated weights for policy 0, policy_version 26460 (0.0010) +[2023-10-08 16:46:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 54001664. Throughput: 0: 1720.5, 1: 1722.8. Samples: 13512626. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:43,803][19739] Avg episode reward: [(0, '613.950'), (1, '667.050')] +[2023-10-08 16:46:44,543][21194] Updated weights for policy 1, policy_version 26280 (0.0009) +[2023-10-08 16:46:44,911][21194] Updated weights for policy 1, policy_version 26290 (0.0009) +[2023-10-08 16:46:44,924][21195] Updated weights for policy 0, policy_version 26470 (0.0009) +[2023-10-08 16:46:45,276][21194] Updated weights for policy 1, policy_version 26300 (0.0009) +[2023-10-08 16:46:45,291][21195] Updated weights for policy 0, policy_version 26480 (0.0008) +[2023-10-08 16:46:45,657][21195] Updated weights for policy 0, policy_version 26490 (0.0009) +[2023-10-08 16:46:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 54067200. Throughput: 0: 1734.1, 1: 1695.5. Samples: 13528004. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:46:48,803][19739] Avg episode reward: [(0, '628.400'), (1, '671.080')] +[2023-10-08 16:46:49,321][21194] Updated weights for policy 1, policy_version 26310 (0.0008) +[2023-10-08 16:46:49,660][21195] Updated weights for policy 0, policy_version 26500 (0.0008) +[2023-10-08 16:46:49,681][21194] Updated weights for policy 1, policy_version 26320 (0.0010) +[2023-10-08 16:46:50,028][21195] Updated weights for policy 0, policy_version 26510 (0.0008) +[2023-10-08 16:46:50,043][21194] Updated weights for policy 1, policy_version 26330 (0.0007) +[2023-10-08 16:46:50,388][21195] Updated weights for policy 0, policy_version 26520 (0.0007) +[2023-10-08 16:46:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 54132736. Throughput: 0: 1705.2, 1: 1720.9. Samples: 13543040. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 16:46:53,803][19739] Avg episode reward: [(0, '628.400'), (1, '671.080')] +[2023-10-08 16:46:53,969][21194] Updated weights for policy 1, policy_version 26340 (0.0007) +[2023-10-08 16:46:54,339][21194] Updated weights for policy 1, policy_version 26350 (0.0007) +[2023-10-08 16:46:54,466][21195] Updated weights for policy 0, policy_version 26530 (0.0009) +[2023-10-08 16:46:54,709][21194] Updated weights for policy 1, policy_version 26360 (0.0007) +[2023-10-08 16:46:54,835][21195] Updated weights for policy 0, policy_version 26540 (0.0007) +[2023-10-08 16:46:55,205][21195] Updated weights for policy 0, policy_version 26550 (0.0007) +[2023-10-08 16:46:55,574][21195] Updated weights for policy 0, policy_version 26560 (0.0008) +[2023-10-08 16:46:58,637][21194] Updated weights for policy 1, policy_version 26370 (0.0007) +[2023-10-08 16:46:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 54198272. Throughput: 0: 1741.8, 1: 1724.2. Samples: 13564454. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 16:46:58,803][19739] Avg episode reward: [(0, '628.400'), (1, '671.080')] +[2023-10-08 16:46:58,999][21194] Updated weights for policy 1, policy_version 26380 (0.0008) +[2023-10-08 16:46:59,334][21195] Updated weights for policy 0, policy_version 26570 (0.0008) +[2023-10-08 16:46:59,365][21194] Updated weights for policy 1, policy_version 26390 (0.0008) +[2023-10-08 16:46:59,706][21195] Updated weights for policy 0, policy_version 26580 (0.0007) +[2023-10-08 16:46:59,726][21194] Updated weights for policy 1, policy_version 26400 (0.0007) +[2023-10-08 16:47:00,078][21195] Updated weights for policy 0, policy_version 26590 (0.0007) +[2023-10-08 16:47:03,744][21194] Updated weights for policy 1, policy_version 26410 (0.0009) +[2023-10-08 16:47:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 54263808. Throughput: 0: 1733.6, 1: 1704.4. Samples: 13579684. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 16:47:03,803][19739] Avg episode reward: [(0, '628.400'), (1, '671.080')] +[2023-10-08 16:47:04,112][21194] Updated weights for policy 1, policy_version 26420 (0.0008) +[2023-10-08 16:47:04,122][21195] Updated weights for policy 0, policy_version 26600 (0.0009) +[2023-10-08 16:47:04,474][21194] Updated weights for policy 1, policy_version 26430 (0.0008) +[2023-10-08 16:47:04,493][21195] Updated weights for policy 0, policy_version 26610 (0.0007) +[2023-10-08 16:47:04,867][21195] Updated weights for policy 0, policy_version 26620 (0.0011) +[2023-10-08 16:47:08,465][21194] Updated weights for policy 1, policy_version 26440 (0.0007) +[2023-10-08 16:47:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 54329344. Throughput: 0: 1727.3, 1: 1726.9. Samples: 13594792. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 16:47:08,803][19739] Avg episode reward: [(0, '641.830'), (1, '662.340')] +[2023-10-08 16:47:08,839][21194] Updated weights for policy 1, policy_version 26450 (0.0008) +[2023-10-08 16:47:08,919][21195] Updated weights for policy 0, policy_version 26630 (0.0007) +[2023-10-08 16:47:09,202][21194] Updated weights for policy 1, policy_version 26460 (0.0008) +[2023-10-08 16:47:09,282][21195] Updated weights for policy 0, policy_version 26640 (0.0007) +[2023-10-08 16:47:09,664][21195] Updated weights for policy 0, policy_version 26650 (0.0008) +[2023-10-08 16:47:13,179][21194] Updated weights for policy 1, policy_version 26470 (0.0010) +[2023-10-08 16:47:13,508][21195] Updated weights for policy 0, policy_version 26660 (0.0008) +[2023-10-08 16:47:13,544][21194] Updated weights for policy 1, policy_version 26480 (0.0008) +[2023-10-08 16:47:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 54394880. Throughput: 0: 1738.1, 1: 1719.7. Samples: 13616024. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:47:13,803][19739] Avg episode reward: [(0, '641.830'), (1, '662.340')] +[2023-10-08 16:47:13,883][21195] Updated weights for policy 0, policy_version 26670 (0.0008) +[2023-10-08 16:47:13,903][21194] Updated weights for policy 1, policy_version 26490 (0.0008) +[2023-10-08 16:47:14,120][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000026496_27131904.pth... +[2023-10-08 16:47:14,148][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000024864_25460736.pth +[2023-10-08 16:47:14,242][21195] Updated weights for policy 0, policy_version 26680 (0.0008) +[2023-10-08 16:47:14,538][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000026688_27328512.pth... +[2023-10-08 16:47:14,567][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000025056_25657344.pth +[2023-10-08 16:47:17,783][21194] Updated weights for policy 1, policy_version 26500 (0.0009) +[2023-10-08 16:47:18,152][21194] Updated weights for policy 1, policy_version 26510 (0.0010) +[2023-10-08 16:47:18,225][21195] Updated weights for policy 0, policy_version 26690 (0.0010) +[2023-10-08 16:47:18,514][21194] Updated weights for policy 1, policy_version 26520 (0.0008) +[2023-10-08 16:47:18,594][21195] Updated weights for policy 0, policy_version 26700 (0.0007) +[2023-10-08 16:47:18,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 54493184. Throughput: 0: 1719.9, 1: 1718.8. Samples: 13630668. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:47:18,803][19739] Avg episode reward: [(0, '636.520'), (1, '662.340')] +[2023-10-08 16:47:18,965][21195] Updated weights for policy 0, policy_version 26710 (0.0009) +[2023-10-08 16:47:19,334][21195] Updated weights for policy 0, policy_version 26720 (0.0008) +[2023-10-08 16:47:22,631][21194] Updated weights for policy 1, policy_version 26530 (0.0007) +[2023-10-08 16:47:22,994][21194] Updated weights for policy 1, policy_version 26540 (0.0008) +[2023-10-08 16:47:23,356][21194] Updated weights for policy 1, policy_version 26550 (0.0009) +[2023-10-08 16:47:23,418][21195] Updated weights for policy 0, policy_version 26730 (0.0008) +[2023-10-08 16:47:23,727][21194] Updated weights for policy 1, policy_version 26560 (0.0008) +[2023-10-08 16:47:23,793][21195] Updated weights for policy 0, policy_version 26740 (0.0008) +[2023-10-08 16:47:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 54558720. Throughput: 0: 1733.2, 1: 1726.0. Samples: 13646526. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:47:23,803][19739] Avg episode reward: [(0, '636.360'), (1, '662.340')] +[2023-10-08 16:47:24,161][21195] Updated weights for policy 0, policy_version 26750 (0.0008) +[2023-10-08 16:47:27,786][21194] Updated weights for policy 1, policy_version 26570 (0.0007) +[2023-10-08 16:47:28,047][21195] Updated weights for policy 0, policy_version 26760 (0.0009) +[2023-10-08 16:47:28,153][21194] Updated weights for policy 1, policy_version 26580 (0.0007) +[2023-10-08 16:47:28,417][21195] Updated weights for policy 0, policy_version 26770 (0.0008) +[2023-10-08 16:47:28,512][21194] Updated weights for policy 1, policy_version 26590 (0.0007) +[2023-10-08 16:47:28,791][21195] Updated weights for policy 0, policy_version 26780 (0.0007) +[2023-10-08 16:47:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 54624256. Throughput: 0: 1727.2, 1: 1705.4. Samples: 13667092. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:47:28,804][19739] Avg episode reward: [(0, '636.360'), (1, '662.340')] +[2023-10-08 16:47:32,292][21194] Updated weights for policy 1, policy_version 26600 (0.0008) +[2023-10-08 16:47:32,658][21195] Updated weights for policy 0, policy_version 26790 (0.0008) +[2023-10-08 16:47:32,660][21194] Updated weights for policy 1, policy_version 26610 (0.0007) +[2023-10-08 16:47:33,019][21194] Updated weights for policy 1, policy_version 26620 (0.0007) +[2023-10-08 16:47:33,024][21195] Updated weights for policy 0, policy_version 26800 (0.0008) +[2023-10-08 16:47:33,394][21195] Updated weights for policy 0, policy_version 26810 (0.0007) +[2023-10-08 16:47:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 54722560. Throughput: 0: 1696.7, 1: 1721.2. Samples: 13681812. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:47:33,803][19739] Avg episode reward: [(0, '636.360'), (1, '662.340')] +[2023-10-08 16:47:37,055][21194] Updated weights for policy 1, policy_version 26630 (0.0010) +[2023-10-08 16:47:37,248][21195] Updated weights for policy 0, policy_version 26820 (0.0007) +[2023-10-08 16:47:37,431][21194] Updated weights for policy 1, policy_version 26640 (0.0010) +[2023-10-08 16:47:37,618][21195] Updated weights for policy 0, policy_version 26830 (0.0007) +[2023-10-08 16:47:37,803][21194] Updated weights for policy 1, policy_version 26650 (0.0008) +[2023-10-08 16:47:37,989][21195] Updated weights for policy 0, policy_version 26840 (0.0007) +[2023-10-08 16:47:38,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 54788096. Throughput: 0: 1726.5, 1: 1718.8. Samples: 13698078. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:47:38,803][19739] Avg episode reward: [(0, '636.360'), (1, '662.340')] +[2023-10-08 16:47:41,778][21194] Updated weights for policy 1, policy_version 26660 (0.0009) +[2023-10-08 16:47:42,013][21195] Updated weights for policy 0, policy_version 26850 (0.0010) +[2023-10-08 16:47:42,148][21194] Updated weights for policy 1, policy_version 26670 (0.0007) +[2023-10-08 16:47:42,389][21195] Updated weights for policy 0, policy_version 26860 (0.0009) +[2023-10-08 16:47:42,513][21194] Updated weights for policy 1, policy_version 26680 (0.0007) +[2023-10-08 16:47:42,750][21195] Updated weights for policy 0, policy_version 26870 (0.0007) +[2023-10-08 16:47:43,120][21195] Updated weights for policy 0, policy_version 26880 (0.0007) +[2023-10-08 16:47:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 54853632. Throughput: 0: 1701.4, 1: 1700.1. Samples: 13717524. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 16:47:43,803][19739] Avg episode reward: [(0, '636.360'), (1, '662.340')] +[2023-10-08 16:47:46,476][21194] Updated weights for policy 1, policy_version 26690 (0.0008) +[2023-10-08 16:47:46,841][21194] Updated weights for policy 1, policy_version 26700 (0.0007) +[2023-10-08 16:47:47,032][21195] Updated weights for policy 0, policy_version 26890 (0.0007) +[2023-10-08 16:47:47,202][21194] Updated weights for policy 1, policy_version 26710 (0.0007) +[2023-10-08 16:47:47,400][21195] Updated weights for policy 0, policy_version 26900 (0.0008) +[2023-10-08 16:47:47,567][21194] Updated weights for policy 1, policy_version 26720 (0.0007) +[2023-10-08 16:47:47,769][21195] Updated weights for policy 0, policy_version 26910 (0.0009) +[2023-10-08 16:47:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 54919168. Throughput: 0: 1696.1, 1: 1728.7. Samples: 13733800. Policy #0 lag: (min: 24.0, avg: 48.8, max: 56.0) +[2023-10-08 16:47:48,803][19739] Avg episode reward: [(0, '642.420'), (1, '662.340')] +[2023-10-08 16:47:51,569][21194] Updated weights for policy 1, policy_version 26730 (0.0007) +[2023-10-08 16:47:51,754][21195] Updated weights for policy 0, policy_version 26920 (0.0008) +[2023-10-08 16:47:51,937][21194] Updated weights for policy 1, policy_version 26740 (0.0008) +[2023-10-08 16:47:52,132][21195] Updated weights for policy 0, policy_version 26930 (0.0007) +[2023-10-08 16:47:52,306][21194] Updated weights for policy 1, policy_version 26750 (0.0008) +[2023-10-08 16:47:52,499][21195] Updated weights for policy 0, policy_version 26940 (0.0008) +[2023-10-08 16:47:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 54984704. Throughput: 0: 1716.4, 1: 1715.8. Samples: 13749240. Policy #0 lag: (min: 24.0, avg: 48.8, max: 56.0) +[2023-10-08 16:47:53,803][19739] Avg episode reward: [(0, '629.690'), (1, '662.340')] +[2023-10-08 16:47:56,186][21194] Updated weights for policy 1, policy_version 26760 (0.0008) +[2023-10-08 16:47:56,475][21195] Updated weights for policy 0, policy_version 26950 (0.0007) +[2023-10-08 16:47:56,559][21194] Updated weights for policy 1, policy_version 26770 (0.0007) +[2023-10-08 16:47:56,849][21195] Updated weights for policy 0, policy_version 26960 (0.0008) +[2023-10-08 16:47:56,923][21194] Updated weights for policy 1, policy_version 26780 (0.0008) +[2023-10-08 16:47:57,218][21195] Updated weights for policy 0, policy_version 26970 (0.0007) +[2023-10-08 16:47:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 55050240. Throughput: 0: 1696.4, 1: 1704.5. Samples: 13769064. Policy #0 lag: (min: 24.0, avg: 48.8, max: 56.0) +[2023-10-08 16:47:58,803][19739] Avg episode reward: [(0, '630.050'), (1, '662.340')] +[2023-10-08 16:48:01,014][21194] Updated weights for policy 1, policy_version 26790 (0.0007) +[2023-10-08 16:48:01,160][21195] Updated weights for policy 0, policy_version 26980 (0.0009) +[2023-10-08 16:48:01,388][21194] Updated weights for policy 1, policy_version 26800 (0.0007) +[2023-10-08 16:48:01,521][21195] Updated weights for policy 0, policy_version 26990 (0.0007) +[2023-10-08 16:48:01,747][21194] Updated weights for policy 1, policy_version 26810 (0.0008) +[2023-10-08 16:48:01,908][21195] Updated weights for policy 0, policy_version 27000 (0.0008) +[2023-10-08 16:48:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 55115776. Throughput: 0: 1713.7, 1: 1718.8. Samples: 13785128. Policy #0 lag: (min: 24.0, avg: 48.8, max: 56.0) +[2023-10-08 16:48:03,803][19739] Avg episode reward: [(0, '630.050'), (1, '656.840')] +[2023-10-08 16:48:05,774][21194] Updated weights for policy 1, policy_version 26820 (0.0008) +[2023-10-08 16:48:05,882][21195] Updated weights for policy 0, policy_version 27010 (0.0009) +[2023-10-08 16:48:06,136][21194] Updated weights for policy 1, policy_version 26830 (0.0007) +[2023-10-08 16:48:06,252][21195] Updated weights for policy 0, policy_version 27020 (0.0009) +[2023-10-08 16:48:06,503][21194] Updated weights for policy 1, policy_version 26840 (0.0007) +[2023-10-08 16:48:06,628][21195] Updated weights for policy 0, policy_version 27030 (0.0008) +[2023-10-08 16:48:06,998][21195] Updated weights for policy 0, policy_version 27040 (0.0011) +[2023-10-08 16:48:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 55181312. Throughput: 0: 1705.1, 1: 1692.4. Samples: 13799412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:08,803][19739] Avg episode reward: [(0, '643.390'), (1, '673.860')] +[2023-10-08 16:48:10,518][21194] Updated weights for policy 1, policy_version 26850 (0.0008) +[2023-10-08 16:48:10,884][21194] Updated weights for policy 1, policy_version 26860 (0.0008) +[2023-10-08 16:48:11,063][21195] Updated weights for policy 0, policy_version 27050 (0.0007) +[2023-10-08 16:48:11,254][21194] Updated weights for policy 1, policy_version 26870 (0.0008) +[2023-10-08 16:48:11,438][21195] Updated weights for policy 0, policy_version 27060 (0.0007) +[2023-10-08 16:48:11,614][21194] Updated weights for policy 1, policy_version 26880 (0.0009) +[2023-10-08 16:48:11,806][21195] Updated weights for policy 0, policy_version 27070 (0.0008) +[2023-10-08 16:48:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 55246848. Throughput: 0: 1703.2, 1: 1704.3. Samples: 13820430. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:13,804][19739] Avg episode reward: [(0, '644.080'), (1, '673.860')] +[2023-10-08 16:48:15,633][21194] Updated weights for policy 1, policy_version 26890 (0.0008) +[2023-10-08 16:48:15,813][21195] Updated weights for policy 0, policy_version 27080 (0.0007) +[2023-10-08 16:48:16,004][21194] Updated weights for policy 1, policy_version 26900 (0.0008) +[2023-10-08 16:48:16,176][21195] Updated weights for policy 0, policy_version 27090 (0.0007) +[2023-10-08 16:48:16,379][21194] Updated weights for policy 1, policy_version 26910 (0.0007) +[2023-10-08 16:48:16,543][21195] Updated weights for policy 0, policy_version 27100 (0.0008) +[2023-10-08 16:48:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 55312384. Throughput: 0: 1735.2, 1: 1702.1. Samples: 13836488. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:18,803][19739] Avg episode reward: [(0, '644.080'), (1, '673.860')] +[2023-10-08 16:48:20,381][21195] Updated weights for policy 0, policy_version 27110 (0.0007) +[2023-10-08 16:48:20,443][21194] Updated weights for policy 1, policy_version 26920 (0.0008) +[2023-10-08 16:48:20,748][21195] Updated weights for policy 0, policy_version 27120 (0.0007) +[2023-10-08 16:48:20,806][21194] Updated weights for policy 1, policy_version 26930 (0.0008) +[2023-10-08 16:48:21,121][21195] Updated weights for policy 0, policy_version 27130 (0.0008) +[2023-10-08 16:48:21,160][21194] Updated weights for policy 1, policy_version 26940 (0.0008) +[2023-10-08 16:48:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 55377920. Throughput: 0: 1706.0, 1: 1691.1. Samples: 13850950. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:23,803][19739] Avg episode reward: [(0, '658.310'), (1, '673.860')] +[2023-10-08 16:48:25,037][21195] Updated weights for policy 0, policy_version 27140 (0.0008) +[2023-10-08 16:48:25,294][21194] Updated weights for policy 1, policy_version 26950 (0.0009) +[2023-10-08 16:48:25,409][21195] Updated weights for policy 0, policy_version 27150 (0.0007) +[2023-10-08 16:48:25,671][21194] Updated weights for policy 1, policy_version 26960 (0.0007) +[2023-10-08 16:48:25,776][21195] Updated weights for policy 0, policy_version 27160 (0.0009) +[2023-10-08 16:48:26,025][21194] Updated weights for policy 1, policy_version 26970 (0.0008) +[2023-10-08 16:48:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 55443456. Throughput: 0: 1728.4, 1: 1710.5. Samples: 13872274. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:28,803][19739] Avg episode reward: [(0, '658.310'), (1, '695.280')] +[2023-10-08 16:48:29,629][21195] Updated weights for policy 0, policy_version 27170 (0.0007) +[2023-10-08 16:48:29,898][21194] Updated weights for policy 1, policy_version 26980 (0.0009) +[2023-10-08 16:48:29,996][21195] Updated weights for policy 0, policy_version 27180 (0.0007) +[2023-10-08 16:48:30,267][21194] Updated weights for policy 1, policy_version 26990 (0.0008) +[2023-10-08 16:48:30,377][21195] Updated weights for policy 0, policy_version 27190 (0.0008) +[2023-10-08 16:48:30,635][21194] Updated weights for policy 1, policy_version 27000 (0.0008) +[2023-10-08 16:48:30,742][21195] Updated weights for policy 0, policy_version 27200 (0.0009) +[2023-10-08 16:48:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 55508992. Throughput: 0: 1741.5, 1: 1679.2. Samples: 13887734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:33,803][19739] Avg episode reward: [(0, '686.610'), (1, '695.280')] +[2023-10-08 16:48:34,694][21195] Updated weights for policy 0, policy_version 27210 (0.0008) +[2023-10-08 16:48:34,715][21194] Updated weights for policy 1, policy_version 27010 (0.0008) +[2023-10-08 16:48:35,063][21195] Updated weights for policy 0, policy_version 27220 (0.0007) +[2023-10-08 16:48:35,079][21194] Updated weights for policy 1, policy_version 27020 (0.0007) +[2023-10-08 16:48:35,423][21195] Updated weights for policy 0, policy_version 27230 (0.0008) +[2023-10-08 16:48:35,454][21194] Updated weights for policy 1, policy_version 27030 (0.0008) +[2023-10-08 16:48:35,815][21194] Updated weights for policy 1, policy_version 27040 (0.0008) +[2023-10-08 16:48:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 55574528. Throughput: 0: 1723.5, 1: 1692.2. Samples: 13902948. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:38,803][19739] Avg episode reward: [(0, '686.610'), (1, '695.280')] +[2023-10-08 16:48:39,356][21195] Updated weights for policy 0, policy_version 27240 (0.0009) +[2023-10-08 16:48:39,739][21195] Updated weights for policy 0, policy_version 27250 (0.0009) +[2023-10-08 16:48:39,819][21194] Updated weights for policy 1, policy_version 27050 (0.0009) +[2023-10-08 16:48:40,108][21195] Updated weights for policy 0, policy_version 27260 (0.0007) +[2023-10-08 16:48:40,193][21194] Updated weights for policy 1, policy_version 27060 (0.0007) +[2023-10-08 16:48:40,556][21194] Updated weights for policy 1, policy_version 27070 (0.0007) +[2023-10-08 16:48:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 55640064. Throughput: 0: 1750.7, 1: 1705.9. Samples: 13924610. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:43,803][19739] Avg episode reward: [(0, '686.610'), (1, '709.050')] +[2023-10-08 16:48:43,884][21195] Updated weights for policy 0, policy_version 27270 (0.0008) +[2023-10-08 16:48:44,254][21195] Updated weights for policy 0, policy_version 27280 (0.0009) +[2023-10-08 16:48:44,359][21194] Updated weights for policy 1, policy_version 27080 (0.0007) +[2023-10-08 16:48:44,629][21195] Updated weights for policy 0, policy_version 27290 (0.0007) +[2023-10-08 16:48:44,728][21194] Updated weights for policy 1, policy_version 27090 (0.0009) +[2023-10-08 16:48:45,100][21194] Updated weights for policy 1, policy_version 27100 (0.0011) +[2023-10-08 16:48:48,606][21195] Updated weights for policy 0, policy_version 27300 (0.0008) +[2023-10-08 16:48:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 55705600. Throughput: 0: 1747.6, 1: 1688.7. Samples: 13939764. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:48:48,803][19739] Avg episode reward: [(0, '686.610'), (1, '709.050')] +[2023-10-08 16:48:48,972][21195] Updated weights for policy 0, policy_version 27310 (0.0007) +[2023-10-08 16:48:49,039][21194] Updated weights for policy 1, policy_version 27110 (0.0008) +[2023-10-08 16:48:49,339][21195] Updated weights for policy 0, policy_version 27320 (0.0007) +[2023-10-08 16:48:49,400][21194] Updated weights for policy 1, policy_version 27120 (0.0007) +[2023-10-08 16:48:49,773][21194] Updated weights for policy 1, policy_version 27130 (0.0009) +[2023-10-08 16:48:53,071][21195] Updated weights for policy 0, policy_version 27330 (0.0010) +[2023-10-08 16:48:53,445][21195] Updated weights for policy 0, policy_version 27340 (0.0008) +[2023-10-08 16:48:53,693][21194] Updated weights for policy 1, policy_version 27140 (0.0008) +[2023-10-08 16:48:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 55771136. Throughput: 0: 1752.7, 1: 1711.8. Samples: 13955316. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 16:48:53,803][19739] Avg episode reward: [(0, '686.610'), (1, '709.050')] +[2023-10-08 16:48:53,827][21195] Updated weights for policy 0, policy_version 27350 (0.0008) +[2023-10-08 16:48:54,063][21194] Updated weights for policy 1, policy_version 27150 (0.0009) +[2023-10-08 16:48:54,183][21195] Updated weights for policy 0, policy_version 27360 (0.0007) +[2023-10-08 16:48:54,424][21194] Updated weights for policy 1, policy_version 27160 (0.0010) +[2023-10-08 16:48:58,145][21195] Updated weights for policy 0, policy_version 27370 (0.0009) +[2023-10-08 16:48:58,327][21194] Updated weights for policy 1, policy_version 27170 (0.0010) +[2023-10-08 16:48:58,516][21195] Updated weights for policy 0, policy_version 27380 (0.0009) +[2023-10-08 16:48:58,693][21194] Updated weights for policy 1, policy_version 27180 (0.0007) +[2023-10-08 16:48:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 55836672. Throughput: 0: 1751.2, 1: 1719.5. Samples: 13976608. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 16:48:58,803][19739] Avg episode reward: [(0, '701.760'), (1, '709.050')] +[2023-10-08 16:48:58,886][21195] Updated weights for policy 0, policy_version 27390 (0.0008) +[2023-10-08 16:48:58,955][20740] Saving new best policy, reward=701.760! +[2023-10-08 16:48:59,051][21194] Updated weights for policy 1, policy_version 27190 (0.0007) +[2023-10-08 16:48:59,423][21194] Updated weights for policy 1, policy_version 27200 (0.0010) +[2023-10-08 16:49:02,715][21195] Updated weights for policy 0, policy_version 27400 (0.0008) +[2023-10-08 16:49:03,087][21195] Updated weights for policy 0, policy_version 27410 (0.0007) +[2023-10-08 16:49:03,366][21194] Updated weights for policy 1, policy_version 27210 (0.0008) +[2023-10-08 16:49:03,453][21195] Updated weights for policy 0, policy_version 27420 (0.0009) +[2023-10-08 16:49:03,733][21194] Updated weights for policy 1, policy_version 27220 (0.0010) +[2023-10-08 16:49:03,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 55934976. Throughput: 0: 1720.3, 1: 1710.0. Samples: 13990850. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 16:49:03,803][19739] Avg episode reward: [(0, '700.580'), (1, '737.300')] +[2023-10-08 16:49:04,103][21194] Updated weights for policy 1, policy_version 27230 (0.0009) +[2023-10-08 16:49:04,175][20836] Saving new best policy, reward=737.300! +[2023-10-08 16:49:07,461][21195] Updated weights for policy 0, policy_version 27430 (0.0009) +[2023-10-08 16:49:07,824][21195] Updated weights for policy 0, policy_version 27440 (0.0009) +[2023-10-08 16:49:08,114][21194] Updated weights for policy 1, policy_version 27240 (0.0007) +[2023-10-08 16:49:08,190][21195] Updated weights for policy 0, policy_version 27450 (0.0009) +[2023-10-08 16:49:08,471][21194] Updated weights for policy 1, policy_version 27250 (0.0007) +[2023-10-08 16:49:08,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 56000512. Throughput: 0: 1750.1, 1: 1724.2. Samples: 14007294. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 16:49:08,803][19739] Avg episode reward: [(0, '700.580'), (1, '749.880')] +[2023-10-08 16:49:08,836][21194] Updated weights for policy 1, policy_version 27260 (0.0007) +[2023-10-08 16:49:08,971][20836] Saving new best policy, reward=749.880! +[2023-10-08 16:49:12,107][21195] Updated weights for policy 0, policy_version 27460 (0.0007) +[2023-10-08 16:49:12,471][21195] Updated weights for policy 0, policy_version 27470 (0.0009) +[2023-10-08 16:49:12,810][21194] Updated weights for policy 1, policy_version 27270 (0.0010) +[2023-10-08 16:49:12,843][21195] Updated weights for policy 0, policy_version 27480 (0.0007) +[2023-10-08 16:49:13,192][21194] Updated weights for policy 1, policy_version 27280 (0.0009) +[2023-10-08 16:49:13,546][21194] Updated weights for policy 1, policy_version 27290 (0.0011) +[2023-10-08 16:49:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 56098816. Throughput: 0: 1729.5, 1: 1714.6. Samples: 14027260. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:49:13,803][19739] Avg episode reward: [(0, '700.580'), (1, '749.880')] +[2023-10-08 16:49:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000027488_28147712.pth... +[2023-10-08 16:49:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000027296_27951104.pth... +[2023-10-08 16:49:13,849][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000025696_26312704.pth +[2023-10-08 16:49:13,852][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000025856_26476544.pth +[2023-10-08 16:49:16,817][21195] Updated weights for policy 0, policy_version 27490 (0.0007) +[2023-10-08 16:49:17,197][21195] Updated weights for policy 0, policy_version 27500 (0.0008) +[2023-10-08 16:49:17,563][21195] Updated weights for policy 0, policy_version 27510 (0.0009) +[2023-10-08 16:49:17,629][21194] Updated weights for policy 1, policy_version 27300 (0.0009) +[2023-10-08 16:49:17,929][21195] Updated weights for policy 0, policy_version 27520 (0.0007) +[2023-10-08 16:49:17,995][21194] Updated weights for policy 1, policy_version 27310 (0.0007) +[2023-10-08 16:49:18,374][21194] Updated weights for policy 1, policy_version 27320 (0.0011) +[2023-10-08 16:49:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 56164352. Throughput: 0: 1718.7, 1: 1723.6. Samples: 14042636. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:49:18,803][19739] Avg episode reward: [(0, '700.580'), (1, '735.550')] +[2023-10-08 16:49:21,811][21195] Updated weights for policy 0, policy_version 27530 (0.0010) +[2023-10-08 16:49:22,184][21195] Updated weights for policy 0, policy_version 27540 (0.0010) +[2023-10-08 16:49:22,427][21194] Updated weights for policy 1, policy_version 27330 (0.0010) +[2023-10-08 16:49:22,549][21195] Updated weights for policy 0, policy_version 27550 (0.0007) +[2023-10-08 16:49:22,806][21194] Updated weights for policy 1, policy_version 27340 (0.0009) +[2023-10-08 16:49:23,180][21194] Updated weights for policy 1, policy_version 27350 (0.0010) +[2023-10-08 16:49:23,544][21194] Updated weights for policy 1, policy_version 27360 (0.0010) +[2023-10-08 16:49:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 56229888. Throughput: 0: 1736.0, 1: 1728.2. Samples: 14058836. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:49:23,803][19739] Avg episode reward: [(0, '687.140'), (1, '737.210')] +[2023-10-08 16:49:26,515][21195] Updated weights for policy 0, policy_version 27560 (0.0007) +[2023-10-08 16:49:26,893][21195] Updated weights for policy 0, policy_version 27570 (0.0008) +[2023-10-08 16:49:27,252][21195] Updated weights for policy 0, policy_version 27580 (0.0008) +[2023-10-08 16:49:27,567][21194] Updated weights for policy 1, policy_version 27370 (0.0008) +[2023-10-08 16:49:27,927][21194] Updated weights for policy 1, policy_version 27380 (0.0007) +[2023-10-08 16:49:28,291][21194] Updated weights for policy 1, policy_version 27390 (0.0010) +[2023-10-08 16:49:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 56295424. Throughput: 0: 1709.7, 1: 1703.9. Samples: 14078222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:49:28,803][19739] Avg episode reward: [(0, '687.140'), (1, '737.210')] +[2023-10-08 16:49:31,217][21195] Updated weights for policy 0, policy_version 27590 (0.0010) +[2023-10-08 16:49:31,580][21195] Updated weights for policy 0, policy_version 27600 (0.0010) +[2023-10-08 16:49:31,949][21195] Updated weights for policy 0, policy_version 27610 (0.0010) +[2023-10-08 16:49:32,219][21194] Updated weights for policy 1, policy_version 27400 (0.0008) +[2023-10-08 16:49:32,582][21194] Updated weights for policy 1, policy_version 27410 (0.0011) +[2023-10-08 16:49:32,947][21194] Updated weights for policy 1, policy_version 27420 (0.0008) +[2023-10-08 16:49:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 56360960. Throughput: 0: 1721.1, 1: 1721.3. Samples: 14094670. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:49:33,803][19739] Avg episode reward: [(0, '687.140'), (1, '737.210')] +[2023-10-08 16:49:35,802][21195] Updated weights for policy 0, policy_version 27620 (0.0009) +[2023-10-08 16:49:36,176][21195] Updated weights for policy 0, policy_version 27630 (0.0010) +[2023-10-08 16:49:36,544][21195] Updated weights for policy 0, policy_version 27640 (0.0010) +[2023-10-08 16:49:37,010][21194] Updated weights for policy 1, policy_version 27430 (0.0008) +[2023-10-08 16:49:37,378][21194] Updated weights for policy 1, policy_version 27440 (0.0008) +[2023-10-08 16:49:37,745][21194] Updated weights for policy 1, policy_version 27450 (0.0007) +[2023-10-08 16:49:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 56426496. Throughput: 0: 1714.2, 1: 1717.4. Samples: 14109738. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:49:38,803][19739] Avg episode reward: [(0, '701.070'), (1, '734.760')] +[2023-10-08 16:49:40,600][21195] Updated weights for policy 0, policy_version 27650 (0.0009) +[2023-10-08 16:49:40,966][21195] Updated weights for policy 0, policy_version 27660 (0.0009) +[2023-10-08 16:49:41,340][21195] Updated weights for policy 0, policy_version 27670 (0.0007) +[2023-10-08 16:49:41,706][21195] Updated weights for policy 0, policy_version 27680 (0.0008) +[2023-10-08 16:49:41,760][21194] Updated weights for policy 1, policy_version 27460 (0.0008) +[2023-10-08 16:49:42,129][21194] Updated weights for policy 1, policy_version 27470 (0.0008) +[2023-10-08 16:49:42,498][21194] Updated weights for policy 1, policy_version 27480 (0.0007) +[2023-10-08 16:49:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 56492032. Throughput: 0: 1720.1, 1: 1690.4. Samples: 14130080. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:49:43,803][19739] Avg episode reward: [(0, '701.190'), (1, '730.390')] +[2023-10-08 16:49:45,751][21195] Updated weights for policy 0, policy_version 27690 (0.0010) +[2023-10-08 16:49:46,129][21195] Updated weights for policy 0, policy_version 27700 (0.0009) +[2023-10-08 16:49:46,350][21194] Updated weights for policy 1, policy_version 27490 (0.0007) +[2023-10-08 16:49:46,500][21195] Updated weights for policy 0, policy_version 27710 (0.0008) +[2023-10-08 16:49:46,713][21194] Updated weights for policy 1, policy_version 27500 (0.0007) +[2023-10-08 16:49:47,071][21194] Updated weights for policy 1, policy_version 27510 (0.0007) +[2023-10-08 16:49:47,440][21194] Updated weights for policy 1, policy_version 27520 (0.0007) +[2023-10-08 16:49:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 56557568. Throughput: 0: 1746.2, 1: 1721.5. Samples: 14146898. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:49:48,803][19739] Avg episode reward: [(0, '678.450'), (1, '738.830')] +[2023-10-08 16:49:50,244][21195] Updated weights for policy 0, policy_version 27720 (0.0008) +[2023-10-08 16:49:50,617][21195] Updated weights for policy 0, policy_version 27730 (0.0009) +[2023-10-08 16:49:50,992][21195] Updated weights for policy 0, policy_version 27740 (0.0008) +[2023-10-08 16:49:51,388][21194] Updated weights for policy 1, policy_version 27530 (0.0009) +[2023-10-08 16:49:51,750][21194] Updated weights for policy 1, policy_version 27540 (0.0010) +[2023-10-08 16:49:52,124][21194] Updated weights for policy 1, policy_version 27550 (0.0010) +[2023-10-08 16:49:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 56623104. Throughput: 0: 1716.3, 1: 1704.2. Samples: 14161216. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 16:49:53,803][19739] Avg episode reward: [(0, '659.230'), (1, '738.830')] +[2023-10-08 16:49:55,055][21195] Updated weights for policy 0, policy_version 27750 (0.0010) +[2023-10-08 16:49:55,428][21195] Updated weights for policy 0, policy_version 27760 (0.0010) +[2023-10-08 16:49:55,789][21195] Updated weights for policy 0, policy_version 27770 (0.0009) +[2023-10-08 16:49:56,002][21194] Updated weights for policy 1, policy_version 27560 (0.0008) +[2023-10-08 16:49:56,376][21194] Updated weights for policy 1, policy_version 27570 (0.0009) +[2023-10-08 16:49:56,747][21194] Updated weights for policy 1, policy_version 27580 (0.0008) +[2023-10-08 16:49:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 56688640. Throughput: 0: 1736.0, 1: 1712.8. Samples: 14182456. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:49:58,803][19739] Avg episode reward: [(0, '659.230'), (1, '738.830')] +[2023-10-08 16:49:59,609][21195] Updated weights for policy 0, policy_version 27780 (0.0009) +[2023-10-08 16:49:59,982][21195] Updated weights for policy 0, policy_version 27790 (0.0007) +[2023-10-08 16:50:00,354][21195] Updated weights for policy 0, policy_version 27800 (0.0009) +[2023-10-08 16:50:00,812][21194] Updated weights for policy 1, policy_version 27590 (0.0008) +[2023-10-08 16:50:01,194][21194] Updated weights for policy 1, policy_version 27600 (0.0010) +[2023-10-08 16:50:01,559][21194] Updated weights for policy 1, policy_version 27610 (0.0007) +[2023-10-08 16:50:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 56754176. Throughput: 0: 1746.8, 1: 1720.4. Samples: 14198658. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:50:03,804][19739] Avg episode reward: [(0, '659.230'), (1, '738.830')] +[2023-10-08 16:50:04,227][21195] Updated weights for policy 0, policy_version 27810 (0.0008) +[2023-10-08 16:50:04,597][21195] Updated weights for policy 0, policy_version 27820 (0.0009) +[2023-10-08 16:50:04,963][21195] Updated weights for policy 0, policy_version 27830 (0.0009) +[2023-10-08 16:50:05,341][21195] Updated weights for policy 0, policy_version 27840 (0.0007) +[2023-10-08 16:50:05,471][21194] Updated weights for policy 1, policy_version 27620 (0.0008) +[2023-10-08 16:50:05,829][21194] Updated weights for policy 1, policy_version 27630 (0.0009) +[2023-10-08 16:50:06,198][21194] Updated weights for policy 1, policy_version 27640 (0.0007) +[2023-10-08 16:50:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 56819712. Throughput: 0: 1727.2, 1: 1701.3. Samples: 14213118. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:50:08,803][19739] Avg episode reward: [(0, '659.230'), (1, '738.830')] +[2023-10-08 16:50:09,248][21195] Updated weights for policy 0, policy_version 27850 (0.0008) +[2023-10-08 16:50:09,616][21195] Updated weights for policy 0, policy_version 27860 (0.0009) +[2023-10-08 16:50:09,985][21195] Updated weights for policy 0, policy_version 27870 (0.0008) +[2023-10-08 16:50:10,184][21194] Updated weights for policy 1, policy_version 27650 (0.0010) +[2023-10-08 16:50:10,554][21194] Updated weights for policy 1, policy_version 27660 (0.0007) +[2023-10-08 16:50:10,925][21194] Updated weights for policy 1, policy_version 27670 (0.0008) +[2023-10-08 16:50:11,287][21194] Updated weights for policy 1, policy_version 27680 (0.0008) +[2023-10-08 16:50:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 56885248. Throughput: 0: 1752.7, 1: 1720.6. Samples: 14234518. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:50:13,803][19739] Avg episode reward: [(0, '659.230'), (1, '738.870')] +[2023-10-08 16:50:13,875][21195] Updated weights for policy 0, policy_version 27880 (0.0009) +[2023-10-08 16:50:14,252][21195] Updated weights for policy 0, policy_version 27890 (0.0008) +[2023-10-08 16:50:14,617][21195] Updated weights for policy 0, policy_version 27900 (0.0007) +[2023-10-08 16:50:15,219][21194] Updated weights for policy 1, policy_version 27690 (0.0008) +[2023-10-08 16:50:15,593][21194] Updated weights for policy 1, policy_version 27700 (0.0007) +[2023-10-08 16:50:15,961][21194] Updated weights for policy 1, policy_version 27710 (0.0009) +[2023-10-08 16:50:18,435][21195] Updated weights for policy 0, policy_version 27910 (0.0010) +[2023-10-08 16:50:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 56950784. Throughput: 0: 1733.6, 1: 1704.6. Samples: 14249392. Policy #0 lag: (min: 25.0, avg: 41.4, max: 57.0) +[2023-10-08 16:50:18,803][19739] Avg episode reward: [(0, '660.550'), (1, '738.870')] +[2023-10-08 16:50:18,805][21195] Updated weights for policy 0, policy_version 27920 (0.0009) +[2023-10-08 16:50:19,183][21195] Updated weights for policy 0, policy_version 27930 (0.0011) +[2023-10-08 16:50:20,054][21194] Updated weights for policy 1, policy_version 27720 (0.0009) +[2023-10-08 16:50:20,413][21194] Updated weights for policy 1, policy_version 27730 (0.0009) +[2023-10-08 16:50:20,777][21194] Updated weights for policy 1, policy_version 27740 (0.0009) +[2023-10-08 16:50:23,116][21195] Updated weights for policy 0, policy_version 27940 (0.0010) +[2023-10-08 16:50:23,488][21195] Updated weights for policy 0, policy_version 27950 (0.0009) +[2023-10-08 16:50:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 57016320. Throughput: 0: 1745.5, 1: 1706.3. Samples: 14265066. Policy #0 lag: (min: 25.0, avg: 41.4, max: 57.0) +[2023-10-08 16:50:23,803][19739] Avg episode reward: [(0, '657.670'), (1, '736.900')] +[2023-10-08 16:50:23,857][21195] Updated weights for policy 0, policy_version 27960 (0.0009) +[2023-10-08 16:50:24,698][21194] Updated weights for policy 1, policy_version 27750 (0.0010) +[2023-10-08 16:50:25,068][21194] Updated weights for policy 1, policy_version 27760 (0.0011) +[2023-10-08 16:50:25,434][21194] Updated weights for policy 1, policy_version 27770 (0.0010) +[2023-10-08 16:50:27,695][21195] Updated weights for policy 0, policy_version 27970 (0.0009) +[2023-10-08 16:50:28,067][21195] Updated weights for policy 0, policy_version 27980 (0.0008) +[2023-10-08 16:50:28,443][21195] Updated weights for policy 0, policy_version 27990 (0.0009) +[2023-10-08 16:50:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 57081856. Throughput: 0: 1746.8, 1: 1729.0. Samples: 14286490. Policy #0 lag: (min: 25.0, avg: 41.4, max: 57.0) +[2023-10-08 16:50:28,803][19739] Avg episode reward: [(0, '657.670'), (1, '736.900')] +[2023-10-08 16:50:28,808][21195] Updated weights for policy 0, policy_version 28000 (0.0010) +[2023-10-08 16:50:29,370][21194] Updated weights for policy 1, policy_version 27780 (0.0009) +[2023-10-08 16:50:29,736][21194] Updated weights for policy 1, policy_version 27790 (0.0007) +[2023-10-08 16:50:30,098][21194] Updated weights for policy 1, policy_version 27800 (0.0007) +[2023-10-08 16:50:32,775][21195] Updated weights for policy 0, policy_version 28010 (0.0007) +[2023-10-08 16:50:33,148][21195] Updated weights for policy 0, policy_version 28020 (0.0007) +[2023-10-08 16:50:33,526][21195] Updated weights for policy 0, policy_version 28030 (0.0010) +[2023-10-08 16:50:33,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 57180160. Throughput: 0: 1722.4, 1: 1694.9. Samples: 14300678. Policy #0 lag: (min: 25.0, avg: 41.4, max: 57.0) +[2023-10-08 16:50:33,804][19739] Avg episode reward: [(0, '657.670'), (1, '736.900')] +[2023-10-08 16:50:34,047][21194] Updated weights for policy 1, policy_version 27810 (0.0007) +[2023-10-08 16:50:34,422][21194] Updated weights for policy 1, policy_version 27820 (0.0010) +[2023-10-08 16:50:34,787][21194] Updated weights for policy 1, policy_version 27830 (0.0008) +[2023-10-08 16:50:35,148][21194] Updated weights for policy 1, policy_version 27840 (0.0009) +[2023-10-08 16:50:37,462][21195] Updated weights for policy 0, policy_version 28040 (0.0009) +[2023-10-08 16:50:37,842][21195] Updated weights for policy 0, policy_version 28050 (0.0008) +[2023-10-08 16:50:38,200][21195] Updated weights for policy 0, policy_version 28060 (0.0009) +[2023-10-08 16:50:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 57245696. Throughput: 0: 1753.1, 1: 1714.7. Samples: 14317264. Policy #0 lag: (min: 14.0, avg: 20.1, max: 46.0) +[2023-10-08 16:50:38,803][19739] Avg episode reward: [(0, '639.440'), (1, '730.550')] +[2023-10-08 16:50:39,249][21194] Updated weights for policy 1, policy_version 27850 (0.0007) +[2023-10-08 16:50:39,626][21194] Updated weights for policy 1, policy_version 27860 (0.0008) +[2023-10-08 16:50:39,984][21194] Updated weights for policy 1, policy_version 27870 (0.0007) +[2023-10-08 16:50:42,108][21195] Updated weights for policy 0, policy_version 28070 (0.0009) +[2023-10-08 16:50:42,474][21195] Updated weights for policy 0, policy_version 28080 (0.0008) +[2023-10-08 16:50:42,847][21195] Updated weights for policy 0, policy_version 28090 (0.0007) +[2023-10-08 16:50:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 57311232. Throughput: 0: 1731.5, 1: 1721.5. Samples: 14337840. Policy #0 lag: (min: 14.0, avg: 20.1, max: 46.0) +[2023-10-08 16:50:43,803][19739] Avg episode reward: [(0, '639.440'), (1, '730.550')] +[2023-10-08 16:50:43,840][21194] Updated weights for policy 1, policy_version 27880 (0.0008) +[2023-10-08 16:50:44,212][21194] Updated weights for policy 1, policy_version 27890 (0.0007) +[2023-10-08 16:50:44,589][21194] Updated weights for policy 1, policy_version 27900 (0.0008) +[2023-10-08 16:50:46,590][21195] Updated weights for policy 0, policy_version 28100 (0.0008) +[2023-10-08 16:50:46,950][21195] Updated weights for policy 0, policy_version 28110 (0.0007) +[2023-10-08 16:50:47,315][21195] Updated weights for policy 0, policy_version 28120 (0.0007) +[2023-10-08 16:50:48,737][21194] Updated weights for policy 1, policy_version 27910 (0.0009) +[2023-10-08 16:50:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 57376768. Throughput: 0: 1722.4, 1: 1703.7. Samples: 14352830. Policy #0 lag: (min: 14.0, avg: 20.1, max: 46.0) +[2023-10-08 16:50:48,803][19739] Avg episode reward: [(0, '639.440'), (1, '730.550')] +[2023-10-08 16:50:49,112][21194] Updated weights for policy 1, policy_version 27920 (0.0011) +[2023-10-08 16:50:49,471][21194] Updated weights for policy 1, policy_version 27930 (0.0010) +[2023-10-08 16:50:51,287][21195] Updated weights for policy 0, policy_version 28130 (0.0007) +[2023-10-08 16:50:51,651][21195] Updated weights for policy 0, policy_version 28140 (0.0008) +[2023-10-08 16:50:52,031][21195] Updated weights for policy 0, policy_version 28150 (0.0009) +[2023-10-08 16:50:52,397][21195] Updated weights for policy 0, policy_version 28160 (0.0009) +[2023-10-08 16:50:53,505][21194] Updated weights for policy 1, policy_version 27940 (0.0008) +[2023-10-08 16:50:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 57442304. Throughput: 0: 1738.8, 1: 1719.9. Samples: 14368762. Policy #0 lag: (min: 14.0, avg: 20.1, max: 46.0) +[2023-10-08 16:50:53,803][19739] Avg episode reward: [(0, '639.440'), (1, '745.490')] +[2023-10-08 16:50:53,876][21194] Updated weights for policy 1, policy_version 27950 (0.0009) +[2023-10-08 16:50:54,239][21194] Updated weights for policy 1, policy_version 27960 (0.0007) +[2023-10-08 16:50:56,214][21195] Updated weights for policy 0, policy_version 28170 (0.0007) +[2023-10-08 16:50:56,582][21195] Updated weights for policy 0, policy_version 28180 (0.0008) +[2023-10-08 16:50:56,949][21195] Updated weights for policy 0, policy_version 28190 (0.0007) +[2023-10-08 16:50:58,225][21194] Updated weights for policy 1, policy_version 27970 (0.0008) +[2023-10-08 16:50:58,597][21194] Updated weights for policy 1, policy_version 27980 (0.0007) +[2023-10-08 16:50:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 57507840. Throughput: 0: 1719.6, 1: 1722.1. Samples: 14389396. Policy #0 lag: (min: 14.0, avg: 20.1, max: 46.0) +[2023-10-08 16:50:58,803][19739] Avg episode reward: [(0, '641.350'), (1, '760.640')] +[2023-10-08 16:50:58,962][21194] Updated weights for policy 1, policy_version 27990 (0.0010) +[2023-10-08 16:50:59,327][20836] Saving new best policy, reward=760.640! +[2023-10-08 16:50:59,328][21194] Updated weights for policy 1, policy_version 28000 (0.0010) +[2023-10-08 16:51:00,887][21195] Updated weights for policy 0, policy_version 28200 (0.0010) +[2023-10-08 16:51:01,262][21195] Updated weights for policy 0, policy_version 28210 (0.0009) +[2023-10-08 16:51:01,634][21195] Updated weights for policy 0, policy_version 28220 (0.0010) +[2023-10-08 16:51:03,266][21194] Updated weights for policy 1, policy_version 28010 (0.0008) +[2023-10-08 16:51:03,640][21194] Updated weights for policy 1, policy_version 28020 (0.0009) +[2023-10-08 16:51:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 57573376. Throughput: 0: 1736.6, 1: 1716.3. Samples: 14404776. Policy #0 lag: (min: 31.0, avg: 31.9, max: 52.0) +[2023-10-08 16:51:03,804][19739] Avg episode reward: [(0, '641.350'), (1, '740.320')] +[2023-10-08 16:51:04,014][21194] Updated weights for policy 1, policy_version 28030 (0.0009) +[2023-10-08 16:51:05,506][21195] Updated weights for policy 0, policy_version 28230 (0.0010) +[2023-10-08 16:51:05,871][21195] Updated weights for policy 0, policy_version 28240 (0.0008) +[2023-10-08 16:51:06,251][21195] Updated weights for policy 0, policy_version 28250 (0.0009) +[2023-10-08 16:51:07,806][21194] Updated weights for policy 1, policy_version 28040 (0.0008) +[2023-10-08 16:51:08,174][21194] Updated weights for policy 1, policy_version 28050 (0.0009) +[2023-10-08 16:51:08,545][21194] Updated weights for policy 1, policy_version 28060 (0.0008) +[2023-10-08 16:51:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 57671680. Throughput: 0: 1725.1, 1: 1726.4. Samples: 14420382. Policy #0 lag: (min: 31.0, avg: 31.9, max: 52.0) +[2023-10-08 16:51:08,803][19739] Avg episode reward: [(0, '641.350'), (1, '716.620')] +[2023-10-08 16:51:10,177][21195] Updated weights for policy 0, policy_version 28260 (0.0007) +[2023-10-08 16:51:10,544][21195] Updated weights for policy 0, policy_version 28270 (0.0007) +[2023-10-08 16:51:10,911][21195] Updated weights for policy 0, policy_version 28280 (0.0007) +[2023-10-08 16:51:12,506][21194] Updated weights for policy 1, policy_version 28070 (0.0008) +[2023-10-08 16:51:12,876][21194] Updated weights for policy 1, policy_version 28080 (0.0009) +[2023-10-08 16:51:13,232][21194] Updated weights for policy 1, policy_version 28090 (0.0009) +[2023-10-08 16:51:13,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 57737216. Throughput: 0: 1736.8, 1: 1708.8. Samples: 14441542. Policy #0 lag: (min: 31.0, avg: 31.9, max: 52.0) +[2023-10-08 16:51:13,803][19739] Avg episode reward: [(0, '641.350'), (1, '716.620')] +[2023-10-08 16:51:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000028288_28966912.pth... +[2023-10-08 16:51:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000028096_28770304.pth... +[2023-10-08 16:51:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000026688_27328512.pth +[2023-10-08 16:51:13,854][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000026496_27131904.pth +[2023-10-08 16:51:14,821][21195] Updated weights for policy 0, policy_version 28290 (0.0008) +[2023-10-08 16:51:15,189][21195] Updated weights for policy 0, policy_version 28300 (0.0010) +[2023-10-08 16:51:15,559][21195] Updated weights for policy 0, policy_version 28310 (0.0008) +[2023-10-08 16:51:15,931][21195] Updated weights for policy 0, policy_version 28320 (0.0008) +[2023-10-08 16:51:17,204][21194] Updated weights for policy 1, policy_version 28100 (0.0008) +[2023-10-08 16:51:17,569][21194] Updated weights for policy 1, policy_version 28110 (0.0007) +[2023-10-08 16:51:17,932][21194] Updated weights for policy 1, policy_version 28120 (0.0008) +[2023-10-08 16:51:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 57802752. Throughput: 0: 1762.9, 1: 1729.9. Samples: 14457852. Policy #0 lag: (min: 31.0, avg: 31.9, max: 52.0) +[2023-10-08 16:51:18,803][19739] Avg episode reward: [(0, '641.350'), (1, '716.620')] +[2023-10-08 16:51:19,948][21195] Updated weights for policy 0, policy_version 28330 (0.0007) +[2023-10-08 16:51:20,313][21195] Updated weights for policy 0, policy_version 28340 (0.0007) +[2023-10-08 16:51:20,687][21195] Updated weights for policy 0, policy_version 28350 (0.0008) +[2023-10-08 16:51:21,918][21194] Updated weights for policy 1, policy_version 28130 (0.0008) +[2023-10-08 16:51:22,278][21194] Updated weights for policy 1, policy_version 28140 (0.0008) +[2023-10-08 16:51:22,655][21194] Updated weights for policy 1, policy_version 28150 (0.0008) +[2023-10-08 16:51:23,016][21194] Updated weights for policy 1, policy_version 28160 (0.0009) +[2023-10-08 16:51:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 57868288. Throughput: 0: 1732.0, 1: 1727.6. Samples: 14472942. Policy #0 lag: (min: 31.0, avg: 31.9, max: 52.0) +[2023-10-08 16:51:23,803][19739] Avg episode reward: [(0, '637.600'), (1, '716.620')] +[2023-10-08 16:51:24,729][21195] Updated weights for policy 0, policy_version 28360 (0.0008) +[2023-10-08 16:51:25,104][21195] Updated weights for policy 0, policy_version 28370 (0.0007) +[2023-10-08 16:51:25,486][21195] Updated weights for policy 0, policy_version 28380 (0.0008) +[2023-10-08 16:51:27,028][21194] Updated weights for policy 1, policy_version 28170 (0.0007) +[2023-10-08 16:51:27,391][21194] Updated weights for policy 1, policy_version 28180 (0.0007) +[2023-10-08 16:51:27,748][21194] Updated weights for policy 1, policy_version 28190 (0.0008) +[2023-10-08 16:51:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 57933824. Throughput: 0: 1755.7, 1: 1696.6. Samples: 14493192. Policy #0 lag: (min: 15.0, avg: 23.0, max: 47.0) +[2023-10-08 16:51:28,803][19739] Avg episode reward: [(0, '651.700'), (1, '716.620')] +[2023-10-08 16:51:29,333][21195] Updated weights for policy 0, policy_version 28390 (0.0007) +[2023-10-08 16:51:29,707][21195] Updated weights for policy 0, policy_version 28400 (0.0007) +[2023-10-08 16:51:30,066][21195] Updated weights for policy 0, policy_version 28410 (0.0007) +[2023-10-08 16:51:31,718][21194] Updated weights for policy 1, policy_version 28200 (0.0008) +[2023-10-08 16:51:32,085][21194] Updated weights for policy 1, policy_version 28210 (0.0007) +[2023-10-08 16:51:32,451][21194] Updated weights for policy 1, policy_version 28220 (0.0007) +[2023-10-08 16:51:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 57999360. Throughput: 0: 1756.8, 1: 1727.7. Samples: 14509634. Policy #0 lag: (min: 15.0, avg: 23.0, max: 47.0) +[2023-10-08 16:51:33,803][19739] Avg episode reward: [(0, '651.700'), (1, '716.620')] +[2023-10-08 16:51:34,090][21195] Updated weights for policy 0, policy_version 28420 (0.0008) +[2023-10-08 16:51:34,447][21195] Updated weights for policy 0, policy_version 28430 (0.0007) +[2023-10-08 16:51:34,822][21195] Updated weights for policy 0, policy_version 28440 (0.0009) +[2023-10-08 16:51:36,399][21194] Updated weights for policy 1, policy_version 28230 (0.0007) +[2023-10-08 16:51:36,778][21194] Updated weights for policy 1, policy_version 28240 (0.0009) +[2023-10-08 16:51:37,152][21194] Updated weights for policy 1, policy_version 28250 (0.0009) +[2023-10-08 16:51:38,697][21195] Updated weights for policy 0, policy_version 28450 (0.0009) +[2023-10-08 16:51:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 58064896. Throughput: 0: 1740.5, 1: 1712.2. Samples: 14524134. Policy #0 lag: (min: 15.0, avg: 23.0, max: 47.0) +[2023-10-08 16:51:38,803][19739] Avg episode reward: [(0, '652.330'), (1, '716.620')] +[2023-10-08 16:51:39,075][21195] Updated weights for policy 0, policy_version 28460 (0.0009) +[2023-10-08 16:51:39,439][21195] Updated weights for policy 0, policy_version 28470 (0.0009) +[2023-10-08 16:51:39,821][21195] Updated weights for policy 0, policy_version 28480 (0.0007) +[2023-10-08 16:51:40,982][21194] Updated weights for policy 1, policy_version 28260 (0.0009) +[2023-10-08 16:51:41,350][21194] Updated weights for policy 1, policy_version 28270 (0.0007) +[2023-10-08 16:51:41,713][21194] Updated weights for policy 1, policy_version 28280 (0.0007) +[2023-10-08 16:51:43,576][21195] Updated weights for policy 0, policy_version 28490 (0.0008) +[2023-10-08 16:51:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 58130432. Throughput: 0: 1760.4, 1: 1705.6. Samples: 14545368. Policy #0 lag: (min: 15.0, avg: 23.0, max: 47.0) +[2023-10-08 16:51:43,803][19739] Avg episode reward: [(0, '652.330'), (1, '716.620')] +[2023-10-08 16:51:43,959][21195] Updated weights for policy 0, policy_version 28500 (0.0009) +[2023-10-08 16:51:44,322][21195] Updated weights for policy 0, policy_version 28510 (0.0008) +[2023-10-08 16:51:45,728][21194] Updated weights for policy 1, policy_version 28290 (0.0009) +[2023-10-08 16:51:46,085][21194] Updated weights for policy 1, policy_version 28300 (0.0007) +[2023-10-08 16:51:46,445][21194] Updated weights for policy 1, policy_version 28310 (0.0007) +[2023-10-08 16:51:46,810][21194] Updated weights for policy 1, policy_version 28320 (0.0007) +[2023-10-08 16:51:48,099][21195] Updated weights for policy 0, policy_version 28520 (0.0008) +[2023-10-08 16:51:48,480][21195] Updated weights for policy 0, policy_version 28530 (0.0009) +[2023-10-08 16:51:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 58195968. Throughput: 0: 1733.4, 1: 1732.3. Samples: 14560730. Policy #0 lag: (min: 15.0, avg: 23.0, max: 47.0) +[2023-10-08 16:51:48,803][19739] Avg episode reward: [(0, '652.330'), (1, '716.620')] +[2023-10-08 16:51:48,846][21195] Updated weights for policy 0, policy_version 28540 (0.0008) +[2023-10-08 16:51:50,772][21194] Updated weights for policy 1, policy_version 28330 (0.0008) +[2023-10-08 16:51:51,136][21194] Updated weights for policy 1, policy_version 28340 (0.0008) +[2023-10-08 16:51:51,506][21194] Updated weights for policy 1, policy_version 28350 (0.0009) +[2023-10-08 16:51:52,733][21195] Updated weights for policy 0, policy_version 28550 (0.0008) +[2023-10-08 16:51:53,096][21195] Updated weights for policy 0, policy_version 28560 (0.0007) +[2023-10-08 16:51:53,471][21195] Updated weights for policy 0, policy_version 28570 (0.0007) +[2023-10-08 16:51:53,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 58294272. Throughput: 0: 1760.4, 1: 1706.9. Samples: 14576408. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:51:53,803][19739] Avg episode reward: [(0, '660.320'), (1, '716.620')] +[2023-10-08 16:51:55,567][21194] Updated weights for policy 1, policy_version 28360 (0.0010) +[2023-10-08 16:51:55,933][21194] Updated weights for policy 1, policy_version 28370 (0.0008) +[2023-10-08 16:51:56,295][21194] Updated weights for policy 1, policy_version 28380 (0.0007) +[2023-10-08 16:51:57,369][21195] Updated weights for policy 0, policy_version 28580 (0.0008) +[2023-10-08 16:51:57,737][21195] Updated weights for policy 0, policy_version 28590 (0.0007) +[2023-10-08 16:51:58,104][21195] Updated weights for policy 0, policy_version 28600 (0.0007) +[2023-10-08 16:51:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 58359808. Throughput: 0: 1732.1, 1: 1725.7. Samples: 14597146. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:51:58,803][19739] Avg episode reward: [(0, '673.670'), (1, '716.620')] +[2023-10-08 16:52:00,185][21194] Updated weights for policy 1, policy_version 28390 (0.0008) +[2023-10-08 16:52:00,549][21194] Updated weights for policy 1, policy_version 28400 (0.0009) +[2023-10-08 16:52:00,923][21194] Updated weights for policy 1, policy_version 28410 (0.0008) +[2023-10-08 16:52:02,015][21195] Updated weights for policy 0, policy_version 28610 (0.0008) +[2023-10-08 16:52:02,384][21195] Updated weights for policy 0, policy_version 28620 (0.0008) +[2023-10-08 16:52:02,742][21195] Updated weights for policy 0, policy_version 28630 (0.0008) +[2023-10-08 16:52:03,113][21195] Updated weights for policy 0, policy_version 28640 (0.0009) +[2023-10-08 16:52:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 58425344. Throughput: 0: 1716.7, 1: 1707.8. Samples: 14611956. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:03,804][19739] Avg episode reward: [(0, '673.300'), (1, '716.620')] +[2023-10-08 16:52:04,803][21194] Updated weights for policy 1, policy_version 28420 (0.0009) +[2023-10-08 16:52:05,175][21194] Updated weights for policy 1, policy_version 28430 (0.0009) +[2023-10-08 16:52:05,543][21194] Updated weights for policy 1, policy_version 28440 (0.0009) +[2023-10-08 16:52:06,984][21195] Updated weights for policy 0, policy_version 28650 (0.0009) +[2023-10-08 16:52:07,350][21195] Updated weights for policy 0, policy_version 28660 (0.0012) +[2023-10-08 16:52:07,721][21195] Updated weights for policy 0, policy_version 28670 (0.0009) +[2023-10-08 16:52:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 58490880. Throughput: 0: 1743.4, 1: 1712.0. Samples: 14628434. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:08,803][19739] Avg episode reward: [(0, '673.300'), (1, '716.620')] +[2023-10-08 16:52:09,485][21194] Updated weights for policy 1, policy_version 28450 (0.0008) +[2023-10-08 16:52:09,850][21194] Updated weights for policy 1, policy_version 28460 (0.0010) +[2023-10-08 16:52:10,212][21194] Updated weights for policy 1, policy_version 28470 (0.0007) +[2023-10-08 16:52:10,580][21194] Updated weights for policy 1, policy_version 28480 (0.0010) +[2023-10-08 16:52:11,795][21195] Updated weights for policy 0, policy_version 28680 (0.0008) +[2023-10-08 16:52:12,167][21195] Updated weights for policy 0, policy_version 28690 (0.0009) +[2023-10-08 16:52:12,532][21195] Updated weights for policy 0, policy_version 28700 (0.0008) +[2023-10-08 16:52:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 58556416. Throughput: 0: 1710.2, 1: 1744.4. Samples: 14648650. Policy #0 lag: (min: 31.0, avg: 35.4, max: 63.0) +[2023-10-08 16:52:13,803][19739] Avg episode reward: [(0, '674.550'), (1, '716.620')] +[2023-10-08 16:52:14,411][21194] Updated weights for policy 1, policy_version 28490 (0.0009) +[2023-10-08 16:52:14,768][21194] Updated weights for policy 1, policy_version 28500 (0.0008) +[2023-10-08 16:52:15,129][21194] Updated weights for policy 1, policy_version 28510 (0.0009) +[2023-10-08 16:52:16,416][21195] Updated weights for policy 0, policy_version 28710 (0.0009) +[2023-10-08 16:52:16,786][21195] Updated weights for policy 0, policy_version 28720 (0.0008) +[2023-10-08 16:52:17,158][21195] Updated weights for policy 0, policy_version 28730 (0.0007) +[2023-10-08 16:52:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 58621952. Throughput: 0: 1718.1, 1: 1713.9. Samples: 14664074. Policy #0 lag: (min: 31.0, avg: 35.4, max: 63.0) +[2023-10-08 16:52:18,803][19739] Avg episode reward: [(0, '674.550'), (1, '729.810')] +[2023-10-08 16:52:19,211][21194] Updated weights for policy 1, policy_version 28520 (0.0007) +[2023-10-08 16:52:19,586][21194] Updated weights for policy 1, policy_version 28530 (0.0008) +[2023-10-08 16:52:19,955][21194] Updated weights for policy 1, policy_version 28540 (0.0011) +[2023-10-08 16:52:21,111][21195] Updated weights for policy 0, policy_version 28740 (0.0009) +[2023-10-08 16:52:21,482][21195] Updated weights for policy 0, policy_version 28750 (0.0008) +[2023-10-08 16:52:21,852][21195] Updated weights for policy 0, policy_version 28760 (0.0010) +[2023-10-08 16:52:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 58687488. Throughput: 0: 1731.6, 1: 1729.2. Samples: 14679872. Policy #0 lag: (min: 31.0, avg: 35.4, max: 63.0) +[2023-10-08 16:52:23,803][19739] Avg episode reward: [(0, '675.640'), (1, '736.900')] +[2023-10-08 16:52:23,944][21194] Updated weights for policy 1, policy_version 28550 (0.0008) +[2023-10-08 16:52:24,324][21194] Updated weights for policy 1, policy_version 28560 (0.0007) +[2023-10-08 16:52:24,700][21194] Updated weights for policy 1, policy_version 28570 (0.0007) +[2023-10-08 16:52:25,676][21195] Updated weights for policy 0, policy_version 28770 (0.0008) +[2023-10-08 16:52:26,051][21195] Updated weights for policy 0, policy_version 28780 (0.0009) +[2023-10-08 16:52:26,426][21195] Updated weights for policy 0, policy_version 28790 (0.0009) +[2023-10-08 16:52:26,800][21195] Updated weights for policy 0, policy_version 28800 (0.0009) +[2023-10-08 16:52:28,547][21194] Updated weights for policy 1, policy_version 28580 (0.0009) +[2023-10-08 16:52:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 58753024. Throughput: 0: 1717.4, 1: 1736.5. Samples: 14700792. Policy #0 lag: (min: 31.0, avg: 35.4, max: 63.0) +[2023-10-08 16:52:28,803][19739] Avg episode reward: [(0, '675.640'), (1, '736.900')] +[2023-10-08 16:52:28,914][21194] Updated weights for policy 1, policy_version 28590 (0.0009) +[2023-10-08 16:52:29,293][21194] Updated weights for policy 1, policy_version 28600 (0.0010) +[2023-10-08 16:52:30,781][21195] Updated weights for policy 0, policy_version 28810 (0.0007) +[2023-10-08 16:52:31,144][21195] Updated weights for policy 0, policy_version 28820 (0.0008) +[2023-10-08 16:52:31,513][21195] Updated weights for policy 0, policy_version 28830 (0.0009) +[2023-10-08 16:52:33,324][21194] Updated weights for policy 1, policy_version 28610 (0.0010) +[2023-10-08 16:52:33,690][21194] Updated weights for policy 1, policy_version 28620 (0.0007) +[2023-10-08 16:52:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 58818560. Throughput: 0: 1741.7, 1: 1710.6. Samples: 14716084. Policy #0 lag: (min: 31.0, avg: 35.4, max: 63.0) +[2023-10-08 16:52:33,803][19739] Avg episode reward: [(0, '675.710'), (1, '736.900')] +[2023-10-08 16:52:34,061][21194] Updated weights for policy 1, policy_version 28630 (0.0008) +[2023-10-08 16:52:34,427][21194] Updated weights for policy 1, policy_version 28640 (0.0007) +[2023-10-08 16:52:35,485][21195] Updated weights for policy 0, policy_version 28840 (0.0008) +[2023-10-08 16:52:35,867][21195] Updated weights for policy 0, policy_version 28850 (0.0009) +[2023-10-08 16:52:36,236][21195] Updated weights for policy 0, policy_version 28860 (0.0010) +[2023-10-08 16:52:38,235][21194] Updated weights for policy 1, policy_version 28650 (0.0008) +[2023-10-08 16:52:38,614][21194] Updated weights for policy 1, policy_version 28660 (0.0007) +[2023-10-08 16:52:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 58884096. Throughput: 0: 1713.5, 1: 1739.0. Samples: 14731768. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:38,803][19739] Avg episode reward: [(0, '675.710'), (1, '736.990')] +[2023-10-08 16:52:38,982][21194] Updated weights for policy 1, policy_version 28670 (0.0009) +[2023-10-08 16:52:39,972][21195] Updated weights for policy 0, policy_version 28870 (0.0008) +[2023-10-08 16:52:40,338][21195] Updated weights for policy 0, policy_version 28880 (0.0009) +[2023-10-08 16:52:40,707][21195] Updated weights for policy 0, policy_version 28890 (0.0008) +[2023-10-08 16:52:42,805][21194] Updated weights for policy 1, policy_version 28680 (0.0007) +[2023-10-08 16:52:43,171][21194] Updated weights for policy 1, policy_version 28690 (0.0007) +[2023-10-08 16:52:43,544][21194] Updated weights for policy 1, policy_version 28700 (0.0008) +[2023-10-08 16:52:43,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 58982400. Throughput: 0: 1731.9, 1: 1726.7. Samples: 14752782. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:43,804][19739] Avg episode reward: [(0, '710.340'), (1, '736.990')] +[2023-10-08 16:52:43,813][20740] Saving new best policy, reward=710.340! +[2023-10-08 16:52:44,503][21195] Updated weights for policy 0, policy_version 28900 (0.0009) +[2023-10-08 16:52:44,873][21195] Updated weights for policy 0, policy_version 28910 (0.0009) +[2023-10-08 16:52:45,247][21195] Updated weights for policy 0, policy_version 28920 (0.0008) +[2023-10-08 16:52:47,649][21194] Updated weights for policy 1, policy_version 28710 (0.0009) +[2023-10-08 16:52:48,012][21194] Updated weights for policy 1, policy_version 28720 (0.0008) +[2023-10-08 16:52:48,383][21194] Updated weights for policy 1, policy_version 28730 (0.0010) +[2023-10-08 16:52:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 59047936. Throughput: 0: 1753.7, 1: 1736.5. Samples: 14769018. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:48,803][19739] Avg episode reward: [(0, '719.610'), (1, '751.780')] +[2023-10-08 16:52:48,804][20740] Saving new best policy, reward=719.610! +[2023-10-08 16:52:49,221][21195] Updated weights for policy 0, policy_version 28930 (0.0008) +[2023-10-08 16:52:49,592][21195] Updated weights for policy 0, policy_version 28940 (0.0007) +[2023-10-08 16:52:49,959][21195] Updated weights for policy 0, policy_version 28950 (0.0007) +[2023-10-08 16:52:50,336][21195] Updated weights for policy 0, policy_version 28960 (0.0007) +[2023-10-08 16:52:52,364][21194] Updated weights for policy 1, policy_version 28740 (0.0008) +[2023-10-08 16:52:52,723][21194] Updated weights for policy 1, policy_version 28750 (0.0010) +[2023-10-08 16:52:53,086][21194] Updated weights for policy 1, policy_version 28760 (0.0010) +[2023-10-08 16:52:53,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 59113472. Throughput: 0: 1726.9, 1: 1736.7. Samples: 14784298. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:53,804][19739] Avg episode reward: [(0, '719.610'), (1, '751.780')] +[2023-10-08 16:52:54,194][21195] Updated weights for policy 0, policy_version 28970 (0.0009) +[2023-10-08 16:52:54,563][21195] Updated weights for policy 0, policy_version 28980 (0.0007) +[2023-10-08 16:52:54,938][21195] Updated weights for policy 0, policy_version 28990 (0.0007) +[2023-10-08 16:52:56,996][21194] Updated weights for policy 1, policy_version 28770 (0.0009) +[2023-10-08 16:52:57,360][21194] Updated weights for policy 1, policy_version 28780 (0.0011) +[2023-10-08 16:52:57,719][21194] Updated weights for policy 1, policy_version 28790 (0.0009) +[2023-10-08 16:52:58,086][21194] Updated weights for policy 1, policy_version 28800 (0.0010) +[2023-10-08 16:52:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 59179008. Throughput: 0: 1757.8, 1: 1707.8. Samples: 14804602. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 16:52:58,803][19739] Avg episode reward: [(0, '719.610'), (1, '751.780')] +[2023-10-08 16:52:58,825][21195] Updated weights for policy 0, policy_version 29000 (0.0009) +[2023-10-08 16:52:59,200][21195] Updated weights for policy 0, policy_version 29010 (0.0007) +[2023-10-08 16:52:59,568][21195] Updated weights for policy 0, policy_version 29020 (0.0009) +[2023-10-08 16:53:01,968][21194] Updated weights for policy 1, policy_version 28810 (0.0011) +[2023-10-08 16:53:02,334][21194] Updated weights for policy 1, policy_version 28820 (0.0011) +[2023-10-08 16:53:02,703][21194] Updated weights for policy 1, policy_version 28830 (0.0010) +[2023-10-08 16:53:03,460][21195] Updated weights for policy 0, policy_version 29030 (0.0008) +[2023-10-08 16:53:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 59244544. Throughput: 0: 1738.1, 1: 1735.2. Samples: 14820374. Policy #0 lag: (min: 31.0, avg: 45.3, max: 63.0) +[2023-10-08 16:53:03,803][19739] Avg episode reward: [(0, '719.320'), (1, '751.780')] +[2023-10-08 16:53:03,838][21195] Updated weights for policy 0, policy_version 29040 (0.0010) +[2023-10-08 16:53:04,196][21195] Updated weights for policy 0, policy_version 29050 (0.0009) +[2023-10-08 16:53:06,769][21194] Updated weights for policy 1, policy_version 28840 (0.0009) +[2023-10-08 16:53:07,129][21194] Updated weights for policy 1, policy_version 28850 (0.0009) +[2023-10-08 16:53:07,497][21194] Updated weights for policy 1, policy_version 28860 (0.0009) +[2023-10-08 16:53:08,259][21195] Updated weights for policy 0, policy_version 29060 (0.0009) +[2023-10-08 16:53:08,622][21195] Updated weights for policy 0, policy_version 29070 (0.0007) +[2023-10-08 16:53:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 59310080. Throughput: 0: 1739.6, 1: 1724.5. Samples: 14835760. Policy #0 lag: (min: 31.0, avg: 45.3, max: 63.0) +[2023-10-08 16:53:08,803][19739] Avg episode reward: [(0, '719.320'), (1, '762.070')] +[2023-10-08 16:53:08,804][20836] Saving new best policy, reward=762.070! +[2023-10-08 16:53:08,997][21195] Updated weights for policy 0, policy_version 29080 (0.0008) +[2023-10-08 16:53:11,528][21194] Updated weights for policy 1, policy_version 28870 (0.0008) +[2023-10-08 16:53:11,909][21194] Updated weights for policy 1, policy_version 28880 (0.0008) +[2023-10-08 16:53:12,272][21194] Updated weights for policy 1, policy_version 28890 (0.0008) +[2023-10-08 16:53:12,901][21195] Updated weights for policy 0, policy_version 29090 (0.0009) +[2023-10-08 16:53:13,272][21195] Updated weights for policy 0, policy_version 29100 (0.0010) +[2023-10-08 16:53:13,646][21195] Updated weights for policy 0, policy_version 29110 (0.0011) +[2023-10-08 16:53:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 59375616. Throughput: 0: 1757.5, 1: 1706.5. Samples: 14856674. Policy #0 lag: (min: 31.0, avg: 45.3, max: 63.0) +[2023-10-08 16:53:13,803][19739] Avg episode reward: [(0, '719.320'), (1, '768.460')] +[2023-10-08 16:53:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000028896_29589504.pth... +[2023-10-08 16:53:13,844][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000027296_27951104.pth +[2023-10-08 16:53:13,850][20836] Saving new best policy, reward=768.460! +[2023-10-08 16:53:14,015][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000029120_29818880.pth... +[2023-10-08 16:53:14,019][21195] Updated weights for policy 0, policy_version 29120 (0.0009) +[2023-10-08 16:53:14,045][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000027488_28147712.pth +[2023-10-08 16:53:16,237][21194] Updated weights for policy 1, policy_version 28900 (0.0008) +[2023-10-08 16:53:16,603][21194] Updated weights for policy 1, policy_version 28910 (0.0009) +[2023-10-08 16:53:16,982][21194] Updated weights for policy 1, policy_version 28920 (0.0009) +[2023-10-08 16:53:17,976][21195] Updated weights for policy 0, policy_version 29130 (0.0007) +[2023-10-08 16:53:18,336][21195] Updated weights for policy 0, policy_version 29140 (0.0008) +[2023-10-08 16:53:18,709][21195] Updated weights for policy 0, policy_version 29150 (0.0009) +[2023-10-08 16:53:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 59473920. Throughput: 0: 1724.0, 1: 1738.6. Samples: 14871898. Policy #0 lag: (min: 31.0, avg: 45.3, max: 63.0) +[2023-10-08 16:53:18,803][19739] Avg episode reward: [(0, '719.320'), (1, '783.270')] +[2023-10-08 16:53:18,804][20836] Saving new best policy, reward=783.270! +[2023-10-08 16:53:20,889][21194] Updated weights for policy 1, policy_version 28930 (0.0009) +[2023-10-08 16:53:21,256][21194] Updated weights for policy 1, policy_version 28940 (0.0008) +[2023-10-08 16:53:21,635][21194] Updated weights for policy 1, policy_version 28950 (0.0008) +[2023-10-08 16:53:21,999][21194] Updated weights for policy 1, policy_version 28960 (0.0008) +[2023-10-08 16:53:22,675][21195] Updated weights for policy 0, policy_version 29160 (0.0009) +[2023-10-08 16:53:23,052][21195] Updated weights for policy 0, policy_version 29170 (0.0010) +[2023-10-08 16:53:23,416][21195] Updated weights for policy 0, policy_version 29180 (0.0011) +[2023-10-08 16:53:23,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 59539456. Throughput: 0: 1750.7, 1: 1702.3. Samples: 14887154. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:53:23,803][19739] Avg episode reward: [(0, '719.320'), (1, '783.270')] +[2023-10-08 16:53:25,941][21194] Updated weights for policy 1, policy_version 28970 (0.0008) +[2023-10-08 16:53:26,307][21194] Updated weights for policy 1, policy_version 28980 (0.0008) +[2023-10-08 16:53:26,679][21194] Updated weights for policy 1, policy_version 28990 (0.0007) +[2023-10-08 16:53:27,432][21195] Updated weights for policy 0, policy_version 29190 (0.0008) +[2023-10-08 16:53:27,800][21195] Updated weights for policy 0, policy_version 29200 (0.0010) +[2023-10-08 16:53:28,174][21195] Updated weights for policy 0, policy_version 29210 (0.0011) +[2023-10-08 16:53:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 59604992. Throughput: 0: 1730.1, 1: 1715.5. Samples: 14907834. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:53:28,803][19739] Avg episode reward: [(0, '719.320'), (1, '783.270')] +[2023-10-08 16:53:30,586][21194] Updated weights for policy 1, policy_version 29000 (0.0007) +[2023-10-08 16:53:30,954][21194] Updated weights for policy 1, policy_version 29010 (0.0007) +[2023-10-08 16:53:31,315][21194] Updated weights for policy 1, policy_version 29020 (0.0011) +[2023-10-08 16:53:32,011][21195] Updated weights for policy 0, policy_version 29220 (0.0008) +[2023-10-08 16:53:32,376][21195] Updated weights for policy 0, policy_version 29230 (0.0007) +[2023-10-08 16:53:32,753][21195] Updated weights for policy 0, policy_version 29240 (0.0009) +[2023-10-08 16:53:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 59670528. Throughput: 0: 1710.9, 1: 1712.8. Samples: 14923084. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:53:33,803][19739] Avg episode reward: [(0, '734.100'), (1, '779.470')] +[2023-10-08 16:53:33,804][20740] Saving new best policy, reward=734.100! +[2023-10-08 16:53:35,293][21194] Updated weights for policy 1, policy_version 29030 (0.0011) +[2023-10-08 16:53:35,652][21194] Updated weights for policy 1, policy_version 29040 (0.0010) +[2023-10-08 16:53:36,034][21194] Updated weights for policy 1, policy_version 29050 (0.0011) +[2023-10-08 16:53:36,579][21195] Updated weights for policy 0, policy_version 29250 (0.0009) +[2023-10-08 16:53:36,954][21195] Updated weights for policy 0, policy_version 29260 (0.0007) +[2023-10-08 16:53:37,332][21195] Updated weights for policy 0, policy_version 29270 (0.0009) +[2023-10-08 16:53:37,701][21195] Updated weights for policy 0, policy_version 29280 (0.0008) +[2023-10-08 16:53:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 59736064. Throughput: 0: 1738.8, 1: 1699.7. Samples: 14939032. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:53:38,803][19739] Avg episode reward: [(0, '734.100'), (1, '788.720')] +[2023-10-08 16:53:38,804][20836] Saving new best policy, reward=788.720! +[2023-10-08 16:53:39,942][21194] Updated weights for policy 1, policy_version 29060 (0.0008) +[2023-10-08 16:53:40,306][21194] Updated weights for policy 1, policy_version 29070 (0.0007) +[2023-10-08 16:53:40,674][21194] Updated weights for policy 1, policy_version 29080 (0.0011) +[2023-10-08 16:53:41,431][21195] Updated weights for policy 0, policy_version 29290 (0.0009) +[2023-10-08 16:53:41,797][21195] Updated weights for policy 0, policy_version 29300 (0.0010) +[2023-10-08 16:53:42,163][21195] Updated weights for policy 0, policy_version 29310 (0.0009) +[2023-10-08 16:53:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 59801600. Throughput: 0: 1720.3, 1: 1729.6. Samples: 14959850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:53:43,803][19739] Avg episode reward: [(0, '734.100'), (1, '788.720')] +[2023-10-08 16:53:44,494][21194] Updated weights for policy 1, policy_version 29090 (0.0008) +[2023-10-08 16:53:44,860][21194] Updated weights for policy 1, policy_version 29100 (0.0007) +[2023-10-08 16:53:45,227][21194] Updated weights for policy 1, policy_version 29110 (0.0009) +[2023-10-08 16:53:45,587][21194] Updated weights for policy 1, policy_version 29120 (0.0010) +[2023-10-08 16:53:46,076][21195] Updated weights for policy 0, policy_version 29320 (0.0007) +[2023-10-08 16:53:46,440][21195] Updated weights for policy 0, policy_version 29330 (0.0007) +[2023-10-08 16:53:46,811][21195] Updated weights for policy 0, policy_version 29340 (0.0007) +[2023-10-08 16:53:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 59867136. Throughput: 0: 1737.9, 1: 1707.5. Samples: 14975416. Policy #0 lag: (min: 31.0, avg: 35.3, max: 63.0) +[2023-10-08 16:53:48,803][19739] Avg episode reward: [(0, '723.280'), (1, '788.720')] +[2023-10-08 16:53:49,561][21194] Updated weights for policy 1, policy_version 29130 (0.0012) +[2023-10-08 16:53:49,933][21194] Updated weights for policy 1, policy_version 29140 (0.0010) +[2023-10-08 16:53:50,292][21194] Updated weights for policy 1, policy_version 29150 (0.0010) +[2023-10-08 16:53:50,662][21195] Updated weights for policy 0, policy_version 29350 (0.0008) +[2023-10-08 16:53:51,036][21195] Updated weights for policy 0, policy_version 29360 (0.0010) +[2023-10-08 16:53:51,394][21195] Updated weights for policy 0, policy_version 29370 (0.0008) +[2023-10-08 16:53:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 59932672. Throughput: 0: 1722.8, 1: 1721.0. Samples: 14990728. Policy #0 lag: (min: 31.0, avg: 35.3, max: 63.0) +[2023-10-08 16:53:53,803][19739] Avg episode reward: [(0, '736.160'), (1, '818.740')] +[2023-10-08 16:53:53,804][20836] Saving new best policy, reward=818.740! +[2023-10-08 16:53:53,804][20740] Saving new best policy, reward=736.160! +[2023-10-08 16:53:54,384][21194] Updated weights for policy 1, policy_version 29160 (0.0008) +[2023-10-08 16:53:54,749][21194] Updated weights for policy 1, policy_version 29170 (0.0009) +[2023-10-08 16:53:55,110][21194] Updated weights for policy 1, policy_version 29180 (0.0008) +[2023-10-08 16:53:55,219][21195] Updated weights for policy 0, policy_version 29380 (0.0007) +[2023-10-08 16:53:55,589][21195] Updated weights for policy 0, policy_version 29390 (0.0010) +[2023-10-08 16:53:55,958][21195] Updated weights for policy 0, policy_version 29400 (0.0010) +[2023-10-08 16:53:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 59998208. Throughput: 0: 1724.1, 1: 1734.8. Samples: 15012322. Policy #0 lag: (min: 31.0, avg: 35.3, max: 63.0) +[2023-10-08 16:53:58,803][19739] Avg episode reward: [(0, '736.160'), (1, '818.740')] +[2023-10-08 16:53:59,211][21194] Updated weights for policy 1, policy_version 29190 (0.0011) +[2023-10-08 16:53:59,599][21194] Updated weights for policy 1, policy_version 29200 (0.0009) +[2023-10-08 16:53:59,819][21195] Updated weights for policy 0, policy_version 29410 (0.0010) +[2023-10-08 16:53:59,974][21194] Updated weights for policy 1, policy_version 29210 (0.0009) +[2023-10-08 16:54:00,188][21195] Updated weights for policy 0, policy_version 29420 (0.0007) +[2023-10-08 16:54:00,555][21195] Updated weights for policy 0, policy_version 29430 (0.0008) +[2023-10-08 16:54:00,923][21195] Updated weights for policy 0, policy_version 29440 (0.0008) +[2023-10-08 16:54:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 60063744. Throughput: 0: 1759.5, 1: 1697.5. Samples: 15027462. Policy #0 lag: (min: 31.0, avg: 35.3, max: 63.0) +[2023-10-08 16:54:03,803][19739] Avg episode reward: [(0, '736.160'), (1, '849.050')] +[2023-10-08 16:54:03,804][20836] Saving new best policy, reward=849.050! +[2023-10-08 16:54:04,075][21194] Updated weights for policy 1, policy_version 29220 (0.0008) +[2023-10-08 16:54:04,442][21194] Updated weights for policy 1, policy_version 29230 (0.0007) +[2023-10-08 16:54:04,808][21195] Updated weights for policy 0, policy_version 29450 (0.0007) +[2023-10-08 16:54:04,811][21194] Updated weights for policy 1, policy_version 29240 (0.0009) +[2023-10-08 16:54:05,183][21195] Updated weights for policy 0, policy_version 29460 (0.0007) +[2023-10-08 16:54:05,545][21195] Updated weights for policy 0, policy_version 29470 (0.0008) +[2023-10-08 16:54:08,778][21194] Updated weights for policy 1, policy_version 29250 (0.0008) +[2023-10-08 16:54:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 60129280. Throughput: 0: 1736.1, 1: 1727.6. Samples: 15043020. Policy #0 lag: (min: 31.0, avg: 35.3, max: 63.0) +[2023-10-08 16:54:08,803][19739] Avg episode reward: [(0, '736.160'), (1, '849.050')] +[2023-10-08 16:54:09,133][21194] Updated weights for policy 1, policy_version 29260 (0.0007) +[2023-10-08 16:54:09,343][21195] Updated weights for policy 0, policy_version 29480 (0.0009) +[2023-10-08 16:54:09,505][21194] Updated weights for policy 1, policy_version 29270 (0.0007) +[2023-10-08 16:54:09,715][21195] Updated weights for policy 0, policy_version 29490 (0.0009) +[2023-10-08 16:54:09,867][21194] Updated weights for policy 1, policy_version 29280 (0.0007) +[2023-10-08 16:54:10,078][21195] Updated weights for policy 0, policy_version 29500 (0.0008) +[2023-10-08 16:54:13,711][21194] Updated weights for policy 1, policy_version 29290 (0.0011) +[2023-10-08 16:54:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 60194816. Throughput: 0: 1755.6, 1: 1723.8. Samples: 15064408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:54:13,803][19739] Avg episode reward: [(0, '736.160'), (1, '849.050')] +[2023-10-08 16:54:13,952][21195] Updated weights for policy 0, policy_version 29510 (0.0010) +[2023-10-08 16:54:14,086][21194] Updated weights for policy 1, policy_version 29300 (0.0009) +[2023-10-08 16:54:14,321][21195] Updated weights for policy 0, policy_version 29520 (0.0007) +[2023-10-08 16:54:14,444][21194] Updated weights for policy 1, policy_version 29310 (0.0008) +[2023-10-08 16:54:14,683][21195] Updated weights for policy 0, policy_version 29530 (0.0007) +[2023-10-08 16:54:18,396][21194] Updated weights for policy 1, policy_version 29320 (0.0009) +[2023-10-08 16:54:18,731][21195] Updated weights for policy 0, policy_version 29540 (0.0009) +[2023-10-08 16:54:18,759][21194] Updated weights for policy 1, policy_version 29330 (0.0009) +[2023-10-08 16:54:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 60260352. Throughput: 0: 1762.5, 1: 1714.7. Samples: 15079560. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:54:18,803][19739] Avg episode reward: [(0, '736.160'), (1, '849.050')] +[2023-10-08 16:54:19,113][21195] Updated weights for policy 0, policy_version 29550 (0.0008) +[2023-10-08 16:54:19,127][21194] Updated weights for policy 1, policy_version 29340 (0.0008) +[2023-10-08 16:54:19,478][21195] Updated weights for policy 0, policy_version 29560 (0.0007) +[2023-10-08 16:54:23,111][21194] Updated weights for policy 1, policy_version 29350 (0.0009) +[2023-10-08 16:54:23,419][21195] Updated weights for policy 0, policy_version 29570 (0.0007) +[2023-10-08 16:54:23,463][21194] Updated weights for policy 1, policy_version 29360 (0.0009) +[2023-10-08 16:54:23,794][21195] Updated weights for policy 0, policy_version 29580 (0.0008) +[2023-10-08 16:54:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 60325888. Throughput: 0: 1741.2, 1: 1729.8. Samples: 15095224. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:54:23,803][19739] Avg episode reward: [(0, '736.160'), (1, '849.050')] +[2023-10-08 16:54:23,826][21194] Updated weights for policy 1, policy_version 29370 (0.0008) +[2023-10-08 16:54:24,165][21195] Updated weights for policy 0, policy_version 29590 (0.0009) +[2023-10-08 16:54:24,540][21195] Updated weights for policy 0, policy_version 29600 (0.0010) +[2023-10-08 16:54:27,865][21194] Updated weights for policy 1, policy_version 29380 (0.0008) +[2023-10-08 16:54:28,235][21194] Updated weights for policy 1, policy_version 29390 (0.0007) +[2023-10-08 16:54:28,373][21195] Updated weights for policy 0, policy_version 29610 (0.0007) +[2023-10-08 16:54:28,594][21194] Updated weights for policy 1, policy_version 29400 (0.0008) +[2023-10-08 16:54:28,731][21195] Updated weights for policy 0, policy_version 29620 (0.0009) +[2023-10-08 16:54:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 60391424. Throughput: 0: 1762.1, 1: 1712.7. Samples: 15116214. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:54:28,803][19739] Avg episode reward: [(0, '736.160'), (1, '863.930')] +[2023-10-08 16:54:28,882][20836] Saving new best policy, reward=863.930! +[2023-10-08 16:54:29,103][21195] Updated weights for policy 0, policy_version 29630 (0.0009) +[2023-10-08 16:54:32,797][21194] Updated weights for policy 1, policy_version 29410 (0.0008) +[2023-10-08 16:54:33,131][21195] Updated weights for policy 0, policy_version 29640 (0.0009) +[2023-10-08 16:54:33,155][21194] Updated weights for policy 1, policy_version 29420 (0.0007) +[2023-10-08 16:54:33,502][21195] Updated weights for policy 0, policy_version 29650 (0.0009) +[2023-10-08 16:54:33,522][21194] Updated weights for policy 1, policy_version 29430 (0.0007) +[2023-10-08 16:54:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 60456960. Throughput: 0: 1734.0, 1: 1713.6. Samples: 15130556. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:54:33,803][19739] Avg episode reward: [(0, '748.480'), (1, '863.930')] +[2023-10-08 16:54:33,869][21195] Updated weights for policy 0, policy_version 29660 (0.0007) +[2023-10-08 16:54:33,884][21194] Updated weights for policy 1, policy_version 29440 (0.0007) +[2023-10-08 16:54:34,017][20740] Saving new best policy, reward=748.480! +[2023-10-08 16:54:37,703][21194] Updated weights for policy 1, policy_version 29450 (0.0009) +[2023-10-08 16:54:37,940][21195] Updated weights for policy 0, policy_version 29670 (0.0009) +[2023-10-08 16:54:38,066][21194] Updated weights for policy 1, policy_version 29460 (0.0008) +[2023-10-08 16:54:38,313][21195] Updated weights for policy 0, policy_version 29680 (0.0010) +[2023-10-08 16:54:38,433][21194] Updated weights for policy 1, policy_version 29470 (0.0009) +[2023-10-08 16:54:38,679][21195] Updated weights for policy 0, policy_version 29690 (0.0010) +[2023-10-08 16:54:38,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 60555264. Throughput: 0: 1755.8, 1: 1710.8. Samples: 15146726. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 16:54:38,803][19739] Avg episode reward: [(0, '748.480'), (1, '855.750')] +[2023-10-08 16:54:42,300][21194] Updated weights for policy 1, policy_version 29480 (0.0007) +[2023-10-08 16:54:42,652][21195] Updated weights for policy 0, policy_version 29700 (0.0009) +[2023-10-08 16:54:42,667][21194] Updated weights for policy 1, policy_version 29490 (0.0007) +[2023-10-08 16:54:43,024][21195] Updated weights for policy 0, policy_version 29710 (0.0008) +[2023-10-08 16:54:43,028][21194] Updated weights for policy 1, policy_version 29500 (0.0007) +[2023-10-08 16:54:43,396][21195] Updated weights for policy 0, policy_version 29720 (0.0008) +[2023-10-08 16:54:43,803][19739] Fps is (10 sec: 19660.5, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 60653568. Throughput: 0: 1737.8, 1: 1692.7. Samples: 15166698. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 16:54:43,804][19739] Avg episode reward: [(0, '717.080'), (1, '855.750')] +[2023-10-08 16:54:47,174][21194] Updated weights for policy 1, policy_version 29510 (0.0009) +[2023-10-08 16:54:47,396][21195] Updated weights for policy 0, policy_version 29730 (0.0011) +[2023-10-08 16:54:47,552][21194] Updated weights for policy 1, policy_version 29520 (0.0010) +[2023-10-08 16:54:47,758][21195] Updated weights for policy 0, policy_version 29740 (0.0008) +[2023-10-08 16:54:47,917][21194] Updated weights for policy 1, policy_version 29530 (0.0008) +[2023-10-08 16:54:48,126][21195] Updated weights for policy 0, policy_version 29750 (0.0008) +[2023-10-08 16:54:48,489][21195] Updated weights for policy 0, policy_version 29760 (0.0008) +[2023-10-08 16:54:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 60719104. Throughput: 0: 1713.6, 1: 1721.5. Samples: 15182042. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 16:54:48,803][19739] Avg episode reward: [(0, '717.080'), (1, '855.750')] +[2023-10-08 16:54:51,763][21194] Updated weights for policy 1, policy_version 29540 (0.0009) +[2023-10-08 16:54:52,127][21194] Updated weights for policy 1, policy_version 29550 (0.0008) +[2023-10-08 16:54:52,317][21195] Updated weights for policy 0, policy_version 29770 (0.0008) +[2023-10-08 16:54:52,486][21194] Updated weights for policy 1, policy_version 29560 (0.0007) +[2023-10-08 16:54:52,694][21195] Updated weights for policy 0, policy_version 29780 (0.0007) +[2023-10-08 16:54:53,063][21195] Updated weights for policy 0, policy_version 29790 (0.0007) +[2023-10-08 16:54:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 60784640. Throughput: 0: 1740.2, 1: 1711.7. Samples: 15198358. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 16:54:53,803][19739] Avg episode reward: [(0, '717.080'), (1, '860.240')] +[2023-10-08 16:54:56,402][21194] Updated weights for policy 1, policy_version 29570 (0.0009) +[2023-10-08 16:54:56,779][21194] Updated weights for policy 1, policy_version 29580 (0.0008) +[2023-10-08 16:54:56,992][21195] Updated weights for policy 0, policy_version 29800 (0.0007) +[2023-10-08 16:54:57,135][21194] Updated weights for policy 1, policy_version 29590 (0.0009) +[2023-10-08 16:54:57,359][21195] Updated weights for policy 0, policy_version 29810 (0.0008) +[2023-10-08 16:54:57,507][21194] Updated weights for policy 1, policy_version 29600 (0.0008) +[2023-10-08 16:54:57,736][21195] Updated weights for policy 0, policy_version 29820 (0.0009) +[2023-10-08 16:54:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 60850176. Throughput: 0: 1712.6, 1: 1693.4. Samples: 15217680. Policy #0 lag: (min: 1.0, avg: 1.7, max: 16.0) +[2023-10-08 16:54:58,803][19739] Avg episode reward: [(0, '717.080'), (1, '860.240')] +[2023-10-08 16:55:01,485][21195] Updated weights for policy 0, policy_version 29830 (0.0007) +[2023-10-08 16:55:01,605][21194] Updated weights for policy 1, policy_version 29610 (0.0010) +[2023-10-08 16:55:01,854][21195] Updated weights for policy 0, policy_version 29840 (0.0008) +[2023-10-08 16:55:01,976][21194] Updated weights for policy 1, policy_version 29620 (0.0009) +[2023-10-08 16:55:02,217][21195] Updated weights for policy 0, policy_version 29850 (0.0007) +[2023-10-08 16:55:02,350][21194] Updated weights for policy 1, policy_version 29630 (0.0009) +[2023-10-08 16:55:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 60915712. Throughput: 0: 1719.0, 1: 1718.4. Samples: 15234242. Policy #0 lag: (min: 1.0, avg: 1.7, max: 16.0) +[2023-10-08 16:55:03,803][19739] Avg episode reward: [(0, '717.080'), (1, '860.240')] +[2023-10-08 16:55:06,101][21195] Updated weights for policy 0, policy_version 29860 (0.0007) +[2023-10-08 16:55:06,306][21194] Updated weights for policy 1, policy_version 29640 (0.0007) +[2023-10-08 16:55:06,467][21195] Updated weights for policy 0, policy_version 29870 (0.0007) +[2023-10-08 16:55:06,667][21194] Updated weights for policy 1, policy_version 29650 (0.0007) +[2023-10-08 16:55:06,844][21195] Updated weights for policy 0, policy_version 29880 (0.0009) +[2023-10-08 16:55:07,032][21194] Updated weights for policy 1, policy_version 29660 (0.0007) +[2023-10-08 16:55:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 60981248. Throughput: 0: 1722.5, 1: 1690.0. Samples: 15248788. Policy #0 lag: (min: 1.0, avg: 1.7, max: 16.0) +[2023-10-08 16:55:08,803][19739] Avg episode reward: [(0, '725.000'), (1, '861.920')] +[2023-10-08 16:55:10,757][21195] Updated weights for policy 0, policy_version 29890 (0.0009) +[2023-10-08 16:55:10,906][21194] Updated weights for policy 1, policy_version 29670 (0.0008) +[2023-10-08 16:55:11,126][21195] Updated weights for policy 0, policy_version 29900 (0.0009) +[2023-10-08 16:55:11,264][21194] Updated weights for policy 1, policy_version 29680 (0.0009) +[2023-10-08 16:55:11,489][21195] Updated weights for policy 0, policy_version 29910 (0.0007) +[2023-10-08 16:55:11,628][21194] Updated weights for policy 1, policy_version 29690 (0.0008) +[2023-10-08 16:55:11,857][21195] Updated weights for policy 0, policy_version 29920 (0.0008) +[2023-10-08 16:55:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 61046784. Throughput: 0: 1711.4, 1: 1698.3. Samples: 15269648. Policy #0 lag: (min: 1.0, avg: 1.7, max: 16.0) +[2023-10-08 16:55:13,803][19739] Avg episode reward: [(0, '725.000'), (1, '868.060')] +[2023-10-08 16:55:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000029920_30638080.pth... +[2023-10-08 16:55:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000029696_30408704.pth... +[2023-10-08 16:55:13,849][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000028096_28770304.pth +[2023-10-08 16:55:13,853][20836] Saving new best policy, reward=868.060! +[2023-10-08 16:55:13,854][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000028288_28966912.pth +[2023-10-08 16:55:15,536][21194] Updated weights for policy 1, policy_version 29700 (0.0009) +[2023-10-08 16:55:15,651][21195] Updated weights for policy 0, policy_version 29930 (0.0009) +[2023-10-08 16:55:15,909][21194] Updated weights for policy 1, policy_version 29710 (0.0008) +[2023-10-08 16:55:16,021][21195] Updated weights for policy 0, policy_version 29940 (0.0008) +[2023-10-08 16:55:16,280][21194] Updated weights for policy 1, policy_version 29720 (0.0007) +[2023-10-08 16:55:16,402][21195] Updated weights for policy 0, policy_version 29950 (0.0008) +[2023-10-08 16:55:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 61112320. Throughput: 0: 1742.6, 1: 1707.8. Samples: 15285824. Policy #0 lag: (min: 1.0, avg: 1.7, max: 16.0) +[2023-10-08 16:55:18,803][19739] Avg episode reward: [(0, '724.160'), (1, '868.060')] +[2023-10-08 16:55:20,259][21194] Updated weights for policy 1, policy_version 29730 (0.0008) +[2023-10-08 16:55:20,526][21195] Updated weights for policy 0, policy_version 29960 (0.0009) +[2023-10-08 16:55:20,627][21194] Updated weights for policy 1, policy_version 29740 (0.0009) +[2023-10-08 16:55:20,900][21195] Updated weights for policy 0, policy_version 29970 (0.0008) +[2023-10-08 16:55:21,002][21194] Updated weights for policy 1, policy_version 29750 (0.0008) +[2023-10-08 16:55:21,267][21195] Updated weights for policy 0, policy_version 29980 (0.0008) +[2023-10-08 16:55:21,366][21194] Updated weights for policy 1, policy_version 29760 (0.0009) +[2023-10-08 16:55:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 61177856. Throughput: 0: 1719.2, 1: 1696.0. Samples: 15300408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:55:23,803][19739] Avg episode reward: [(0, '724.160'), (1, '868.060')] +[2023-10-08 16:55:25,145][21195] Updated weights for policy 0, policy_version 29990 (0.0009) +[2023-10-08 16:55:25,363][21194] Updated weights for policy 1, policy_version 29770 (0.0010) +[2023-10-08 16:55:25,519][21195] Updated weights for policy 0, policy_version 30000 (0.0008) +[2023-10-08 16:55:25,730][21194] Updated weights for policy 1, policy_version 29780 (0.0007) +[2023-10-08 16:55:25,889][21195] Updated weights for policy 0, policy_version 30010 (0.0008) +[2023-10-08 16:55:26,096][21194] Updated weights for policy 1, policy_version 29790 (0.0007) +[2023-10-08 16:55:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 61243392. Throughput: 0: 1726.5, 1: 1716.9. Samples: 15321648. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:55:28,803][19739] Avg episode reward: [(0, '724.160'), (1, '868.060')] +[2023-10-08 16:55:29,985][21195] Updated weights for policy 0, policy_version 30020 (0.0008) +[2023-10-08 16:55:30,090][21194] Updated weights for policy 1, policy_version 29800 (0.0007) +[2023-10-08 16:55:30,345][21195] Updated weights for policy 0, policy_version 30030 (0.0010) +[2023-10-08 16:55:30,456][21194] Updated weights for policy 1, policy_version 29810 (0.0010) +[2023-10-08 16:55:30,716][21195] Updated weights for policy 0, policy_version 30040 (0.0009) +[2023-10-08 16:55:30,828][21194] Updated weights for policy 1, policy_version 29820 (0.0008) +[2023-10-08 16:55:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 61308928. Throughput: 0: 1745.8, 1: 1698.8. Samples: 15337050. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:55:33,804][19739] Avg episode reward: [(0, '734.940'), (1, '868.060')] +[2023-10-08 16:55:34,608][21195] Updated weights for policy 0, policy_version 30050 (0.0009) +[2023-10-08 16:55:34,837][21194] Updated weights for policy 1, policy_version 29830 (0.0010) +[2023-10-08 16:55:34,989][21195] Updated weights for policy 0, policy_version 30060 (0.0007) +[2023-10-08 16:55:35,215][21194] Updated weights for policy 1, policy_version 29840 (0.0007) +[2023-10-08 16:55:35,352][21195] Updated weights for policy 0, policy_version 30070 (0.0007) +[2023-10-08 16:55:35,581][21194] Updated weights for policy 1, policy_version 29850 (0.0009) +[2023-10-08 16:55:35,723][21195] Updated weights for policy 0, policy_version 30080 (0.0009) +[2023-10-08 16:55:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 61374464. Throughput: 0: 1716.0, 1: 1704.3. Samples: 15352272. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:55:38,803][19739] Avg episode reward: [(0, '720.450'), (1, '868.060')] +[2023-10-08 16:55:39,521][21194] Updated weights for policy 1, policy_version 29860 (0.0008) +[2023-10-08 16:55:39,567][21195] Updated weights for policy 0, policy_version 30090 (0.0008) +[2023-10-08 16:55:39,886][21194] Updated weights for policy 1, policy_version 29870 (0.0007) +[2023-10-08 16:55:39,942][21195] Updated weights for policy 0, policy_version 30100 (0.0007) +[2023-10-08 16:55:40,242][21194] Updated weights for policy 1, policy_version 29880 (0.0008) +[2023-10-08 16:55:40,307][21195] Updated weights for policy 0, policy_version 30110 (0.0007) +[2023-10-08 16:55:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 61440000. Throughput: 0: 1745.8, 1: 1725.4. Samples: 15373884. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:55:43,803][19739] Avg episode reward: [(0, '720.450'), (1, '868.060')] +[2023-10-08 16:55:44,123][21194] Updated weights for policy 1, policy_version 29890 (0.0008) +[2023-10-08 16:55:44,255][21195] Updated weights for policy 0, policy_version 30120 (0.0007) +[2023-10-08 16:55:44,490][21194] Updated weights for policy 1, policy_version 29900 (0.0007) +[2023-10-08 16:55:44,624][21195] Updated weights for policy 0, policy_version 30130 (0.0007) +[2023-10-08 16:55:44,853][21194] Updated weights for policy 1, policy_version 29910 (0.0007) +[2023-10-08 16:55:44,989][21195] Updated weights for policy 0, policy_version 30140 (0.0007) +[2023-10-08 16:55:45,228][21194] Updated weights for policy 1, policy_version 29920 (0.0010) +[2023-10-08 16:55:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 61505536. Throughput: 0: 1741.1, 1: 1700.8. Samples: 15389124. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 16:55:48,803][19739] Avg episode reward: [(0, '720.450'), (1, '868.060')] +[2023-10-08 16:55:48,902][21195] Updated weights for policy 0, policy_version 30150 (0.0008) +[2023-10-08 16:55:49,093][21194] Updated weights for policy 1, policy_version 29930 (0.0009) +[2023-10-08 16:55:49,269][21195] Updated weights for policy 0, policy_version 30160 (0.0008) +[2023-10-08 16:55:49,453][21194] Updated weights for policy 1, policy_version 29940 (0.0009) +[2023-10-08 16:55:49,639][21195] Updated weights for policy 0, policy_version 30170 (0.0008) +[2023-10-08 16:55:49,819][21194] Updated weights for policy 1, policy_version 29950 (0.0009) +[2023-10-08 16:55:53,647][21195] Updated weights for policy 0, policy_version 30180 (0.0008) +[2023-10-08 16:55:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 61571072. Throughput: 0: 1731.2, 1: 1730.2. Samples: 15404550. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 16:55:53,804][19739] Avg episode reward: [(0, '730.440'), (1, '868.060')] +[2023-10-08 16:55:53,895][21194] Updated weights for policy 1, policy_version 29960 (0.0009) +[2023-10-08 16:55:54,024][21195] Updated weights for policy 0, policy_version 30190 (0.0009) +[2023-10-08 16:55:54,265][21194] Updated weights for policy 1, policy_version 29970 (0.0007) +[2023-10-08 16:55:54,381][21195] Updated weights for policy 0, policy_version 30200 (0.0008) +[2023-10-08 16:55:54,630][21194] Updated weights for policy 1, policy_version 29980 (0.0007) +[2023-10-08 16:55:58,345][21195] Updated weights for policy 0, policy_version 30210 (0.0008) +[2023-10-08 16:55:58,595][21194] Updated weights for policy 1, policy_version 29990 (0.0010) +[2023-10-08 16:55:58,713][21195] Updated weights for policy 0, policy_version 30220 (0.0007) +[2023-10-08 16:55:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 61636608. Throughput: 0: 1737.4, 1: 1732.4. Samples: 15425790. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 16:55:58,803][19739] Avg episode reward: [(0, '730.440'), (1, '868.060')] +[2023-10-08 16:55:58,964][21194] Updated weights for policy 1, policy_version 30000 (0.0008) +[2023-10-08 16:55:59,078][21195] Updated weights for policy 0, policy_version 30230 (0.0007) +[2023-10-08 16:55:59,323][21194] Updated weights for policy 1, policy_version 30010 (0.0009) +[2023-10-08 16:55:59,440][21195] Updated weights for policy 0, policy_version 30240 (0.0008) +[2023-10-08 16:56:03,404][21194] Updated weights for policy 1, policy_version 30020 (0.0009) +[2023-10-08 16:56:03,433][21195] Updated weights for policy 0, policy_version 30250 (0.0009) +[2023-10-08 16:56:03,763][21194] Updated weights for policy 1, policy_version 30030 (0.0010) +[2023-10-08 16:56:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 61702144. Throughput: 0: 1716.7, 1: 1717.8. Samples: 15440374. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 16:56:03,803][19739] Avg episode reward: [(0, '730.440'), (1, '868.060')] +[2023-10-08 16:56:03,812][21195] Updated weights for policy 0, policy_version 30260 (0.0008) +[2023-10-08 16:56:04,123][21194] Updated weights for policy 1, policy_version 30040 (0.0010) +[2023-10-08 16:56:04,175][21195] Updated weights for policy 0, policy_version 30270 (0.0007) +[2023-10-08 16:56:08,089][21194] Updated weights for policy 1, policy_version 30050 (0.0010) +[2023-10-08 16:56:08,214][21195] Updated weights for policy 0, policy_version 30280 (0.0009) +[2023-10-08 16:56:08,450][21194] Updated weights for policy 1, policy_version 30060 (0.0008) +[2023-10-08 16:56:08,585][21195] Updated weights for policy 0, policy_version 30290 (0.0008) +[2023-10-08 16:56:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 61767680. Throughput: 0: 1732.8, 1: 1733.5. Samples: 15456392. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 16:56:08,803][19739] Avg episode reward: [(0, '730.480'), (1, '868.060')] +[2023-10-08 16:56:08,817][21194] Updated weights for policy 1, policy_version 30070 (0.0008) +[2023-10-08 16:56:08,952][21195] Updated weights for policy 0, policy_version 30300 (0.0007) +[2023-10-08 16:56:09,179][21194] Updated weights for policy 1, policy_version 30080 (0.0007) +[2023-10-08 16:56:12,844][21195] Updated weights for policy 0, policy_version 30310 (0.0007) +[2023-10-08 16:56:13,084][21194] Updated weights for policy 1, policy_version 30090 (0.0007) +[2023-10-08 16:56:13,232][21195] Updated weights for policy 0, policy_version 30320 (0.0009) +[2023-10-08 16:56:13,452][21194] Updated weights for policy 1, policy_version 30100 (0.0007) +[2023-10-08 16:56:13,594][21195] Updated weights for policy 0, policy_version 30330 (0.0008) +[2023-10-08 16:56:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 61833216. Throughput: 0: 1726.0, 1: 1727.7. Samples: 15477064. Policy #0 lag: (min: 28.0, avg: 35.1, max: 60.0) +[2023-10-08 16:56:13,803][19739] Avg episode reward: [(0, '730.480'), (1, '868.060')] +[2023-10-08 16:56:13,815][21194] Updated weights for policy 1, policy_version 30110 (0.0009) +[2023-10-08 16:56:17,506][21195] Updated weights for policy 0, policy_version 30340 (0.0008) +[2023-10-08 16:56:17,794][21194] Updated weights for policy 1, policy_version 30120 (0.0009) +[2023-10-08 16:56:17,873][21195] Updated weights for policy 0, policy_version 30350 (0.0009) +[2023-10-08 16:56:18,151][21194] Updated weights for policy 1, policy_version 30130 (0.0007) +[2023-10-08 16:56:18,246][21195] Updated weights for policy 0, policy_version 30360 (0.0009) +[2023-10-08 16:56:18,523][21194] Updated weights for policy 1, policy_version 30140 (0.0010) +[2023-10-08 16:56:18,803][19739] Fps is (10 sec: 19660.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 61964288. Throughput: 0: 1701.9, 1: 1733.6. Samples: 15491646. Policy #0 lag: (min: 28.0, avg: 35.1, max: 60.0) +[2023-10-08 16:56:18,804][19739] Avg episode reward: [(0, '730.480'), (1, '868.060')] +[2023-10-08 16:56:22,208][21195] Updated weights for policy 0, policy_version 30370 (0.0009) +[2023-10-08 16:56:22,536][21194] Updated weights for policy 1, policy_version 30150 (0.0010) +[2023-10-08 16:56:22,579][21195] Updated weights for policy 0, policy_version 30380 (0.0009) +[2023-10-08 16:56:22,917][21194] Updated weights for policy 1, policy_version 30160 (0.0008) +[2023-10-08 16:56:22,948][21195] Updated weights for policy 0, policy_version 30390 (0.0008) +[2023-10-08 16:56:23,288][21194] Updated weights for policy 1, policy_version 30170 (0.0008) +[2023-10-08 16:56:23,325][21195] Updated weights for policy 0, policy_version 30400 (0.0008) +[2023-10-08 16:56:23,802][19739] Fps is (10 sec: 19660.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 62029824. Throughput: 0: 1733.6, 1: 1733.1. Samples: 15508270. Policy #0 lag: (min: 28.0, avg: 35.1, max: 60.0) +[2023-10-08 16:56:23,803][19739] Avg episode reward: [(0, '744.000'), (1, '861.200')] +[2023-10-08 16:56:27,295][21194] Updated weights for policy 1, policy_version 30180 (0.0007) +[2023-10-08 16:56:27,348][21195] Updated weights for policy 0, policy_version 30410 (0.0009) +[2023-10-08 16:56:27,665][21194] Updated weights for policy 1, policy_version 30190 (0.0007) +[2023-10-08 16:56:27,720][21195] Updated weights for policy 0, policy_version 30420 (0.0008) +[2023-10-08 16:56:28,037][21194] Updated weights for policy 1, policy_version 30200 (0.0007) +[2023-10-08 16:56:28,080][21195] Updated weights for policy 0, policy_version 30430 (0.0008) +[2023-10-08 16:56:28,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 62095360. Throughput: 0: 1704.5, 1: 1706.2. Samples: 15527368. Policy #0 lag: (min: 28.0, avg: 35.1, max: 60.0) +[2023-10-08 16:56:28,803][19739] Avg episode reward: [(0, '744.000'), (1, '861.200')] +[2023-10-08 16:56:31,967][21194] Updated weights for policy 1, policy_version 30210 (0.0007) +[2023-10-08 16:56:32,153][21195] Updated weights for policy 0, policy_version 30440 (0.0007) +[2023-10-08 16:56:32,339][21194] Updated weights for policy 1, policy_version 30220 (0.0009) +[2023-10-08 16:56:32,530][21195] Updated weights for policy 0, policy_version 30450 (0.0007) +[2023-10-08 16:56:32,708][21194] Updated weights for policy 1, policy_version 30230 (0.0008) +[2023-10-08 16:56:32,895][21195] Updated weights for policy 0, policy_version 30460 (0.0008) +[2023-10-08 16:56:33,074][21194] Updated weights for policy 1, policy_version 30240 (0.0007) +[2023-10-08 16:56:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 62160896. Throughput: 0: 1697.6, 1: 1723.7. Samples: 15543080. Policy #0 lag: (min: 12.0, avg: 19.9, max: 44.0) +[2023-10-08 16:56:33,803][19739] Avg episode reward: [(0, '744.000'), (1, '847.040')] +[2023-10-08 16:56:36,709][21195] Updated weights for policy 0, policy_version 30470 (0.0008) +[2023-10-08 16:56:37,072][21195] Updated weights for policy 0, policy_version 30480 (0.0009) +[2023-10-08 16:56:37,154][21194] Updated weights for policy 1, policy_version 30250 (0.0007) +[2023-10-08 16:56:37,442][21195] Updated weights for policy 0, policy_version 30490 (0.0008) +[2023-10-08 16:56:37,523][21194] Updated weights for policy 1, policy_version 30260 (0.0008) +[2023-10-08 16:56:37,898][21194] Updated weights for policy 1, policy_version 30270 (0.0010) +[2023-10-08 16:56:38,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 62226432. Throughput: 0: 1721.9, 1: 1715.6. Samples: 15559236. Policy #0 lag: (min: 12.0, avg: 19.9, max: 44.0) +[2023-10-08 16:56:38,804][19739] Avg episode reward: [(0, '744.000'), (1, '860.440')] +[2023-10-08 16:56:41,147][21195] Updated weights for policy 0, policy_version 30500 (0.0009) +[2023-10-08 16:56:41,515][21195] Updated weights for policy 0, policy_version 30510 (0.0008) +[2023-10-08 16:56:41,881][21195] Updated weights for policy 0, policy_version 30520 (0.0008) +[2023-10-08 16:56:41,948][21194] Updated weights for policy 1, policy_version 30280 (0.0008) +[2023-10-08 16:56:42,305][21194] Updated weights for policy 1, policy_version 30290 (0.0007) +[2023-10-08 16:56:42,665][21194] Updated weights for policy 1, policy_version 30300 (0.0007) +[2023-10-08 16:56:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 62291968. Throughput: 0: 1705.3, 1: 1692.1. Samples: 15578674. Policy #0 lag: (min: 12.0, avg: 19.9, max: 44.0) +[2023-10-08 16:56:43,803][19739] Avg episode reward: [(0, '744.000'), (1, '860.440')] +[2023-10-08 16:56:45,901][21195] Updated weights for policy 0, policy_version 30530 (0.0009) +[2023-10-08 16:56:46,264][21195] Updated weights for policy 0, policy_version 30540 (0.0009) +[2023-10-08 16:56:46,588][21194] Updated weights for policy 1, policy_version 30310 (0.0007) +[2023-10-08 16:56:46,633][21195] Updated weights for policy 0, policy_version 30550 (0.0008) +[2023-10-08 16:56:46,963][21194] Updated weights for policy 1, policy_version 30320 (0.0008) +[2023-10-08 16:56:46,996][21195] Updated weights for policy 0, policy_version 30560 (0.0008) +[2023-10-08 16:56:47,337][21194] Updated weights for policy 1, policy_version 30330 (0.0008) +[2023-10-08 16:56:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 62357504. Throughput: 0: 1721.2, 1: 1719.0. Samples: 15595186. Policy #0 lag: (min: 12.0, avg: 19.9, max: 44.0) +[2023-10-08 16:56:48,804][19739] Avg episode reward: [(0, '758.700'), (1, '860.600')] +[2023-10-08 16:56:48,805][20740] Saving new best policy, reward=758.700! +[2023-10-08 16:56:50,899][21195] Updated weights for policy 0, policy_version 30570 (0.0007) +[2023-10-08 16:56:51,284][21195] Updated weights for policy 0, policy_version 30580 (0.0009) +[2023-10-08 16:56:51,480][21194] Updated weights for policy 1, policy_version 30340 (0.0008) +[2023-10-08 16:56:51,649][21195] Updated weights for policy 0, policy_version 30590 (0.0008) +[2023-10-08 16:56:51,845][21194] Updated weights for policy 1, policy_version 30350 (0.0009) +[2023-10-08 16:56:52,211][21194] Updated weights for policy 1, policy_version 30360 (0.0007) +[2023-10-08 16:56:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 62423040. Throughput: 0: 1708.1, 1: 1699.1. Samples: 15609718. Policy #0 lag: (min: 12.0, avg: 19.9, max: 44.0) +[2023-10-08 16:56:53,803][19739] Avg episode reward: [(0, '770.440'), (1, '860.600')] +[2023-10-08 16:56:53,804][20740] Saving new best policy, reward=770.440! +[2023-10-08 16:56:55,478][21195] Updated weights for policy 0, policy_version 30600 (0.0008) +[2023-10-08 16:56:55,855][21195] Updated weights for policy 0, policy_version 30610 (0.0007) +[2023-10-08 16:56:56,173][21194] Updated weights for policy 1, policy_version 30370 (0.0007) +[2023-10-08 16:56:56,233][21195] Updated weights for policy 0, policy_version 30620 (0.0009) +[2023-10-08 16:56:56,537][21194] Updated weights for policy 1, policy_version 30380 (0.0010) +[2023-10-08 16:56:56,910][21194] Updated weights for policy 1, policy_version 30390 (0.0011) +[2023-10-08 16:56:57,262][21194] Updated weights for policy 1, policy_version 30400 (0.0010) +[2023-10-08 16:56:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 62488576. Throughput: 0: 1715.1, 1: 1697.2. Samples: 15630620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:56:58,803][19739] Avg episode reward: [(0, '762.920'), (1, '862.750')] +[2023-10-08 16:57:00,241][21195] Updated weights for policy 0, policy_version 30630 (0.0009) +[2023-10-08 16:57:00,616][21195] Updated weights for policy 0, policy_version 30640 (0.0009) +[2023-10-08 16:57:00,985][21195] Updated weights for policy 0, policy_version 30650 (0.0007) +[2023-10-08 16:57:01,103][21194] Updated weights for policy 1, policy_version 30410 (0.0008) +[2023-10-08 16:57:01,470][21194] Updated weights for policy 1, policy_version 30420 (0.0009) +[2023-10-08 16:57:01,836][21194] Updated weights for policy 1, policy_version 30430 (0.0009) +[2023-10-08 16:57:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 62554112. Throughput: 0: 1743.3, 1: 1712.2. Samples: 15647142. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:57:03,803][19739] Avg episode reward: [(0, '762.790'), (1, '862.750')] +[2023-10-08 16:57:04,818][21195] Updated weights for policy 0, policy_version 30660 (0.0008) +[2023-10-08 16:57:05,176][21195] Updated weights for policy 0, policy_version 30670 (0.0008) +[2023-10-08 16:57:05,541][21195] Updated weights for policy 0, policy_version 30680 (0.0009) +[2023-10-08 16:57:05,605][21194] Updated weights for policy 1, policy_version 30440 (0.0008) +[2023-10-08 16:57:05,974][21194] Updated weights for policy 1, policy_version 30450 (0.0009) +[2023-10-08 16:57:06,338][21194] Updated weights for policy 1, policy_version 30460 (0.0008) +[2023-10-08 16:57:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 62619648. Throughput: 0: 1710.7, 1: 1699.4. Samples: 15661724. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:57:08,803][19739] Avg episode reward: [(0, '762.790'), (1, '862.750')] +[2023-10-08 16:57:09,482][21195] Updated weights for policy 0, policy_version 30690 (0.0007) +[2023-10-08 16:57:09,862][21195] Updated weights for policy 0, policy_version 30700 (0.0007) +[2023-10-08 16:57:10,242][21195] Updated weights for policy 0, policy_version 30710 (0.0007) +[2023-10-08 16:57:10,353][21194] Updated weights for policy 1, policy_version 30470 (0.0009) +[2023-10-08 16:57:10,602][21195] Updated weights for policy 0, policy_version 30720 (0.0008) +[2023-10-08 16:57:10,726][21194] Updated weights for policy 1, policy_version 30480 (0.0007) +[2023-10-08 16:57:11,090][21194] Updated weights for policy 1, policy_version 30490 (0.0007) +[2023-10-08 16:57:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 62685184. Throughput: 0: 1737.5, 1: 1722.5. Samples: 15683072. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:57:13,803][19739] Avg episode reward: [(0, '763.030'), (1, '862.750')] +[2023-10-08 16:57:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000030496_31227904.pth... +[2023-10-08 16:57:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000030720_31457280.pth... +[2023-10-08 16:57:13,858][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000029120_29818880.pth +[2023-10-08 16:57:13,859][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000028896_29589504.pth +[2023-10-08 16:57:14,623][21195] Updated weights for policy 0, policy_version 30730 (0.0008) +[2023-10-08 16:57:14,990][21195] Updated weights for policy 0, policy_version 30740 (0.0009) +[2023-10-08 16:57:15,106][21194] Updated weights for policy 1, policy_version 30500 (0.0007) +[2023-10-08 16:57:15,356][21195] Updated weights for policy 0, policy_version 30750 (0.0008) +[2023-10-08 16:57:15,478][21194] Updated weights for policy 1, policy_version 30510 (0.0009) +[2023-10-08 16:57:15,833][21194] Updated weights for policy 1, policy_version 30520 (0.0010) +[2023-10-08 16:57:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 62750720. Throughput: 0: 1747.9, 1: 1707.4. Samples: 15698566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:57:18,803][19739] Avg episode reward: [(0, '763.030'), (1, '862.920')] +[2023-10-08 16:57:19,339][21195] Updated weights for policy 0, policy_version 30760 (0.0010) +[2023-10-08 16:57:19,707][21195] Updated weights for policy 0, policy_version 30770 (0.0010) +[2023-10-08 16:57:19,759][21194] Updated weights for policy 1, policy_version 30530 (0.0008) +[2023-10-08 16:57:20,077][21195] Updated weights for policy 0, policy_version 30780 (0.0008) +[2023-10-08 16:57:20,122][21194] Updated weights for policy 1, policy_version 30540 (0.0009) +[2023-10-08 16:57:20,490][21194] Updated weights for policy 1, policy_version 30550 (0.0009) +[2023-10-08 16:57:20,854][21194] Updated weights for policy 1, policy_version 30560 (0.0008) +[2023-10-08 16:57:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 62816256. Throughput: 0: 1721.6, 1: 1707.5. Samples: 15713542. Policy #0 lag: (min: 31.0, avg: 32.9, max: 62.0) +[2023-10-08 16:57:23,803][19739] Avg episode reward: [(0, '760.180'), (1, '862.830')] +[2023-10-08 16:57:24,005][21195] Updated weights for policy 0, policy_version 30790 (0.0008) +[2023-10-08 16:57:24,380][21195] Updated weights for policy 0, policy_version 30800 (0.0008) +[2023-10-08 16:57:24,736][21195] Updated weights for policy 0, policy_version 30810 (0.0009) +[2023-10-08 16:57:24,788][21194] Updated weights for policy 1, policy_version 30570 (0.0009) +[2023-10-08 16:57:25,150][21194] Updated weights for policy 1, policy_version 30580 (0.0009) +[2023-10-08 16:57:25,520][21194] Updated weights for policy 1, policy_version 30590 (0.0008) +[2023-10-08 16:57:28,663][21195] Updated weights for policy 0, policy_version 30820 (0.0008) +[2023-10-08 16:57:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 62881792. Throughput: 0: 1740.0, 1: 1732.8. Samples: 15734954. Policy #0 lag: (min: 31.0, avg: 32.9, max: 62.0) +[2023-10-08 16:57:28,803][19739] Avg episode reward: [(0, '765.100'), (1, '874.290')] +[2023-10-08 16:57:28,811][20836] Saving new best policy, reward=874.290! +[2023-10-08 16:57:29,036][21195] Updated weights for policy 0, policy_version 30830 (0.0009) +[2023-10-08 16:57:29,406][21195] Updated weights for policy 0, policy_version 30840 (0.0009) +[2023-10-08 16:57:29,529][21194] Updated weights for policy 1, policy_version 30600 (0.0008) +[2023-10-08 16:57:29,896][21194] Updated weights for policy 1, policy_version 30610 (0.0008) +[2023-10-08 16:57:30,269][21194] Updated weights for policy 1, policy_version 30620 (0.0011) +[2023-10-08 16:57:33,395][21195] Updated weights for policy 0, policy_version 30850 (0.0008) +[2023-10-08 16:57:33,762][21195] Updated weights for policy 0, policy_version 30860 (0.0011) +[2023-10-08 16:57:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 62947328. Throughput: 0: 1726.3, 1: 1704.5. Samples: 15749572. Policy #0 lag: (min: 31.0, avg: 32.9, max: 62.0) +[2023-10-08 16:57:33,803][19739] Avg episode reward: [(0, '765.100'), (1, '874.290')] +[2023-10-08 16:57:34,130][21195] Updated weights for policy 0, policy_version 30870 (0.0010) +[2023-10-08 16:57:34,350][21194] Updated weights for policy 1, policy_version 30630 (0.0009) +[2023-10-08 16:57:34,502][21195] Updated weights for policy 0, policy_version 30880 (0.0010) +[2023-10-08 16:57:34,717][21194] Updated weights for policy 1, policy_version 30640 (0.0007) +[2023-10-08 16:57:35,087][21194] Updated weights for policy 1, policy_version 30650 (0.0007) +[2023-10-08 16:57:38,581][21195] Updated weights for policy 0, policy_version 30890 (0.0011) +[2023-10-08 16:57:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 63012864. Throughput: 0: 1738.6, 1: 1717.5. Samples: 15765242. Policy #0 lag: (min: 31.0, avg: 32.9, max: 62.0) +[2023-10-08 16:57:38,803][19739] Avg episode reward: [(0, '765.100'), (1, '874.290')] +[2023-10-08 16:57:38,948][21195] Updated weights for policy 0, policy_version 30900 (0.0010) +[2023-10-08 16:57:39,116][21194] Updated weights for policy 1, policy_version 30660 (0.0009) +[2023-10-08 16:57:39,315][21195] Updated weights for policy 0, policy_version 30910 (0.0010) +[2023-10-08 16:57:39,483][21194] Updated weights for policy 1, policy_version 30670 (0.0007) +[2023-10-08 16:57:39,844][21194] Updated weights for policy 1, policy_version 30680 (0.0008) +[2023-10-08 16:57:43,188][21195] Updated weights for policy 0, policy_version 30920 (0.0008) +[2023-10-08 16:57:43,560][21195] Updated weights for policy 0, policy_version 30930 (0.0007) +[2023-10-08 16:57:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 63078400. Throughput: 0: 1738.8, 1: 1726.4. Samples: 15786554. Policy #0 lag: (min: 31.0, avg: 32.9, max: 62.0) +[2023-10-08 16:57:43,803][19739] Avg episode reward: [(0, '779.910'), (1, '874.290')] +[2023-10-08 16:57:43,836][21194] Updated weights for policy 1, policy_version 30690 (0.0010) +[2023-10-08 16:57:43,929][21195] Updated weights for policy 0, policy_version 30940 (0.0007) +[2023-10-08 16:57:44,068][20740] Saving new best policy, reward=779.910! +[2023-10-08 16:57:44,198][21194] Updated weights for policy 1, policy_version 30700 (0.0010) +[2023-10-08 16:57:44,569][21194] Updated weights for policy 1, policy_version 30710 (0.0008) +[2023-10-08 16:57:44,925][21194] Updated weights for policy 1, policy_version 30720 (0.0012) +[2023-10-08 16:57:47,555][21195] Updated weights for policy 0, policy_version 30950 (0.0008) +[2023-10-08 16:57:47,945][21195] Updated weights for policy 0, policy_version 30960 (0.0009) +[2023-10-08 16:57:48,311][21195] Updated weights for policy 0, policy_version 30970 (0.0007) +[2023-10-08 16:57:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 63176704. Throughput: 0: 1713.9, 1: 1701.6. Samples: 15800838. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 16:57:48,803][19739] Avg episode reward: [(0, '780.190'), (1, '880.330')] +[2023-10-08 16:57:48,804][20740] Saving new best policy, reward=780.190! +[2023-10-08 16:57:48,885][21194] Updated weights for policy 1, policy_version 30730 (0.0009) +[2023-10-08 16:57:49,248][21194] Updated weights for policy 1, policy_version 30740 (0.0008) +[2023-10-08 16:57:49,616][21194] Updated weights for policy 1, policy_version 30750 (0.0007) +[2023-10-08 16:57:49,680][20836] Saving new best policy, reward=880.330! +[2023-10-08 16:57:52,239][21195] Updated weights for policy 0, policy_version 30980 (0.0007) +[2023-10-08 16:57:52,603][21195] Updated weights for policy 0, policy_version 30990 (0.0007) +[2023-10-08 16:57:52,973][21195] Updated weights for policy 0, policy_version 31000 (0.0009) +[2023-10-08 16:57:53,698][21194] Updated weights for policy 1, policy_version 30760 (0.0009) +[2023-10-08 16:57:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 63242240. Throughput: 0: 1742.3, 1: 1718.5. Samples: 15817462. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 16:57:53,803][19739] Avg episode reward: [(0, '780.190'), (1, '880.330')] +[2023-10-08 16:57:54,070][21194] Updated weights for policy 1, policy_version 30770 (0.0008) +[2023-10-08 16:57:54,430][21194] Updated weights for policy 1, policy_version 30780 (0.0008) +[2023-10-08 16:57:56,954][21195] Updated weights for policy 0, policy_version 31010 (0.0009) +[2023-10-08 16:57:57,329][21195] Updated weights for policy 0, policy_version 31020 (0.0009) +[2023-10-08 16:57:57,702][21195] Updated weights for policy 0, policy_version 31030 (0.0009) +[2023-10-08 16:57:58,083][21195] Updated weights for policy 0, policy_version 31040 (0.0009) +[2023-10-08 16:57:58,409][21194] Updated weights for policy 1, policy_version 30790 (0.0010) +[2023-10-08 16:57:58,774][21194] Updated weights for policy 1, policy_version 30800 (0.0009) +[2023-10-08 16:57:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 63307776. Throughput: 0: 1719.6, 1: 1723.1. Samples: 15837994. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 16:57:58,803][19739] Avg episode reward: [(0, '777.820'), (1, '880.330')] +[2023-10-08 16:57:59,130][21194] Updated weights for policy 1, policy_version 30810 (0.0010) +[2023-10-08 16:58:02,016][21195] Updated weights for policy 0, policy_version 31050 (0.0008) +[2023-10-08 16:58:02,377][21195] Updated weights for policy 0, policy_version 31060 (0.0009) +[2023-10-08 16:58:02,752][21195] Updated weights for policy 0, policy_version 31070 (0.0010) +[2023-10-08 16:58:03,076][21194] Updated weights for policy 1, policy_version 30820 (0.0010) +[2023-10-08 16:58:03,441][21194] Updated weights for policy 1, policy_version 30830 (0.0010) +[2023-10-08 16:58:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 63373312. Throughput: 0: 1712.7, 1: 1714.1. Samples: 15852774. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 16:58:03,804][19739] Avg episode reward: [(0, '777.820'), (1, '880.330')] +[2023-10-08 16:58:03,816][21194] Updated weights for policy 1, policy_version 30840 (0.0008) +[2023-10-08 16:58:06,720][21195] Updated weights for policy 0, policy_version 31080 (0.0008) +[2023-10-08 16:58:07,095][21195] Updated weights for policy 0, policy_version 31090 (0.0007) +[2023-10-08 16:58:07,468][21195] Updated weights for policy 0, policy_version 31100 (0.0007) +[2023-10-08 16:58:07,691][21194] Updated weights for policy 1, policy_version 30850 (0.0008) +[2023-10-08 16:58:08,064][21194] Updated weights for policy 1, policy_version 30860 (0.0010) +[2023-10-08 16:58:08,431][21194] Updated weights for policy 1, policy_version 30870 (0.0009) +[2023-10-08 16:58:08,791][21194] Updated weights for policy 1, policy_version 30880 (0.0010) +[2023-10-08 16:58:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 63471616. Throughput: 0: 1737.6, 1: 1720.4. Samples: 15869154. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:08,803][19739] Avg episode reward: [(0, '777.820'), (1, '910.090')] +[2023-10-08 16:58:08,804][20836] Saving new best policy, reward=910.090! +[2023-10-08 16:58:11,383][21195] Updated weights for policy 0, policy_version 31110 (0.0007) +[2023-10-08 16:58:11,750][21195] Updated weights for policy 0, policy_version 31120 (0.0008) +[2023-10-08 16:58:12,121][21195] Updated weights for policy 0, policy_version 31130 (0.0007) +[2023-10-08 16:58:12,753][21194] Updated weights for policy 1, policy_version 30890 (0.0009) +[2023-10-08 16:58:13,115][21194] Updated weights for policy 1, policy_version 30900 (0.0007) +[2023-10-08 16:58:13,487][21194] Updated weights for policy 1, policy_version 30910 (0.0007) +[2023-10-08 16:58:13,803][19739] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 63537152. Throughput: 0: 1715.3, 1: 1707.8. Samples: 15888994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:13,803][19739] Avg episode reward: [(0, '767.550'), (1, '916.460')] +[2023-10-08 16:58:13,811][20836] Saving new best policy, reward=916.460! +[2023-10-08 16:58:16,160][21195] Updated weights for policy 0, policy_version 31140 (0.0010) +[2023-10-08 16:58:16,525][21195] Updated weights for policy 0, policy_version 31150 (0.0010) +[2023-10-08 16:58:16,896][21195] Updated weights for policy 0, policy_version 31160 (0.0008) +[2023-10-08 16:58:17,312][21194] Updated weights for policy 1, policy_version 30920 (0.0008) +[2023-10-08 16:58:17,677][21194] Updated weights for policy 1, policy_version 30930 (0.0008) +[2023-10-08 16:58:18,047][21194] Updated weights for policy 1, policy_version 30940 (0.0008) +[2023-10-08 16:58:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 63602688. Throughput: 0: 1728.7, 1: 1728.3. Samples: 15905138. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:18,803][19739] Avg episode reward: [(0, '767.550'), (1, '931.410')] +[2023-10-08 16:58:18,804][20836] Saving new best policy, reward=931.410! +[2023-10-08 16:58:20,811][21195] Updated weights for policy 0, policy_version 31170 (0.0008) +[2023-10-08 16:58:21,192][21195] Updated weights for policy 0, policy_version 31180 (0.0009) +[2023-10-08 16:58:21,558][21195] Updated weights for policy 0, policy_version 31190 (0.0007) +[2023-10-08 16:58:21,920][21195] Updated weights for policy 0, policy_version 31200 (0.0008) +[2023-10-08 16:58:22,085][21194] Updated weights for policy 1, policy_version 30950 (0.0008) +[2023-10-08 16:58:22,457][21194] Updated weights for policy 1, policy_version 30960 (0.0007) +[2023-10-08 16:58:22,826][21194] Updated weights for policy 1, policy_version 30970 (0.0010) +[2023-10-08 16:58:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 63668224. Throughput: 0: 1720.6, 1: 1727.1. Samples: 15920386. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:23,803][19739] Avg episode reward: [(0, '767.550'), (1, '931.410')] +[2023-10-08 16:58:25,810][21195] Updated weights for policy 0, policy_version 31210 (0.0008) +[2023-10-08 16:58:26,174][21195] Updated weights for policy 0, policy_version 31220 (0.0009) +[2023-10-08 16:58:26,538][21195] Updated weights for policy 0, policy_version 31230 (0.0007) +[2023-10-08 16:58:26,697][21194] Updated weights for policy 1, policy_version 30980 (0.0008) +[2023-10-08 16:58:27,065][21194] Updated weights for policy 1, policy_version 30990 (0.0010) +[2023-10-08 16:58:27,431][21194] Updated weights for policy 1, policy_version 31000 (0.0011) +[2023-10-08 16:58:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 63733760. Throughput: 0: 1724.2, 1: 1703.1. Samples: 15940784. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:28,803][19739] Avg episode reward: [(0, '767.550'), (1, '931.410')] +[2023-10-08 16:58:30,295][21195] Updated weights for policy 0, policy_version 31240 (0.0009) +[2023-10-08 16:58:30,657][21195] Updated weights for policy 0, policy_version 31250 (0.0010) +[2023-10-08 16:58:31,029][21195] Updated weights for policy 0, policy_version 31260 (0.0008) +[2023-10-08 16:58:31,514][21194] Updated weights for policy 1, policy_version 31010 (0.0009) +[2023-10-08 16:58:31,875][21194] Updated weights for policy 1, policy_version 31020 (0.0008) +[2023-10-08 16:58:32,246][21194] Updated weights for policy 1, policy_version 31030 (0.0008) +[2023-10-08 16:58:32,620][21194] Updated weights for policy 1, policy_version 31040 (0.0008) +[2023-10-08 16:58:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 63799296. Throughput: 0: 1748.5, 1: 1734.4. Samples: 15957568. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:33,803][19739] Avg episode reward: [(0, '767.550'), (1, '931.410')] +[2023-10-08 16:58:34,955][21195] Updated weights for policy 0, policy_version 31270 (0.0009) +[2023-10-08 16:58:35,340][21195] Updated weights for policy 0, policy_version 31280 (0.0008) +[2023-10-08 16:58:35,699][21195] Updated weights for policy 0, policy_version 31290 (0.0008) +[2023-10-08 16:58:36,456][21194] Updated weights for policy 1, policy_version 31050 (0.0008) +[2023-10-08 16:58:36,827][21194] Updated weights for policy 1, policy_version 31060 (0.0011) +[2023-10-08 16:58:37,190][21194] Updated weights for policy 1, policy_version 31070 (0.0008) +[2023-10-08 16:58:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 63864832. Throughput: 0: 1718.0, 1: 1711.1. Samples: 15971770. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:38,803][19739] Avg episode reward: [(0, '779.860'), (1, '931.410')] +[2023-10-08 16:58:39,490][21195] Updated weights for policy 0, policy_version 31300 (0.0010) +[2023-10-08 16:58:39,874][21195] Updated weights for policy 0, policy_version 31310 (0.0010) +[2023-10-08 16:58:40,237][21195] Updated weights for policy 0, policy_version 31320 (0.0009) +[2023-10-08 16:58:41,182][21194] Updated weights for policy 1, policy_version 31080 (0.0010) +[2023-10-08 16:58:41,551][21194] Updated weights for policy 1, policy_version 31090 (0.0009) +[2023-10-08 16:58:41,907][21194] Updated weights for policy 1, policy_version 31100 (0.0010) +[2023-10-08 16:58:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 63930368. Throughput: 0: 1738.8, 1: 1700.0. Samples: 15992740. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:43,804][19739] Avg episode reward: [(0, '779.860'), (1, '946.520')] +[2023-10-08 16:58:43,814][20836] Saving new best policy, reward=946.520! +[2023-10-08 16:58:44,323][21195] Updated weights for policy 0, policy_version 31330 (0.0009) +[2023-10-08 16:58:44,692][21195] Updated weights for policy 0, policy_version 31340 (0.0007) +[2023-10-08 16:58:45,076][21195] Updated weights for policy 0, policy_version 31350 (0.0007) +[2023-10-08 16:58:45,445][21195] Updated weights for policy 0, policy_version 31360 (0.0007) +[2023-10-08 16:58:45,918][21194] Updated weights for policy 1, policy_version 31110 (0.0011) +[2023-10-08 16:58:46,301][21194] Updated weights for policy 1, policy_version 31120 (0.0008) +[2023-10-08 16:58:46,663][21194] Updated weights for policy 1, policy_version 31130 (0.0007) +[2023-10-08 16:58:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 63995904. Throughput: 0: 1749.6, 1: 1727.5. Samples: 16009242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:48,803][19739] Avg episode reward: [(0, '794.210'), (1, '946.520')] +[2023-10-08 16:58:48,804][20740] Saving new best policy, reward=794.210! +[2023-10-08 16:58:49,357][21195] Updated weights for policy 0, policy_version 31370 (0.0007) +[2023-10-08 16:58:49,740][21195] Updated weights for policy 0, policy_version 31380 (0.0008) +[2023-10-08 16:58:50,105][21195] Updated weights for policy 0, policy_version 31390 (0.0009) +[2023-10-08 16:58:50,698][21194] Updated weights for policy 1, policy_version 31140 (0.0009) +[2023-10-08 16:58:51,065][21194] Updated weights for policy 1, policy_version 31150 (0.0007) +[2023-10-08 16:58:51,423][21194] Updated weights for policy 1, policy_version 31160 (0.0008) +[2023-10-08 16:58:53,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 64061440. Throughput: 0: 1727.6, 1: 1705.0. Samples: 16023620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:58:53,803][19739] Avg episode reward: [(0, '794.210'), (1, '946.520')] +[2023-10-08 16:58:54,016][21195] Updated weights for policy 0, policy_version 31400 (0.0010) +[2023-10-08 16:58:54,395][21195] Updated weights for policy 0, policy_version 31410 (0.0007) +[2023-10-08 16:58:54,764][21195] Updated weights for policy 0, policy_version 31420 (0.0009) +[2023-10-08 16:58:55,078][21194] Updated weights for policy 1, policy_version 31170 (0.0008) +[2023-10-08 16:58:55,434][21194] Updated weights for policy 1, policy_version 31180 (0.0009) +[2023-10-08 16:58:55,803][21194] Updated weights for policy 1, policy_version 31190 (0.0008) +[2023-10-08 16:58:56,165][21194] Updated weights for policy 1, policy_version 31200 (0.0007) +[2023-10-08 16:58:58,695][21195] Updated weights for policy 0, policy_version 31430 (0.0008) +[2023-10-08 16:58:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 64126976. Throughput: 0: 1754.3, 1: 1725.6. Samples: 16045588. Policy #0 lag: (min: 12.0, avg: 12.6, max: 30.0) +[2023-10-08 16:58:58,803][19739] Avg episode reward: [(0, '794.210'), (1, '946.520')] +[2023-10-08 16:58:59,071][21195] Updated weights for policy 0, policy_version 31440 (0.0009) +[2023-10-08 16:58:59,434][21195] Updated weights for policy 0, policy_version 31450 (0.0008) +[2023-10-08 16:59:00,105][21194] Updated weights for policy 1, policy_version 31210 (0.0007) +[2023-10-08 16:59:00,469][21194] Updated weights for policy 1, policy_version 31220 (0.0007) +[2023-10-08 16:59:00,834][21194] Updated weights for policy 1, policy_version 31230 (0.0007) +[2023-10-08 16:59:03,318][21195] Updated weights for policy 0, policy_version 31460 (0.0008) +[2023-10-08 16:59:03,693][21195] Updated weights for policy 0, policy_version 31470 (0.0008) +[2023-10-08 16:59:03,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 64192512. Throughput: 0: 1737.7, 1: 1709.0. Samples: 16060240. Policy #0 lag: (min: 12.0, avg: 12.6, max: 30.0) +[2023-10-08 16:59:03,804][19739] Avg episode reward: [(0, '794.210'), (1, '959.610')] +[2023-10-08 16:59:03,805][20836] Saving new best policy, reward=959.610! +[2023-10-08 16:59:04,060][21195] Updated weights for policy 0, policy_version 31480 (0.0008) +[2023-10-08 16:59:04,703][21194] Updated weights for policy 1, policy_version 31240 (0.0007) +[2023-10-08 16:59:05,059][21194] Updated weights for policy 1, policy_version 31250 (0.0009) +[2023-10-08 16:59:05,429][21194] Updated weights for policy 1, policy_version 31260 (0.0008) +[2023-10-08 16:59:08,004][21195] Updated weights for policy 0, policy_version 31490 (0.0008) +[2023-10-08 16:59:08,373][21195] Updated weights for policy 0, policy_version 31500 (0.0007) +[2023-10-08 16:59:08,735][21195] Updated weights for policy 0, policy_version 31510 (0.0009) +[2023-10-08 16:59:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 64258048. Throughput: 0: 1747.2, 1: 1720.3. Samples: 16076422. Policy #0 lag: (min: 12.0, avg: 12.6, max: 30.0) +[2023-10-08 16:59:08,803][19739] Avg episode reward: [(0, '794.210'), (1, '959.610')] +[2023-10-08 16:59:09,102][21195] Updated weights for policy 0, policy_version 31520 (0.0011) +[2023-10-08 16:59:09,379][21194] Updated weights for policy 1, policy_version 31270 (0.0009) +[2023-10-08 16:59:09,737][21194] Updated weights for policy 1, policy_version 31280 (0.0008) +[2023-10-08 16:59:10,102][21194] Updated weights for policy 1, policy_version 31290 (0.0009) +[2023-10-08 16:59:13,025][21195] Updated weights for policy 0, policy_version 31530 (0.0008) +[2023-10-08 16:59:13,397][21195] Updated weights for policy 0, policy_version 31540 (0.0008) +[2023-10-08 16:59:13,774][21195] Updated weights for policy 0, policy_version 31550 (0.0007) +[2023-10-08 16:59:13,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 64323584. Throughput: 0: 1742.0, 1: 1747.7. Samples: 16097818. Policy #0 lag: (min: 12.0, avg: 12.6, max: 30.0) +[2023-10-08 16:59:13,803][19739] Avg episode reward: [(0, '807.960'), (1, '959.600')] +[2023-10-08 16:59:13,847][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000031552_32309248.pth... +[2023-10-08 16:59:13,890][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000029920_30638080.pth +[2023-10-08 16:59:13,896][20740] Saving new best policy, reward=807.960! +[2023-10-08 16:59:13,963][21194] Updated weights for policy 1, policy_version 31300 (0.0009) +[2023-10-08 16:59:14,323][21194] Updated weights for policy 1, policy_version 31310 (0.0009) +[2023-10-08 16:59:14,697][21194] Updated weights for policy 1, policy_version 31320 (0.0008) +[2023-10-08 16:59:14,993][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000031328_32079872.pth... +[2023-10-08 16:59:15,027][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000029696_30408704.pth +[2023-10-08 16:59:17,659][21195] Updated weights for policy 0, policy_version 31560 (0.0009) +[2023-10-08 16:59:18,033][21195] Updated weights for policy 0, policy_version 31570 (0.0007) +[2023-10-08 16:59:18,398][21195] Updated weights for policy 0, policy_version 31580 (0.0008) +[2023-10-08 16:59:18,587][21194] Updated weights for policy 1, policy_version 31330 (0.0007) +[2023-10-08 16:59:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 64421888. Throughput: 0: 1717.1, 1: 1718.1. Samples: 16112154. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:18,803][19739] Avg episode reward: [(0, '807.960'), (1, '959.600')] +[2023-10-08 16:59:18,960][21194] Updated weights for policy 1, policy_version 31340 (0.0008) +[2023-10-08 16:59:19,321][21194] Updated weights for policy 1, policy_version 31350 (0.0007) +[2023-10-08 16:59:19,688][21194] Updated weights for policy 1, policy_version 31360 (0.0007) +[2023-10-08 16:59:22,232][21195] Updated weights for policy 0, policy_version 31590 (0.0008) +[2023-10-08 16:59:22,604][21195] Updated weights for policy 0, policy_version 31600 (0.0008) +[2023-10-08 16:59:22,981][21195] Updated weights for policy 0, policy_version 31610 (0.0007) +[2023-10-08 16:59:23,540][21194] Updated weights for policy 1, policy_version 31370 (0.0010) +[2023-10-08 16:59:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 64487424. Throughput: 0: 1749.9, 1: 1747.5. Samples: 16129154. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:23,803][19739] Avg episode reward: [(0, '779.040'), (1, '989.590')] +[2023-10-08 16:59:23,908][21194] Updated weights for policy 1, policy_version 31380 (0.0009) +[2023-10-08 16:59:24,282][21194] Updated weights for policy 1, policy_version 31390 (0.0010) +[2023-10-08 16:59:24,355][20836] Saving new best policy, reward=989.590! +[2023-10-08 16:59:26,808][21195] Updated weights for policy 0, policy_version 31620 (0.0007) +[2023-10-08 16:59:27,183][21195] Updated weights for policy 0, policy_version 31630 (0.0007) +[2023-10-08 16:59:27,550][21195] Updated weights for policy 0, policy_version 31640 (0.0007) +[2023-10-08 16:59:28,136][21194] Updated weights for policy 1, policy_version 31400 (0.0008) +[2023-10-08 16:59:28,514][21194] Updated weights for policy 1, policy_version 31410 (0.0008) +[2023-10-08 16:59:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 64552960. Throughput: 0: 1724.7, 1: 1753.7. Samples: 16149266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:28,804][19739] Avg episode reward: [(0, '779.040'), (1, '989.590')] +[2023-10-08 16:59:28,872][21194] Updated weights for policy 1, policy_version 31420 (0.0008) +[2023-10-08 16:59:31,484][21195] Updated weights for policy 0, policy_version 31650 (0.0007) +[2023-10-08 16:59:31,853][21195] Updated weights for policy 0, policy_version 31660 (0.0007) +[2023-10-08 16:59:32,222][21195] Updated weights for policy 0, policy_version 31670 (0.0010) +[2023-10-08 16:59:32,596][21195] Updated weights for policy 0, policy_version 31680 (0.0011) +[2023-10-08 16:59:32,974][21194] Updated weights for policy 1, policy_version 31430 (0.0010) +[2023-10-08 16:59:33,340][21194] Updated weights for policy 1, policy_version 31440 (0.0011) +[2023-10-08 16:59:33,712][21194] Updated weights for policy 1, policy_version 31450 (0.0012) +[2023-10-08 16:59:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 64618496. Throughput: 0: 1719.0, 1: 1735.7. Samples: 16164702. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:33,804][19739] Avg episode reward: [(0, '779.040'), (1, '989.590')] +[2023-10-08 16:59:36,568][21195] Updated weights for policy 0, policy_version 31690 (0.0009) +[2023-10-08 16:59:36,938][21195] Updated weights for policy 0, policy_version 31700 (0.0008) +[2023-10-08 16:59:37,308][21195] Updated weights for policy 0, policy_version 31710 (0.0007) +[2023-10-08 16:59:37,781][21194] Updated weights for policy 1, policy_version 31460 (0.0009) +[2023-10-08 16:59:38,156][21194] Updated weights for policy 1, policy_version 31470 (0.0008) +[2023-10-08 16:59:38,527][21194] Updated weights for policy 1, policy_version 31480 (0.0009) +[2023-10-08 16:59:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 64684032. Throughput: 0: 1734.6, 1: 1752.9. Samples: 16180558. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:38,803][19739] Avg episode reward: [(0, '779.040'), (1, '989.590')] +[2023-10-08 16:59:41,313][21195] Updated weights for policy 0, policy_version 31720 (0.0007) +[2023-10-08 16:59:41,679][21195] Updated weights for policy 0, policy_version 31730 (0.0007) +[2023-10-08 16:59:42,053][21195] Updated weights for policy 0, policy_version 31740 (0.0009) +[2023-10-08 16:59:42,421][21194] Updated weights for policy 1, policy_version 31490 (0.0008) +[2023-10-08 16:59:42,784][21194] Updated weights for policy 1, policy_version 31500 (0.0007) +[2023-10-08 16:59:43,148][21194] Updated weights for policy 1, policy_version 31510 (0.0008) +[2023-10-08 16:59:43,512][21194] Updated weights for policy 1, policy_version 31520 (0.0008) +[2023-10-08 16:59:43,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.6, 300 sec: 13773.7). Total num frames: 64782336. Throughput: 0: 1714.0, 1: 1729.4. Samples: 16200542. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:43,803][19739] Avg episode reward: [(0, '791.620'), (1, '989.590')] +[2023-10-08 16:59:45,866][21195] Updated weights for policy 0, policy_version 31750 (0.0007) +[2023-10-08 16:59:46,240][21195] Updated weights for policy 0, policy_version 31760 (0.0009) +[2023-10-08 16:59:46,611][21195] Updated weights for policy 0, policy_version 31770 (0.0007) +[2023-10-08 16:59:47,449][21194] Updated weights for policy 1, policy_version 31530 (0.0010) +[2023-10-08 16:59:47,812][21194] Updated weights for policy 1, policy_version 31540 (0.0007) +[2023-10-08 16:59:48,191][21194] Updated weights for policy 1, policy_version 31550 (0.0007) +[2023-10-08 16:59:48,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 64847872. Throughput: 0: 1732.7, 1: 1744.4. Samples: 16216708. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:48,804][19739] Avg episode reward: [(0, '791.620'), (1, '989.590')] +[2023-10-08 16:59:50,690][21195] Updated weights for policy 0, policy_version 31780 (0.0010) +[2023-10-08 16:59:51,051][21195] Updated weights for policy 0, policy_version 31790 (0.0009) +[2023-10-08 16:59:51,429][21195] Updated weights for policy 0, policy_version 31800 (0.0008) +[2023-10-08 16:59:52,123][21194] Updated weights for policy 1, policy_version 31560 (0.0009) +[2023-10-08 16:59:52,491][21194] Updated weights for policy 1, policy_version 31570 (0.0008) +[2023-10-08 16:59:52,852][21194] Updated weights for policy 1, policy_version 31580 (0.0008) +[2023-10-08 16:59:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 64913408. Throughput: 0: 1714.4, 1: 1741.0. Samples: 16231916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:53,804][19739] Avg episode reward: [(0, '791.620'), (1, '989.590')] +[2023-10-08 16:59:55,194][21195] Updated weights for policy 0, policy_version 31810 (0.0008) +[2023-10-08 16:59:55,561][21195] Updated weights for policy 0, policy_version 31820 (0.0009) +[2023-10-08 16:59:55,933][21195] Updated weights for policy 0, policy_version 31830 (0.0008) +[2023-10-08 16:59:56,298][21195] Updated weights for policy 0, policy_version 31840 (0.0009) +[2023-10-08 16:59:56,822][21194] Updated weights for policy 1, policy_version 31590 (0.0008) +[2023-10-08 16:59:57,198][21194] Updated weights for policy 1, policy_version 31600 (0.0009) +[2023-10-08 16:59:57,572][21194] Updated weights for policy 1, policy_version 31610 (0.0008) +[2023-10-08 16:59:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 64978944. Throughput: 0: 1724.2, 1: 1712.4. Samples: 16252468. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 16:59:58,803][19739] Avg episode reward: [(0, '791.620'), (1, '989.590')] +[2023-10-08 17:00:00,067][21195] Updated weights for policy 0, policy_version 31850 (0.0008) +[2023-10-08 17:00:00,439][21195] Updated weights for policy 0, policy_version 31860 (0.0007) +[2023-10-08 17:00:00,802][21195] Updated weights for policy 0, policy_version 31870 (0.0010) +[2023-10-08 17:00:01,554][21194] Updated weights for policy 1, policy_version 31620 (0.0008) +[2023-10-08 17:00:01,915][21194] Updated weights for policy 1, policy_version 31630 (0.0010) +[2023-10-08 17:00:02,282][21194] Updated weights for policy 1, policy_version 31640 (0.0009) +[2023-10-08 17:00:03,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.6, 300 sec: 13773.7). Total num frames: 65044480. Throughput: 0: 1751.3, 1: 1742.7. Samples: 16269384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:00:03,803][19739] Avg episode reward: [(0, '791.620'), (1, '989.590')] +[2023-10-08 17:00:04,730][21195] Updated weights for policy 0, policy_version 31880 (0.0010) +[2023-10-08 17:00:05,113][21195] Updated weights for policy 0, policy_version 31890 (0.0008) +[2023-10-08 17:00:05,477][21195] Updated weights for policy 0, policy_version 31900 (0.0009) +[2023-10-08 17:00:06,151][21194] Updated weights for policy 1, policy_version 31650 (0.0007) +[2023-10-08 17:00:06,522][21194] Updated weights for policy 1, policy_version 31660 (0.0008) +[2023-10-08 17:00:06,886][21194] Updated weights for policy 1, policy_version 31670 (0.0007) +[2023-10-08 17:00:07,253][21194] Updated weights for policy 1, policy_version 31680 (0.0009) +[2023-10-08 17:00:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 65110016. Throughput: 0: 1723.4, 1: 1713.4. Samples: 16283808. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:00:08,803][19739] Avg episode reward: [(0, '791.620'), (1, '989.590')] +[2023-10-08 17:00:09,413][21195] Updated weights for policy 0, policy_version 31910 (0.0009) +[2023-10-08 17:00:09,793][21195] Updated weights for policy 0, policy_version 31920 (0.0009) +[2023-10-08 17:00:10,158][21195] Updated weights for policy 0, policy_version 31930 (0.0007) +[2023-10-08 17:00:11,137][21194] Updated weights for policy 1, policy_version 31690 (0.0010) +[2023-10-08 17:00:11,513][21194] Updated weights for policy 1, policy_version 31700 (0.0012) +[2023-10-08 17:00:11,879][21194] Updated weights for policy 1, policy_version 31710 (0.0010) +[2023-10-08 17:00:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 65175552. Throughput: 0: 1742.3, 1: 1713.6. Samples: 16304782. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:00:13,803][19739] Avg episode reward: [(0, '789.100'), (1, '989.590')] +[2023-10-08 17:00:14,200][21195] Updated weights for policy 0, policy_version 31940 (0.0010) +[2023-10-08 17:00:14,570][21195] Updated weights for policy 0, policy_version 31950 (0.0008) +[2023-10-08 17:00:14,929][21195] Updated weights for policy 0, policy_version 31960 (0.0008) +[2023-10-08 17:00:15,827][21194] Updated weights for policy 1, policy_version 31720 (0.0010) +[2023-10-08 17:00:16,207][21194] Updated weights for policy 1, policy_version 31730 (0.0008) +[2023-10-08 17:00:16,581][21194] Updated weights for policy 1, policy_version 31740 (0.0008) +[2023-10-08 17:00:18,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 65241088. Throughput: 0: 1742.1, 1: 1725.6. Samples: 16320748. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:00:18,803][19739] Avg episode reward: [(0, '792.990'), (1, '975.370')] +[2023-10-08 17:00:18,867][21195] Updated weights for policy 0, policy_version 31970 (0.0010) +[2023-10-08 17:00:19,242][21195] Updated weights for policy 0, policy_version 31980 (0.0010) +[2023-10-08 17:00:19,613][21195] Updated weights for policy 0, policy_version 31990 (0.0008) +[2023-10-08 17:00:19,990][21195] Updated weights for policy 0, policy_version 32000 (0.0009) +[2023-10-08 17:00:20,483][21194] Updated weights for policy 1, policy_version 31750 (0.0008) +[2023-10-08 17:00:20,858][21194] Updated weights for policy 1, policy_version 31760 (0.0009) +[2023-10-08 17:00:21,226][21194] Updated weights for policy 1, policy_version 31770 (0.0009) +[2023-10-08 17:00:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 65306624. Throughput: 0: 1728.3, 1: 1712.0. Samples: 16335372. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:00:23,803][19739] Avg episode reward: [(0, '791.440'), (1, '975.370')] +[2023-10-08 17:00:24,020][21195] Updated weights for policy 0, policy_version 32010 (0.0008) +[2023-10-08 17:00:24,401][21195] Updated weights for policy 0, policy_version 32020 (0.0009) +[2023-10-08 17:00:24,774][21195] Updated weights for policy 0, policy_version 32030 (0.0009) +[2023-10-08 17:00:25,136][21194] Updated weights for policy 1, policy_version 31780 (0.0008) +[2023-10-08 17:00:25,502][21194] Updated weights for policy 1, policy_version 31790 (0.0009) +[2023-10-08 17:00:25,866][21194] Updated weights for policy 1, policy_version 31800 (0.0008) +[2023-10-08 17:00:28,662][21195] Updated weights for policy 0, policy_version 32040 (0.0008) +[2023-10-08 17:00:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 65372160. Throughput: 0: 1743.2, 1: 1724.5. Samples: 16356588. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:00:28,803][19739] Avg episode reward: [(0, '791.560'), (1, '989.120')] +[2023-10-08 17:00:29,030][21195] Updated weights for policy 0, policy_version 32050 (0.0007) +[2023-10-08 17:00:29,411][21195] Updated weights for policy 0, policy_version 32060 (0.0010) +[2023-10-08 17:00:29,924][21194] Updated weights for policy 1, policy_version 31810 (0.0008) +[2023-10-08 17:00:30,291][21194] Updated weights for policy 1, policy_version 31820 (0.0008) +[2023-10-08 17:00:30,660][21194] Updated weights for policy 1, policy_version 31830 (0.0008) +[2023-10-08 17:00:31,025][21194] Updated weights for policy 1, policy_version 31840 (0.0009) +[2023-10-08 17:00:33,273][21195] Updated weights for policy 0, policy_version 32070 (0.0008) +[2023-10-08 17:00:33,653][21195] Updated weights for policy 0, policy_version 32080 (0.0008) +[2023-10-08 17:00:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 65437696. Throughput: 0: 1728.8, 1: 1712.3. Samples: 16371558. Policy #0 lag: (min: 25.0, avg: 34.5, max: 57.0) +[2023-10-08 17:00:33,803][19739] Avg episode reward: [(0, '791.560'), (1, '989.120')] +[2023-10-08 17:00:34,014][21195] Updated weights for policy 0, policy_version 32090 (0.0008) +[2023-10-08 17:00:34,863][21194] Updated weights for policy 1, policy_version 31850 (0.0010) +[2023-10-08 17:00:35,231][21194] Updated weights for policy 1, policy_version 31860 (0.0008) +[2023-10-08 17:00:35,611][21194] Updated weights for policy 1, policy_version 31870 (0.0010) +[2023-10-08 17:00:37,892][21195] Updated weights for policy 0, policy_version 32100 (0.0009) +[2023-10-08 17:00:38,260][21195] Updated weights for policy 0, policy_version 32110 (0.0008) +[2023-10-08 17:00:38,626][21195] Updated weights for policy 0, policy_version 32120 (0.0007) +[2023-10-08 17:00:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 65503232. Throughput: 0: 1748.1, 1: 1711.0. Samples: 16387574. Policy #0 lag: (min: 25.0, avg: 34.5, max: 57.0) +[2023-10-08 17:00:38,803][19739] Avg episode reward: [(0, '779.240'), (1, '989.120')] +[2023-10-08 17:00:39,632][21194] Updated weights for policy 1, policy_version 31880 (0.0009) +[2023-10-08 17:00:40,000][21194] Updated weights for policy 1, policy_version 31890 (0.0007) +[2023-10-08 17:00:40,370][21194] Updated weights for policy 1, policy_version 31900 (0.0010) +[2023-10-08 17:00:42,487][21195] Updated weights for policy 0, policy_version 32130 (0.0008) +[2023-10-08 17:00:42,844][21195] Updated weights for policy 0, policy_version 32140 (0.0007) +[2023-10-08 17:00:43,223][21195] Updated weights for policy 0, policy_version 32150 (0.0007) +[2023-10-08 17:00:43,593][21195] Updated weights for policy 0, policy_version 32160 (0.0007) +[2023-10-08 17:00:43,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 65601536. Throughput: 0: 1732.8, 1: 1734.1. Samples: 16408482. Policy #0 lag: (min: 25.0, avg: 34.5, max: 57.0) +[2023-10-08 17:00:43,803][19739] Avg episode reward: [(0, '779.180'), (1, '989.120')] +[2023-10-08 17:00:44,396][21194] Updated weights for policy 1, policy_version 31910 (0.0009) +[2023-10-08 17:00:44,760][21194] Updated weights for policy 1, policy_version 31920 (0.0010) +[2023-10-08 17:00:45,128][21194] Updated weights for policy 1, policy_version 31930 (0.0007) +[2023-10-08 17:00:47,446][21195] Updated weights for policy 0, policy_version 32170 (0.0010) +[2023-10-08 17:00:47,816][21195] Updated weights for policy 0, policy_version 32180 (0.0008) +[2023-10-08 17:00:48,185][21195] Updated weights for policy 0, policy_version 32190 (0.0010) +[2023-10-08 17:00:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 65667072. Throughput: 0: 1709.6, 1: 1701.8. Samples: 16422900. Policy #0 lag: (min: 25.0, avg: 34.5, max: 57.0) +[2023-10-08 17:00:48,803][19739] Avg episode reward: [(0, '779.180'), (1, '1004.040')] +[2023-10-08 17:00:49,029][21194] Updated weights for policy 1, policy_version 31940 (0.0009) +[2023-10-08 17:00:49,393][21194] Updated weights for policy 1, policy_version 31950 (0.0009) +[2023-10-08 17:00:49,760][21194] Updated weights for policy 1, policy_version 31960 (0.0009) +[2023-10-08 17:00:50,050][20836] Saving new best policy, reward=1004.040! +[2023-10-08 17:00:52,054][21195] Updated weights for policy 0, policy_version 32200 (0.0010) +[2023-10-08 17:00:52,429][21195] Updated weights for policy 0, policy_version 32210 (0.0008) +[2023-10-08 17:00:52,794][21195] Updated weights for policy 0, policy_version 32220 (0.0007) +[2023-10-08 17:00:53,749][21194] Updated weights for policy 1, policy_version 31970 (0.0007) +[2023-10-08 17:00:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 65732608. Throughput: 0: 1740.8, 1: 1724.1. Samples: 16439728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:00:53,803][19739] Avg episode reward: [(0, '765.830'), (1, '1004.040')] +[2023-10-08 17:00:54,104][21194] Updated weights for policy 1, policy_version 31980 (0.0007) +[2023-10-08 17:00:54,472][21194] Updated weights for policy 1, policy_version 31990 (0.0009) +[2023-10-08 17:00:54,846][21194] Updated weights for policy 1, policy_version 32000 (0.0010) +[2023-10-08 17:00:56,740][21195] Updated weights for policy 0, policy_version 32230 (0.0007) +[2023-10-08 17:00:57,127][21195] Updated weights for policy 0, policy_version 32240 (0.0008) +[2023-10-08 17:00:57,497][21195] Updated weights for policy 0, policy_version 32250 (0.0008) +[2023-10-08 17:00:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 65798144. Throughput: 0: 1715.5, 1: 1734.4. Samples: 16460030. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:00:58,803][19739] Avg episode reward: [(0, '765.820'), (1, '1004.260')] +[2023-10-08 17:00:58,854][21194] Updated weights for policy 1, policy_version 32010 (0.0008) +[2023-10-08 17:00:59,221][21194] Updated weights for policy 1, policy_version 32020 (0.0009) +[2023-10-08 17:00:59,600][21194] Updated weights for policy 1, policy_version 32030 (0.0007) +[2023-10-08 17:00:59,667][20836] Saving new best policy, reward=1004.260! +[2023-10-08 17:01:01,479][21195] Updated weights for policy 0, policy_version 32260 (0.0008) +[2023-10-08 17:01:01,847][21195] Updated weights for policy 0, policy_version 32270 (0.0008) +[2023-10-08 17:01:02,211][21195] Updated weights for policy 0, policy_version 32280 (0.0008) +[2023-10-08 17:01:03,487][21194] Updated weights for policy 1, policy_version 32040 (0.0010) +[2023-10-08 17:01:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 65863680. Throughput: 0: 1721.7, 1: 1716.0. Samples: 16475444. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:01:03,804][19739] Avg episode reward: [(0, '765.820'), (1, '992.320')] +[2023-10-08 17:01:03,851][21194] Updated weights for policy 1, policy_version 32050 (0.0008) +[2023-10-08 17:01:04,221][21194] Updated weights for policy 1, policy_version 32060 (0.0008) +[2023-10-08 17:01:06,132][21195] Updated weights for policy 0, policy_version 32290 (0.0007) +[2023-10-08 17:01:06,504][21195] Updated weights for policy 0, policy_version 32300 (0.0011) +[2023-10-08 17:01:06,890][21195] Updated weights for policy 0, policy_version 32310 (0.0009) +[2023-10-08 17:01:07,265][21195] Updated weights for policy 0, policy_version 32320 (0.0008) +[2023-10-08 17:01:08,319][21194] Updated weights for policy 1, policy_version 32070 (0.0009) +[2023-10-08 17:01:08,703][21194] Updated weights for policy 1, policy_version 32080 (0.0007) +[2023-10-08 17:01:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 65929216. Throughput: 0: 1732.0, 1: 1735.7. Samples: 16491422. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:01:08,803][19739] Avg episode reward: [(0, '766.310'), (1, '992.320')] +[2023-10-08 17:01:09,071][21194] Updated weights for policy 1, policy_version 32090 (0.0007) +[2023-10-08 17:01:11,166][21195] Updated weights for policy 0, policy_version 32330 (0.0007) +[2023-10-08 17:01:11,534][21195] Updated weights for policy 0, policy_version 32340 (0.0008) +[2023-10-08 17:01:11,898][21195] Updated weights for policy 0, policy_version 32350 (0.0009) +[2023-10-08 17:01:12,983][21194] Updated weights for policy 1, policy_version 32100 (0.0008) +[2023-10-08 17:01:13,355][21194] Updated weights for policy 1, policy_version 32110 (0.0008) +[2023-10-08 17:01:13,719][21194] Updated weights for policy 1, policy_version 32120 (0.0008) +[2023-10-08 17:01:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 65994752. Throughput: 0: 1721.8, 1: 1732.1. Samples: 16512014. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:01:13,803][19739] Avg episode reward: [(0, '769.090'), (1, '992.320')] +[2023-10-08 17:01:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000032352_33128448.pth... +[2023-10-08 17:01:13,846][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000030720_31457280.pth +[2023-10-08 17:01:13,850][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000032352_33128448.pth +[2023-10-08 17:01:13,998][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000032128_32899072.pth... +[2023-10-08 17:01:14,036][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000030496_31227904.pth +[2023-10-08 17:01:14,041][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000032128_32899072.pth +[2023-10-08 17:01:15,900][21195] Updated weights for policy 0, policy_version 32360 (0.0007) +[2023-10-08 17:01:16,276][21195] Updated weights for policy 0, policy_version 32370 (0.0009) +[2023-10-08 17:01:16,644][21195] Updated weights for policy 0, policy_version 32380 (0.0007) +[2023-10-08 17:01:17,670][21194] Updated weights for policy 1, policy_version 32130 (0.0008) +[2023-10-08 17:01:18,039][21194] Updated weights for policy 1, policy_version 32140 (0.0009) +[2023-10-08 17:01:18,410][21194] Updated weights for policy 1, policy_version 32150 (0.0008) +[2023-10-08 17:01:18,773][21194] Updated weights for policy 1, policy_version 32160 (0.0007) +[2023-10-08 17:01:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 66093056. Throughput: 0: 1732.1, 1: 1733.5. Samples: 16527508. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:01:18,803][19739] Avg episode reward: [(0, '783.990'), (1, '992.320')] +[2023-10-08 17:01:20,648][21195] Updated weights for policy 0, policy_version 32390 (0.0008) +[2023-10-08 17:01:21,023][21195] Updated weights for policy 0, policy_version 32400 (0.0010) +[2023-10-08 17:01:21,392][21195] Updated weights for policy 0, policy_version 32410 (0.0011) +[2023-10-08 17:01:22,799][21194] Updated weights for policy 1, policy_version 32170 (0.0009) +[2023-10-08 17:01:23,174][21194] Updated weights for policy 1, policy_version 32180 (0.0008) +[2023-10-08 17:01:23,536][21194] Updated weights for policy 1, policy_version 32190 (0.0009) +[2023-10-08 17:01:23,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 66158592. Throughput: 0: 1712.5, 1: 1732.2. Samples: 16542584. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:01:23,803][19739] Avg episode reward: [(0, '784.270'), (1, '1007.130')] +[2023-10-08 17:01:23,804][20836] Saving new best policy, reward=1007.130! +[2023-10-08 17:01:25,359][21195] Updated weights for policy 0, policy_version 32420 (0.0009) +[2023-10-08 17:01:25,737][21195] Updated weights for policy 0, policy_version 32430 (0.0009) +[2023-10-08 17:01:26,099][21195] Updated weights for policy 0, policy_version 32440 (0.0009) +[2023-10-08 17:01:27,288][21194] Updated weights for policy 1, policy_version 32200 (0.0008) +[2023-10-08 17:01:27,660][21194] Updated weights for policy 1, policy_version 32210 (0.0008) +[2023-10-08 17:01:28,019][21194] Updated weights for policy 1, policy_version 32220 (0.0008) +[2023-10-08 17:01:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 66224128. Throughput: 0: 1723.0, 1: 1712.7. Samples: 16563086. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:01:28,803][19739] Avg episode reward: [(0, '784.270'), (1, '1012.700')] +[2023-10-08 17:01:28,811][20836] Saving new best policy, reward=1012.700! +[2023-10-08 17:01:29,990][21195] Updated weights for policy 0, policy_version 32450 (0.0008) +[2023-10-08 17:01:30,366][21195] Updated weights for policy 0, policy_version 32460 (0.0008) +[2023-10-08 17:01:30,737][21195] Updated weights for policy 0, policy_version 32470 (0.0011) +[2023-10-08 17:01:31,107][21195] Updated weights for policy 0, policy_version 32480 (0.0009) +[2023-10-08 17:01:31,727][21194] Updated weights for policy 1, policy_version 32230 (0.0009) +[2023-10-08 17:01:32,086][21194] Updated weights for policy 1, policy_version 32240 (0.0009) +[2023-10-08 17:01:32,457][21194] Updated weights for policy 1, policy_version 32250 (0.0011) +[2023-10-08 17:01:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 66289664. Throughput: 0: 1743.3, 1: 1741.9. Samples: 16579736. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:01:33,804][19739] Avg episode reward: [(0, '784.270'), (1, '1012.700')] +[2023-10-08 17:01:35,125][21195] Updated weights for policy 0, policy_version 32490 (0.0008) +[2023-10-08 17:01:35,490][21195] Updated weights for policy 0, policy_version 32500 (0.0009) +[2023-10-08 17:01:35,870][21195] Updated weights for policy 0, policy_version 32510 (0.0009) +[2023-10-08 17:01:36,361][21194] Updated weights for policy 1, policy_version 32260 (0.0010) +[2023-10-08 17:01:36,734][21194] Updated weights for policy 1, policy_version 32270 (0.0009) +[2023-10-08 17:01:37,102][21194] Updated weights for policy 1, policy_version 32280 (0.0009) +[2023-10-08 17:01:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 66355200. Throughput: 0: 1709.6, 1: 1725.4. Samples: 16594300. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:01:38,803][19739] Avg episode reward: [(0, '741.370'), (1, '1021.670')] +[2023-10-08 17:01:38,804][20836] Saving new best policy, reward=1021.670! +[2023-10-08 17:01:39,870][21195] Updated weights for policy 0, policy_version 32520 (0.0008) +[2023-10-08 17:01:40,249][21195] Updated weights for policy 0, policy_version 32530 (0.0007) +[2023-10-08 17:01:40,616][21195] Updated weights for policy 0, policy_version 32540 (0.0007) +[2023-10-08 17:01:40,923][21194] Updated weights for policy 1, policy_version 32290 (0.0008) +[2023-10-08 17:01:41,286][21194] Updated weights for policy 1, policy_version 32300 (0.0009) +[2023-10-08 17:01:41,656][21194] Updated weights for policy 1, policy_version 32310 (0.0010) +[2023-10-08 17:01:42,018][21194] Updated weights for policy 1, policy_version 32320 (0.0008) +[2023-10-08 17:01:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 66420736. Throughput: 0: 1744.3, 1: 1710.9. Samples: 16615514. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:01:43,803][19739] Avg episode reward: [(0, '741.370'), (1, '1021.670')] +[2023-10-08 17:01:44,512][21195] Updated weights for policy 0, policy_version 32550 (0.0007) +[2023-10-08 17:01:44,891][21195] Updated weights for policy 0, policy_version 32560 (0.0008) +[2023-10-08 17:01:45,252][21195] Updated weights for policy 0, policy_version 32570 (0.0009) +[2023-10-08 17:01:46,140][21194] Updated weights for policy 1, policy_version 32330 (0.0008) +[2023-10-08 17:01:46,509][21194] Updated weights for policy 1, policy_version 32340 (0.0007) +[2023-10-08 17:01:46,878][21194] Updated weights for policy 1, policy_version 32350 (0.0007) +[2023-10-08 17:01:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 66486272. Throughput: 0: 1740.4, 1: 1731.6. Samples: 16631682. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:01:48,804][19739] Avg episode reward: [(0, '741.370'), (1, '1021.670')] +[2023-10-08 17:01:49,226][21195] Updated weights for policy 0, policy_version 32580 (0.0009) +[2023-10-08 17:01:49,599][21195] Updated weights for policy 0, policy_version 32590 (0.0007) +[2023-10-08 17:01:49,976][21195] Updated weights for policy 0, policy_version 32600 (0.0009) +[2023-10-08 17:01:50,903][21194] Updated weights for policy 1, policy_version 32360 (0.0009) +[2023-10-08 17:01:51,273][21194] Updated weights for policy 1, policy_version 32370 (0.0010) +[2023-10-08 17:01:51,636][21194] Updated weights for policy 1, policy_version 32380 (0.0010) +[2023-10-08 17:01:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 66551808. Throughput: 0: 1731.3, 1: 1701.3. Samples: 16645890. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:01:53,803][19739] Avg episode reward: [(0, '741.980'), (1, '1021.670')] +[2023-10-08 17:01:53,824][21195] Updated weights for policy 0, policy_version 32610 (0.0008) +[2023-10-08 17:01:54,184][21195] Updated weights for policy 0, policy_version 32620 (0.0010) +[2023-10-08 17:01:54,565][21195] Updated weights for policy 0, policy_version 32630 (0.0007) +[2023-10-08 17:01:54,926][21195] Updated weights for policy 0, policy_version 32640 (0.0007) +[2023-10-08 17:01:55,693][21194] Updated weights for policy 1, policy_version 32390 (0.0011) +[2023-10-08 17:01:56,073][21194] Updated weights for policy 1, policy_version 32400 (0.0007) +[2023-10-08 17:01:56,445][21194] Updated weights for policy 1, policy_version 32410 (0.0007) +[2023-10-08 17:01:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 66617344. Throughput: 0: 1741.1, 1: 1705.1. Samples: 16667094. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:01:58,803][19739] Avg episode reward: [(0, '741.980'), (1, '1026.840')] +[2023-10-08 17:01:58,811][20836] Saving new best policy, reward=1026.840! +[2023-10-08 17:01:58,933][21195] Updated weights for policy 0, policy_version 32650 (0.0009) +[2023-10-08 17:01:59,308][21195] Updated weights for policy 0, policy_version 32660 (0.0009) +[2023-10-08 17:01:59,679][21195] Updated weights for policy 0, policy_version 32670 (0.0009) +[2023-10-08 17:02:00,470][21194] Updated weights for policy 1, policy_version 32420 (0.0008) +[2023-10-08 17:02:00,834][21194] Updated weights for policy 1, policy_version 32430 (0.0007) +[2023-10-08 17:02:01,195][21194] Updated weights for policy 1, policy_version 32440 (0.0010) +[2023-10-08 17:02:03,514][21195] Updated weights for policy 0, policy_version 32680 (0.0009) +[2023-10-08 17:02:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 66682880. Throughput: 0: 1726.4, 1: 1712.4. Samples: 16682252. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:02:03,803][19739] Avg episode reward: [(0, '741.980'), (1, '1026.840')] +[2023-10-08 17:02:03,886][21195] Updated weights for policy 0, policy_version 32690 (0.0008) +[2023-10-08 17:02:04,257][21195] Updated weights for policy 0, policy_version 32700 (0.0009) +[2023-10-08 17:02:05,063][21194] Updated weights for policy 1, policy_version 32450 (0.0008) +[2023-10-08 17:02:05,424][21194] Updated weights for policy 1, policy_version 32460 (0.0007) +[2023-10-08 17:02:05,785][21194] Updated weights for policy 1, policy_version 32470 (0.0011) +[2023-10-08 17:02:06,157][21194] Updated weights for policy 1, policy_version 32480 (0.0010) +[2023-10-08 17:02:08,174][21195] Updated weights for policy 0, policy_version 32710 (0.0010) +[2023-10-08 17:02:08,539][21195] Updated weights for policy 0, policy_version 32720 (0.0007) +[2023-10-08 17:02:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 66748416. Throughput: 0: 1744.6, 1: 1701.9. Samples: 16697676. Policy #0 lag: (min: 31.0, avg: 32.3, max: 56.0) +[2023-10-08 17:02:08,803][19739] Avg episode reward: [(0, '747.070'), (1, '1023.980')] +[2023-10-08 17:02:08,917][21195] Updated weights for policy 0, policy_version 32730 (0.0009) +[2023-10-08 17:02:10,165][21194] Updated weights for policy 1, policy_version 32490 (0.0008) +[2023-10-08 17:02:10,521][21194] Updated weights for policy 1, policy_version 32500 (0.0008) +[2023-10-08 17:02:10,885][21194] Updated weights for policy 1, policy_version 32510 (0.0007) +[2023-10-08 17:02:12,810][21195] Updated weights for policy 0, policy_version 32740 (0.0007) +[2023-10-08 17:02:13,173][21195] Updated weights for policy 0, policy_version 32750 (0.0008) +[2023-10-08 17:02:13,553][21195] Updated weights for policy 0, policy_version 32760 (0.0009) +[2023-10-08 17:02:13,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 66813952. Throughput: 0: 1737.8, 1: 1731.2. Samples: 16719190. Policy #0 lag: (min: 31.0, avg: 32.3, max: 56.0) +[2023-10-08 17:02:13,803][19739] Avg episode reward: [(0, '747.070'), (1, '1023.980')] +[2023-10-08 17:02:14,688][21194] Updated weights for policy 1, policy_version 32520 (0.0007) +[2023-10-08 17:02:15,051][21194] Updated weights for policy 1, policy_version 32530 (0.0009) +[2023-10-08 17:02:15,416][21194] Updated weights for policy 1, policy_version 32540 (0.0010) +[2023-10-08 17:02:17,275][21195] Updated weights for policy 0, policy_version 32770 (0.0009) +[2023-10-08 17:02:17,644][21195] Updated weights for policy 0, policy_version 32780 (0.0010) +[2023-10-08 17:02:18,011][21195] Updated weights for policy 0, policy_version 32790 (0.0009) +[2023-10-08 17:02:18,390][21195] Updated weights for policy 0, policy_version 32800 (0.0010) +[2023-10-08 17:02:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 66912256. Throughput: 0: 1712.3, 1: 1704.8. Samples: 16733506. Policy #0 lag: (min: 31.0, avg: 32.3, max: 56.0) +[2023-10-08 17:02:18,803][19739] Avg episode reward: [(0, '747.070'), (1, '1009.650')] +[2023-10-08 17:02:19,345][21194] Updated weights for policy 1, policy_version 32550 (0.0009) +[2023-10-08 17:02:19,706][21194] Updated weights for policy 1, policy_version 32560 (0.0008) +[2023-10-08 17:02:20,079][21194] Updated weights for policy 1, policy_version 32570 (0.0008) +[2023-10-08 17:02:22,383][21195] Updated weights for policy 0, policy_version 32810 (0.0008) +[2023-10-08 17:02:22,755][21195] Updated weights for policy 0, policy_version 32820 (0.0008) +[2023-10-08 17:02:23,130][21195] Updated weights for policy 0, policy_version 32830 (0.0009) +[2023-10-08 17:02:23,803][19739] Fps is (10 sec: 16383.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 66977792. Throughput: 0: 1743.3, 1: 1723.4. Samples: 16750300. Policy #0 lag: (min: 31.0, avg: 32.3, max: 56.0) +[2023-10-08 17:02:23,804][19739] Avg episode reward: [(0, '747.070'), (1, '1010.010')] +[2023-10-08 17:02:24,050][21194] Updated weights for policy 1, policy_version 32580 (0.0010) +[2023-10-08 17:02:24,411][21194] Updated weights for policy 1, policy_version 32590 (0.0009) +[2023-10-08 17:02:24,791][21194] Updated weights for policy 1, policy_version 32600 (0.0011) +[2023-10-08 17:02:27,044][21195] Updated weights for policy 0, policy_version 32840 (0.0008) +[2023-10-08 17:02:27,415][21195] Updated weights for policy 0, policy_version 32850 (0.0008) +[2023-10-08 17:02:27,781][21195] Updated weights for policy 0, policy_version 32860 (0.0008) +[2023-10-08 17:02:28,688][21194] Updated weights for policy 1, policy_version 32610 (0.0009) +[2023-10-08 17:02:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 67043328. Throughput: 0: 1715.1, 1: 1732.8. Samples: 16770668. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:02:28,803][19739] Avg episode reward: [(0, '747.070'), (1, '1017.460')] +[2023-10-08 17:02:29,056][21194] Updated weights for policy 1, policy_version 32620 (0.0008) +[2023-10-08 17:02:29,414][21194] Updated weights for policy 1, policy_version 32630 (0.0007) +[2023-10-08 17:02:29,783][21194] Updated weights for policy 1, policy_version 32640 (0.0007) +[2023-10-08 17:02:31,769][21195] Updated weights for policy 0, policy_version 32870 (0.0007) +[2023-10-08 17:02:32,144][21195] Updated weights for policy 0, policy_version 32880 (0.0008) +[2023-10-08 17:02:32,513][21195] Updated weights for policy 0, policy_version 32890 (0.0008) +[2023-10-08 17:02:33,747][21194] Updated weights for policy 1, policy_version 32650 (0.0010) +[2023-10-08 17:02:33,802][19739] Fps is (10 sec: 13107.7, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 67108864. Throughput: 0: 1710.5, 1: 1713.7. Samples: 16785766. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:02:33,803][19739] Avg episode reward: [(0, '734.860'), (1, '1031.250')] +[2023-10-08 17:02:34,123][21194] Updated weights for policy 1, policy_version 32660 (0.0010) +[2023-10-08 17:02:34,488][21194] Updated weights for policy 1, policy_version 32670 (0.0011) +[2023-10-08 17:02:34,559][20836] Saving new best policy, reward=1031.250! +[2023-10-08 17:02:36,514][21195] Updated weights for policy 0, policy_version 32900 (0.0007) +[2023-10-08 17:02:36,878][21195] Updated weights for policy 0, policy_version 32910 (0.0007) +[2023-10-08 17:02:37,245][21195] Updated weights for policy 0, policy_version 32920 (0.0010) +[2023-10-08 17:02:38,406][21194] Updated weights for policy 1, policy_version 32680 (0.0008) +[2023-10-08 17:02:38,774][21194] Updated weights for policy 1, policy_version 32690 (0.0010) +[2023-10-08 17:02:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 67174400. Throughput: 0: 1727.5, 1: 1740.9. Samples: 16801970. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:02:38,803][19739] Avg episode reward: [(0, '734.860'), (1, '1031.250')] +[2023-10-08 17:02:39,128][21194] Updated weights for policy 1, policy_version 32700 (0.0009) +[2023-10-08 17:02:41,212][21195] Updated weights for policy 0, policy_version 32930 (0.0007) +[2023-10-08 17:02:41,594][21195] Updated weights for policy 0, policy_version 32940 (0.0010) +[2023-10-08 17:02:41,961][21195] Updated weights for policy 0, policy_version 32950 (0.0010) +[2023-10-08 17:02:42,322][21195] Updated weights for policy 0, policy_version 32960 (0.0009) +[2023-10-08 17:02:43,105][21194] Updated weights for policy 1, policy_version 32710 (0.0007) +[2023-10-08 17:02:43,490][21194] Updated weights for policy 1, policy_version 32720 (0.0010) +[2023-10-08 17:02:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 67239936. Throughput: 0: 1708.6, 1: 1738.4. Samples: 16822210. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:02:43,803][19739] Avg episode reward: [(0, '734.860'), (1, '1031.250')] +[2023-10-08 17:02:43,857][21194] Updated weights for policy 1, policy_version 32730 (0.0009) +[2023-10-08 17:02:46,271][21195] Updated weights for policy 0, policy_version 32970 (0.0008) +[2023-10-08 17:02:46,637][21195] Updated weights for policy 0, policy_version 32980 (0.0008) +[2023-10-08 17:02:46,997][21195] Updated weights for policy 0, policy_version 32990 (0.0008) +[2023-10-08 17:02:47,804][21194] Updated weights for policy 1, policy_version 32740 (0.0007) +[2023-10-08 17:02:48,175][21194] Updated weights for policy 1, policy_version 32750 (0.0008) +[2023-10-08 17:02:48,541][21194] Updated weights for policy 1, policy_version 32760 (0.0007) +[2023-10-08 17:02:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 67305472. Throughput: 0: 1728.0, 1: 1729.8. Samples: 16837854. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:02:48,803][19739] Avg episode reward: [(0, '734.260'), (1, '1031.250')] +[2023-10-08 17:02:50,994][21195] Updated weights for policy 0, policy_version 33000 (0.0011) +[2023-10-08 17:02:51,356][21195] Updated weights for policy 0, policy_version 33010 (0.0012) +[2023-10-08 17:02:51,731][21195] Updated weights for policy 0, policy_version 33020 (0.0009) +[2023-10-08 17:02:52,510][21194] Updated weights for policy 1, policy_version 32770 (0.0011) +[2023-10-08 17:02:52,872][21194] Updated weights for policy 1, policy_version 32780 (0.0009) +[2023-10-08 17:02:53,238][21194] Updated weights for policy 1, policy_version 32790 (0.0009) +[2023-10-08 17:02:53,598][21194] Updated weights for policy 1, policy_version 32800 (0.0008) +[2023-10-08 17:02:53,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 67403776. Throughput: 0: 1714.9, 1: 1746.3. Samples: 16853430. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 17:02:53,803][19739] Avg episode reward: [(0, '719.530'), (1, '1031.250')] +[2023-10-08 17:02:55,333][21195] Updated weights for policy 0, policy_version 33030 (0.0007) +[2023-10-08 17:02:55,712][21195] Updated weights for policy 0, policy_version 33040 (0.0010) +[2023-10-08 17:02:56,082][21195] Updated weights for policy 0, policy_version 33050 (0.0010) +[2023-10-08 17:02:57,644][21194] Updated weights for policy 1, policy_version 32810 (0.0007) +[2023-10-08 17:02:58,011][21194] Updated weights for policy 1, policy_version 32820 (0.0008) +[2023-10-08 17:02:58,374][21194] Updated weights for policy 1, policy_version 32830 (0.0008) +[2023-10-08 17:02:58,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 67469312. Throughput: 0: 1722.4, 1: 1722.4. Samples: 16874206. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 17:02:58,803][19739] Avg episode reward: [(0, '734.180'), (1, '1018.740')] +[2023-10-08 17:03:00,112][21195] Updated weights for policy 0, policy_version 33060 (0.0008) +[2023-10-08 17:03:00,477][21195] Updated weights for policy 0, policy_version 33070 (0.0007) +[2023-10-08 17:03:00,843][21195] Updated weights for policy 0, policy_version 33080 (0.0008) +[2023-10-08 17:03:02,247][21194] Updated weights for policy 1, policy_version 32840 (0.0009) +[2023-10-08 17:03:02,613][21194] Updated weights for policy 1, policy_version 32850 (0.0007) +[2023-10-08 17:03:02,977][21194] Updated weights for policy 1, policy_version 32860 (0.0007) +[2023-10-08 17:03:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 67534848. Throughput: 0: 1751.4, 1: 1741.2. Samples: 16890672. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 17:03:03,803][19739] Avg episode reward: [(0, '734.180'), (1, '1018.740')] +[2023-10-08 17:03:04,647][21195] Updated weights for policy 0, policy_version 33090 (0.0009) +[2023-10-08 17:03:05,012][21195] Updated weights for policy 0, policy_version 33100 (0.0009) +[2023-10-08 17:03:05,390][21195] Updated weights for policy 0, policy_version 33110 (0.0011) +[2023-10-08 17:03:05,761][21195] Updated weights for policy 0, policy_version 33120 (0.0011) +[2023-10-08 17:03:06,751][21194] Updated weights for policy 1, policy_version 32870 (0.0007) +[2023-10-08 17:03:07,108][21194] Updated weights for policy 1, policy_version 32880 (0.0007) +[2023-10-08 17:03:07,473][21194] Updated weights for policy 1, policy_version 32890 (0.0011) +[2023-10-08 17:03:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 67600384. Throughput: 0: 1723.8, 1: 1732.0. Samples: 16905812. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 17:03:08,803][19739] Avg episode reward: [(0, '734.180'), (1, '1018.740')] +[2023-10-08 17:03:09,764][21195] Updated weights for policy 0, policy_version 33130 (0.0010) +[2023-10-08 17:03:10,146][21195] Updated weights for policy 0, policy_version 33140 (0.0009) +[2023-10-08 17:03:10,523][21195] Updated weights for policy 0, policy_version 33150 (0.0010) +[2023-10-08 17:03:11,601][21194] Updated weights for policy 1, policy_version 32900 (0.0009) +[2023-10-08 17:03:11,967][21194] Updated weights for policy 1, policy_version 32910 (0.0009) +[2023-10-08 17:03:12,324][21194] Updated weights for policy 1, policy_version 32920 (0.0009) +[2023-10-08 17:03:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 67665920. Throughput: 0: 1748.0, 1: 1707.7. Samples: 16926174. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 17:03:13,803][19739] Avg episode reward: [(0, '734.180'), (1, '1018.740')] +[2023-10-08 17:03:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000033152_33947648.pth... +[2023-10-08 17:03:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000032928_33718272.pth... +[2023-10-08 17:03:13,842][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000031328_32079872.pth +[2023-10-08 17:03:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000031552_32309248.pth +[2023-10-08 17:03:14,348][21195] Updated weights for policy 0, policy_version 33160 (0.0008) +[2023-10-08 17:03:14,715][21195] Updated weights for policy 0, policy_version 33170 (0.0008) +[2023-10-08 17:03:15,086][21195] Updated weights for policy 0, policy_version 33180 (0.0007) +[2023-10-08 17:03:16,503][21194] Updated weights for policy 1, policy_version 32930 (0.0009) +[2023-10-08 17:03:16,861][21194] Updated weights for policy 1, policy_version 32940 (0.0007) +[2023-10-08 17:03:17,230][21194] Updated weights for policy 1, policy_version 32950 (0.0009) +[2023-10-08 17:03:17,602][21194] Updated weights for policy 1, policy_version 32960 (0.0007) +[2023-10-08 17:03:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 67731456. Throughput: 0: 1752.1, 1: 1731.6. Samples: 16942534. Policy #0 lag: (min: 19.0, avg: 26.5, max: 51.0) +[2023-10-08 17:03:18,803][19739] Avg episode reward: [(0, '734.180'), (1, '1032.740')] +[2023-10-08 17:03:18,804][20836] Saving new best policy, reward=1032.740! +[2023-10-08 17:03:18,811][21195] Updated weights for policy 0, policy_version 33190 (0.0008) +[2023-10-08 17:03:19,189][21195] Updated weights for policy 0, policy_version 33200 (0.0008) +[2023-10-08 17:03:19,556][21195] Updated weights for policy 0, policy_version 33210 (0.0008) +[2023-10-08 17:03:21,423][21194] Updated weights for policy 1, policy_version 32970 (0.0007) +[2023-10-08 17:03:21,799][21194] Updated weights for policy 1, policy_version 32980 (0.0009) +[2023-10-08 17:03:22,161][21194] Updated weights for policy 1, policy_version 32990 (0.0010) +[2023-10-08 17:03:23,454][21195] Updated weights for policy 0, policy_version 33220 (0.0008) +[2023-10-08 17:03:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 67796992. Throughput: 0: 1740.2, 1: 1710.7. Samples: 16957258. Policy #0 lag: (min: 19.0, avg: 26.5, max: 51.0) +[2023-10-08 17:03:23,803][19739] Avg episode reward: [(0, '750.790'), (1, '1032.740')] +[2023-10-08 17:03:23,822][21195] Updated weights for policy 0, policy_version 33230 (0.0009) +[2023-10-08 17:03:24,193][21195] Updated weights for policy 0, policy_version 33240 (0.0009) +[2023-10-08 17:03:25,894][21194] Updated weights for policy 1, policy_version 33000 (0.0008) +[2023-10-08 17:03:26,254][21194] Updated weights for policy 1, policy_version 33010 (0.0007) +[2023-10-08 17:03:26,624][21194] Updated weights for policy 1, policy_version 33020 (0.0009) +[2023-10-08 17:03:28,294][21195] Updated weights for policy 0, policy_version 33250 (0.0009) +[2023-10-08 17:03:28,671][21195] Updated weights for policy 0, policy_version 33260 (0.0009) +[2023-10-08 17:03:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 67862528. Throughput: 0: 1754.4, 1: 1715.5. Samples: 16978356. Policy #0 lag: (min: 19.0, avg: 26.5, max: 51.0) +[2023-10-08 17:03:28,803][19739] Avg episode reward: [(0, '750.790'), (1, '1032.740')] +[2023-10-08 17:03:29,041][21195] Updated weights for policy 0, policy_version 33270 (0.0010) +[2023-10-08 17:03:29,403][21195] Updated weights for policy 0, policy_version 33280 (0.0008) +[2023-10-08 17:03:30,689][21194] Updated weights for policy 1, policy_version 33030 (0.0009) +[2023-10-08 17:03:31,070][21194] Updated weights for policy 1, policy_version 33040 (0.0010) +[2023-10-08 17:03:31,443][21194] Updated weights for policy 1, policy_version 33050 (0.0010) +[2023-10-08 17:03:33,315][21195] Updated weights for policy 0, policy_version 33290 (0.0008) +[2023-10-08 17:03:33,675][21195] Updated weights for policy 0, policy_version 33300 (0.0009) +[2023-10-08 17:03:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 67928064. Throughput: 0: 1733.9, 1: 1726.2. Samples: 16993560. Policy #0 lag: (min: 19.0, avg: 26.5, max: 51.0) +[2023-10-08 17:03:33,804][19739] Avg episode reward: [(0, '750.790'), (1, '1038.880')] +[2023-10-08 17:03:33,805][20836] Saving new best policy, reward=1038.880! +[2023-10-08 17:03:34,049][21195] Updated weights for policy 0, policy_version 33310 (0.0008) +[2023-10-08 17:03:35,526][21194] Updated weights for policy 1, policy_version 33060 (0.0012) +[2023-10-08 17:03:35,891][21194] Updated weights for policy 1, policy_version 33070 (0.0010) +[2023-10-08 17:03:36,256][21194] Updated weights for policy 1, policy_version 33080 (0.0011) +[2023-10-08 17:03:38,060][21195] Updated weights for policy 0, policy_version 33320 (0.0009) +[2023-10-08 17:03:38,427][21195] Updated weights for policy 0, policy_version 33330 (0.0009) +[2023-10-08 17:03:38,793][21195] Updated weights for policy 0, policy_version 33340 (0.0009) +[2023-10-08 17:03:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 67993600. Throughput: 0: 1753.7, 1: 1705.5. Samples: 17009094. Policy #0 lag: (min: 19.0, avg: 26.5, max: 51.0) +[2023-10-08 17:03:38,803][19739] Avg episode reward: [(0, '750.790'), (1, '1034.090')] +[2023-10-08 17:03:40,184][21194] Updated weights for policy 1, policy_version 33090 (0.0009) +[2023-10-08 17:03:40,550][21194] Updated weights for policy 1, policy_version 33100 (0.0008) +[2023-10-08 17:03:40,917][21194] Updated weights for policy 1, policy_version 33110 (0.0007) +[2023-10-08 17:03:41,279][21194] Updated weights for policy 1, policy_version 33120 (0.0010) +[2023-10-08 17:03:42,772][21195] Updated weights for policy 0, policy_version 33350 (0.0009) +[2023-10-08 17:03:43,141][21195] Updated weights for policy 0, policy_version 33360 (0.0009) +[2023-10-08 17:03:43,517][21195] Updated weights for policy 0, policy_version 33370 (0.0009) +[2023-10-08 17:03:43,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 68091904. Throughput: 0: 1740.4, 1: 1724.4. Samples: 17030124. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:03:43,804][19739] Avg episode reward: [(0, '765.720'), (1, '1024.920')] +[2023-10-08 17:03:45,122][21194] Updated weights for policy 1, policy_version 33130 (0.0007) +[2023-10-08 17:03:45,493][21194] Updated weights for policy 1, policy_version 33140 (0.0010) +[2023-10-08 17:03:45,870][21194] Updated weights for policy 1, policy_version 33150 (0.0009) +[2023-10-08 17:03:47,580][21195] Updated weights for policy 0, policy_version 33380 (0.0008) +[2023-10-08 17:03:47,953][21195] Updated weights for policy 0, policy_version 33390 (0.0009) +[2023-10-08 17:03:48,319][21195] Updated weights for policy 0, policy_version 33400 (0.0009) +[2023-10-08 17:03:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 68157440. Throughput: 0: 1707.0, 1: 1704.1. Samples: 17044170. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:03:48,803][19739] Avg episode reward: [(0, '765.720'), (1, '1024.920')] +[2023-10-08 17:03:49,787][21194] Updated weights for policy 1, policy_version 33160 (0.0008) +[2023-10-08 17:03:50,163][21194] Updated weights for policy 1, policy_version 33170 (0.0008) +[2023-10-08 17:03:50,529][21194] Updated weights for policy 1, policy_version 33180 (0.0008) +[2023-10-08 17:03:52,217][21195] Updated weights for policy 0, policy_version 33410 (0.0007) +[2023-10-08 17:03:52,587][21195] Updated weights for policy 0, policy_version 33420 (0.0007) +[2023-10-08 17:03:52,954][21195] Updated weights for policy 0, policy_version 33430 (0.0007) +[2023-10-08 17:03:53,324][21195] Updated weights for policy 0, policy_version 33440 (0.0007) +[2023-10-08 17:03:53,802][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 68222976. Throughput: 0: 1733.0, 1: 1709.6. Samples: 17060730. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:03:53,803][19739] Avg episode reward: [(0, '764.620'), (1, '1024.920')] +[2023-10-08 17:03:54,475][21194] Updated weights for policy 1, policy_version 33190 (0.0007) +[2023-10-08 17:03:54,840][21194] Updated weights for policy 1, policy_version 33200 (0.0007) +[2023-10-08 17:03:55,208][21194] Updated weights for policy 1, policy_version 33210 (0.0010) +[2023-10-08 17:03:57,143][21195] Updated weights for policy 0, policy_version 33450 (0.0007) +[2023-10-08 17:03:57,514][21195] Updated weights for policy 0, policy_version 33460 (0.0007) +[2023-10-08 17:03:57,885][21195] Updated weights for policy 0, policy_version 33470 (0.0010) +[2023-10-08 17:03:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 68288512. Throughput: 0: 1715.6, 1: 1735.2. Samples: 17081458. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:03:58,803][19739] Avg episode reward: [(0, '774.220'), (1, '1024.920')] +[2023-10-08 17:03:59,185][21194] Updated weights for policy 1, policy_version 33220 (0.0009) +[2023-10-08 17:03:59,543][21194] Updated weights for policy 1, policy_version 33230 (0.0011) +[2023-10-08 17:03:59,902][21194] Updated weights for policy 1, policy_version 33240 (0.0009) +[2023-10-08 17:04:01,778][21195] Updated weights for policy 0, policy_version 33480 (0.0008) +[2023-10-08 17:04:02,144][21195] Updated weights for policy 0, policy_version 33490 (0.0007) +[2023-10-08 17:04:02,514][21195] Updated weights for policy 0, policy_version 33500 (0.0007) +[2023-10-08 17:04:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 68354048. Throughput: 0: 1711.6, 1: 1710.0. Samples: 17096508. Policy #0 lag: (min: 17.0, avg: 20.9, max: 39.0) +[2023-10-08 17:04:03,803][19739] Avg episode reward: [(0, '774.220'), (1, '1008.240')] +[2023-10-08 17:04:03,813][21194] Updated weights for policy 1, policy_version 33250 (0.0011) +[2023-10-08 17:04:04,170][21194] Updated weights for policy 1, policy_version 33260 (0.0007) +[2023-10-08 17:04:04,537][21194] Updated weights for policy 1, policy_version 33270 (0.0007) +[2023-10-08 17:04:04,910][21194] Updated weights for policy 1, policy_version 33280 (0.0007) +[2023-10-08 17:04:06,606][21195] Updated weights for policy 0, policy_version 33510 (0.0007) +[2023-10-08 17:04:06,984][21195] Updated weights for policy 0, policy_version 33520 (0.0008) +[2023-10-08 17:04:07,349][21195] Updated weights for policy 0, policy_version 33530 (0.0008) +[2023-10-08 17:04:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 68419584. Throughput: 0: 1721.3, 1: 1732.2. Samples: 17112666. Policy #0 lag: (min: 17.0, avg: 20.9, max: 39.0) +[2023-10-08 17:04:08,803][19739] Avg episode reward: [(0, '761.210'), (1, '1008.240')] +[2023-10-08 17:04:08,888][21194] Updated weights for policy 1, policy_version 33290 (0.0007) +[2023-10-08 17:04:09,255][21194] Updated weights for policy 1, policy_version 33300 (0.0007) +[2023-10-08 17:04:09,612][21194] Updated weights for policy 1, policy_version 33310 (0.0008) +[2023-10-08 17:04:11,003][21195] Updated weights for policy 0, policy_version 33540 (0.0008) +[2023-10-08 17:04:11,373][21195] Updated weights for policy 0, policy_version 33550 (0.0008) +[2023-10-08 17:04:11,735][21195] Updated weights for policy 0, policy_version 33560 (0.0009) +[2023-10-08 17:04:13,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 68485120. Throughput: 0: 1712.5, 1: 1728.1. Samples: 17133186. Policy #0 lag: (min: 17.0, avg: 20.9, max: 39.0) +[2023-10-08 17:04:13,803][19739] Avg episode reward: [(0, '761.210'), (1, '1008.590')] +[2023-10-08 17:04:13,821][21194] Updated weights for policy 1, policy_version 33320 (0.0009) +[2023-10-08 17:04:14,178][21194] Updated weights for policy 1, policy_version 33330 (0.0009) +[2023-10-08 17:04:14,553][21194] Updated weights for policy 1, policy_version 33340 (0.0008) +[2023-10-08 17:04:15,479][21195] Updated weights for policy 0, policy_version 33570 (0.0009) +[2023-10-08 17:04:15,851][21195] Updated weights for policy 0, policy_version 33580 (0.0009) +[2023-10-08 17:04:16,218][21195] Updated weights for policy 0, policy_version 33590 (0.0008) +[2023-10-08 17:04:16,585][21195] Updated weights for policy 0, policy_version 33600 (0.0008) +[2023-10-08 17:04:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 68550656. Throughput: 0: 1736.2, 1: 1711.8. Samples: 17148722. Policy #0 lag: (min: 17.0, avg: 20.9, max: 39.0) +[2023-10-08 17:04:18,803][19739] Avg episode reward: [(0, '761.210'), (1, '1008.590')] +[2023-10-08 17:04:18,817][21194] Updated weights for policy 1, policy_version 33350 (0.0009) +[2023-10-08 17:04:19,191][21194] Updated weights for policy 1, policy_version 33360 (0.0007) +[2023-10-08 17:04:19,554][21194] Updated weights for policy 1, policy_version 33370 (0.0007) +[2023-10-08 17:04:20,674][21195] Updated weights for policy 0, policy_version 33610 (0.0007) +[2023-10-08 17:04:21,045][21195] Updated weights for policy 0, policy_version 33620 (0.0007) +[2023-10-08 17:04:21,406][21195] Updated weights for policy 0, policy_version 33630 (0.0009) +[2023-10-08 17:04:23,286][21194] Updated weights for policy 1, policy_version 33380 (0.0008) +[2023-10-08 17:04:23,648][21194] Updated weights for policy 1, policy_version 33390 (0.0008) +[2023-10-08 17:04:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 68616192. Throughput: 0: 1713.0, 1: 1724.4. Samples: 17163776. Policy #0 lag: (min: 17.0, avg: 20.9, max: 39.0) +[2023-10-08 17:04:23,804][19739] Avg episode reward: [(0, '760.200'), (1, '1008.590')] +[2023-10-08 17:04:24,018][21194] Updated weights for policy 1, policy_version 33400 (0.0009) +[2023-10-08 17:04:25,467][21195] Updated weights for policy 0, policy_version 33640 (0.0009) +[2023-10-08 17:04:25,840][21195] Updated weights for policy 0, policy_version 33650 (0.0009) +[2023-10-08 17:04:26,201][21195] Updated weights for policy 0, policy_version 33660 (0.0010) +[2023-10-08 17:04:27,950][21194] Updated weights for policy 1, policy_version 33410 (0.0008) +[2023-10-08 17:04:28,317][21194] Updated weights for policy 1, policy_version 33420 (0.0009) +[2023-10-08 17:04:28,681][21194] Updated weights for policy 1, policy_version 33430 (0.0007) +[2023-10-08 17:04:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 68681728. Throughput: 0: 1724.2, 1: 1715.8. Samples: 17184926. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 17:04:28,803][19739] Avg episode reward: [(0, '761.350'), (1, '1008.590')] +[2023-10-08 17:04:29,047][21194] Updated weights for policy 1, policy_version 33440 (0.0011) +[2023-10-08 17:04:30,026][21195] Updated weights for policy 0, policy_version 33670 (0.0011) +[2023-10-08 17:04:30,399][21195] Updated weights for policy 0, policy_version 33680 (0.0009) +[2023-10-08 17:04:30,757][21195] Updated weights for policy 0, policy_version 33690 (0.0011) +[2023-10-08 17:04:33,014][21194] Updated weights for policy 1, policy_version 33450 (0.0010) +[2023-10-08 17:04:33,372][21194] Updated weights for policy 1, policy_version 33460 (0.0008) +[2023-10-08 17:04:33,735][21194] Updated weights for policy 1, policy_version 33470 (0.0010) +[2023-10-08 17:04:33,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 68747264. Throughput: 0: 1758.5, 1: 1720.8. Samples: 17200738. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 17:04:33,803][19739] Avg episode reward: [(0, '760.320'), (1, '1008.590')] +[2023-10-08 17:04:34,631][21195] Updated weights for policy 0, policy_version 33700 (0.0010) +[2023-10-08 17:04:35,004][21195] Updated weights for policy 0, policy_version 33710 (0.0008) +[2023-10-08 17:04:35,369][21195] Updated weights for policy 0, policy_version 33720 (0.0009) +[2023-10-08 17:04:37,791][21194] Updated weights for policy 1, policy_version 33480 (0.0009) +[2023-10-08 17:04:38,154][21194] Updated weights for policy 1, policy_version 33490 (0.0010) +[2023-10-08 17:04:38,528][21194] Updated weights for policy 1, policy_version 33500 (0.0009) +[2023-10-08 17:04:38,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 68845568. Throughput: 0: 1727.3, 1: 1722.8. Samples: 17215982. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 17:04:38,803][19739] Avg episode reward: [(0, '746.740'), (1, '995.020')] +[2023-10-08 17:04:39,217][21195] Updated weights for policy 0, policy_version 33730 (0.0008) +[2023-10-08 17:04:39,599][21195] Updated weights for policy 0, policy_version 33740 (0.0007) +[2023-10-08 17:04:39,967][21195] Updated weights for policy 0, policy_version 33750 (0.0007) +[2023-10-08 17:04:40,327][21195] Updated weights for policy 0, policy_version 33760 (0.0008) +[2023-10-08 17:04:42,448][21194] Updated weights for policy 1, policy_version 33510 (0.0009) +[2023-10-08 17:04:42,817][21194] Updated weights for policy 1, policy_version 33520 (0.0009) +[2023-10-08 17:04:43,194][21194] Updated weights for policy 1, policy_version 33530 (0.0008) +[2023-10-08 17:04:43,803][19739] Fps is (10 sec: 16383.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 68911104. Throughput: 0: 1754.3, 1: 1701.4. Samples: 17236966. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 17:04:43,804][19739] Avg episode reward: [(0, '746.740'), (1, '995.020')] +[2023-10-08 17:04:44,249][21195] Updated weights for policy 0, policy_version 33770 (0.0009) +[2023-10-08 17:04:44,622][21195] Updated weights for policy 0, policy_version 33780 (0.0007) +[2023-10-08 17:04:44,991][21195] Updated weights for policy 0, policy_version 33790 (0.0009) +[2023-10-08 17:04:47,230][21194] Updated weights for policy 1, policy_version 33540 (0.0008) +[2023-10-08 17:04:47,583][21194] Updated weights for policy 1, policy_version 33550 (0.0009) +[2023-10-08 17:04:47,945][21194] Updated weights for policy 1, policy_version 33560 (0.0007) +[2023-10-08 17:04:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 68976640. Throughput: 0: 1753.1, 1: 1720.7. Samples: 17252828. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 17:04:48,803][19739] Avg episode reward: [(0, '746.740'), (1, '980.390')] +[2023-10-08 17:04:48,810][21195] Updated weights for policy 0, policy_version 33800 (0.0007) +[2023-10-08 17:04:49,182][21195] Updated weights for policy 0, policy_version 33810 (0.0007) +[2023-10-08 17:04:49,555][21195] Updated weights for policy 0, policy_version 33820 (0.0007) +[2023-10-08 17:04:51,901][21194] Updated weights for policy 1, policy_version 33570 (0.0009) +[2023-10-08 17:04:52,264][21194] Updated weights for policy 1, policy_version 33580 (0.0009) +[2023-10-08 17:04:52,639][21194] Updated weights for policy 1, policy_version 33590 (0.0007) +[2023-10-08 17:04:53,005][21194] Updated weights for policy 1, policy_version 33600 (0.0010) +[2023-10-08 17:04:53,490][21195] Updated weights for policy 0, policy_version 33830 (0.0007) +[2023-10-08 17:04:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69042176. Throughput: 0: 1742.8, 1: 1710.0. Samples: 17268040. Policy #0 lag: (min: 16.0, avg: 45.0, max: 48.0) +[2023-10-08 17:04:53,803][19739] Avg episode reward: [(0, '746.740'), (1, '980.390')] +[2023-10-08 17:04:53,868][21195] Updated weights for policy 0, policy_version 33840 (0.0008) +[2023-10-08 17:04:54,243][21195] Updated weights for policy 0, policy_version 33850 (0.0007) +[2023-10-08 17:04:56,980][21194] Updated weights for policy 1, policy_version 33610 (0.0010) +[2023-10-08 17:04:57,356][21194] Updated weights for policy 1, policy_version 33620 (0.0008) +[2023-10-08 17:04:57,728][21194] Updated weights for policy 1, policy_version 33630 (0.0007) +[2023-10-08 17:04:58,016][21195] Updated weights for policy 0, policy_version 33860 (0.0010) +[2023-10-08 17:04:58,394][21195] Updated weights for policy 0, policy_version 33870 (0.0010) +[2023-10-08 17:04:58,764][21195] Updated weights for policy 0, policy_version 33880 (0.0009) +[2023-10-08 17:04:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69107712. Throughput: 0: 1760.0, 1: 1690.8. Samples: 17288468. Policy #0 lag: (min: 16.0, avg: 45.0, max: 48.0) +[2023-10-08 17:04:58,803][19739] Avg episode reward: [(0, '746.740'), (1, '951.320')] +[2023-10-08 17:05:01,701][21194] Updated weights for policy 1, policy_version 33640 (0.0007) +[2023-10-08 17:05:02,059][21194] Updated weights for policy 1, policy_version 33650 (0.0008) +[2023-10-08 17:05:02,433][21194] Updated weights for policy 1, policy_version 33660 (0.0007) +[2023-10-08 17:05:02,707][21195] Updated weights for policy 0, policy_version 33890 (0.0008) +[2023-10-08 17:05:03,077][21195] Updated weights for policy 0, policy_version 33900 (0.0008) +[2023-10-08 17:05:03,439][21195] Updated weights for policy 0, policy_version 33910 (0.0008) +[2023-10-08 17:05:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69173248. Throughput: 0: 1728.4, 1: 1718.4. Samples: 17303826. Policy #0 lag: (min: 16.0, avg: 45.0, max: 48.0) +[2023-10-08 17:05:03,803][19739] Avg episode reward: [(0, '746.740'), (1, '951.370')] +[2023-10-08 17:05:03,811][21195] Updated weights for policy 0, policy_version 33920 (0.0008) +[2023-10-08 17:05:06,498][21194] Updated weights for policy 1, policy_version 33670 (0.0008) +[2023-10-08 17:05:06,866][21194] Updated weights for policy 1, policy_version 33680 (0.0007) +[2023-10-08 17:05:07,219][21194] Updated weights for policy 1, policy_version 33690 (0.0007) +[2023-10-08 17:05:07,699][21195] Updated weights for policy 0, policy_version 33930 (0.0008) +[2023-10-08 17:05:08,064][21195] Updated weights for policy 0, policy_version 33940 (0.0010) +[2023-10-08 17:05:08,426][21195] Updated weights for policy 0, policy_version 33950 (0.0009) +[2023-10-08 17:05:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 69271552. Throughput: 0: 1759.4, 1: 1702.5. Samples: 17319564. Policy #0 lag: (min: 16.0, avg: 45.0, max: 48.0) +[2023-10-08 17:05:08,803][19739] Avg episode reward: [(0, '746.740'), (1, '959.560')] +[2023-10-08 17:05:11,187][21194] Updated weights for policy 1, policy_version 33700 (0.0007) +[2023-10-08 17:05:11,543][21194] Updated weights for policy 1, policy_version 33710 (0.0008) +[2023-10-08 17:05:11,919][21194] Updated weights for policy 1, policy_version 33720 (0.0008) +[2023-10-08 17:05:12,427][21195] Updated weights for policy 0, policy_version 33960 (0.0007) +[2023-10-08 17:05:12,805][21195] Updated weights for policy 0, policy_version 33970 (0.0008) +[2023-10-08 17:05:13,193][21195] Updated weights for policy 0, policy_version 33980 (0.0009) +[2023-10-08 17:05:13,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 69337088. Throughput: 0: 1741.6, 1: 1698.3. Samples: 17339722. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:05:13,803][19739] Avg episode reward: [(0, '740.500'), (1, '959.690')] +[2023-10-08 17:05:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000033728_34537472.pth... +[2023-10-08 17:05:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000033984_34799616.pth... +[2023-10-08 17:05:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000032128_32899072.pth +[2023-10-08 17:05:13,855][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000032352_33128448.pth +[2023-10-08 17:05:15,923][21194] Updated weights for policy 1, policy_version 33730 (0.0007) +[2023-10-08 17:05:16,291][21194] Updated weights for policy 1, policy_version 33740 (0.0009) +[2023-10-08 17:05:16,647][21194] Updated weights for policy 1, policy_version 33750 (0.0010) +[2023-10-08 17:05:17,013][21194] Updated weights for policy 1, policy_version 33760 (0.0009) +[2023-10-08 17:05:17,077][21195] Updated weights for policy 0, policy_version 33990 (0.0008) +[2023-10-08 17:05:17,441][21195] Updated weights for policy 0, policy_version 34000 (0.0007) +[2023-10-08 17:05:17,807][21195] Updated weights for policy 0, policy_version 34010 (0.0007) +[2023-10-08 17:05:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 69402624. Throughput: 0: 1726.8, 1: 1715.5. Samples: 17355642. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:05:18,803][19739] Avg episode reward: [(0, '740.500'), (1, '959.690')] +[2023-10-08 17:05:20,880][21194] Updated weights for policy 1, policy_version 33770 (0.0009) +[2023-10-08 17:05:21,244][21194] Updated weights for policy 1, policy_version 33780 (0.0009) +[2023-10-08 17:05:21,609][21194] Updated weights for policy 1, policy_version 33790 (0.0009) +[2023-10-08 17:05:21,614][21195] Updated weights for policy 0, policy_version 34020 (0.0008) +[2023-10-08 17:05:21,981][21195] Updated weights for policy 0, policy_version 34030 (0.0009) +[2023-10-08 17:05:22,346][21195] Updated weights for policy 0, policy_version 34040 (0.0008) +[2023-10-08 17:05:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 69468160. Throughput: 0: 1750.5, 1: 1691.4. Samples: 17370870. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:05:23,804][19739] Avg episode reward: [(0, '755.170'), (1, '959.690')] +[2023-10-08 17:05:25,591][21194] Updated weights for policy 1, policy_version 33800 (0.0010) +[2023-10-08 17:05:25,960][21194] Updated weights for policy 1, policy_version 33810 (0.0011) +[2023-10-08 17:05:26,196][21195] Updated weights for policy 0, policy_version 34050 (0.0010) +[2023-10-08 17:05:26,316][21194] Updated weights for policy 1, policy_version 33820 (0.0009) +[2023-10-08 17:05:26,563][21195] Updated weights for policy 0, policy_version 34060 (0.0007) +[2023-10-08 17:05:26,941][21195] Updated weights for policy 0, policy_version 34070 (0.0008) +[2023-10-08 17:05:27,304][21195] Updated weights for policy 0, policy_version 34080 (0.0007) +[2023-10-08 17:05:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 69533696. Throughput: 0: 1719.8, 1: 1715.9. Samples: 17391574. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:05:28,803][19739] Avg episode reward: [(0, '794.700'), (1, '950.300')] +[2023-10-08 17:05:30,208][21194] Updated weights for policy 1, policy_version 33830 (0.0009) +[2023-10-08 17:05:30,577][21194] Updated weights for policy 1, policy_version 33840 (0.0007) +[2023-10-08 17:05:30,943][21194] Updated weights for policy 1, policy_version 33850 (0.0009) +[2023-10-08 17:05:31,233][21195] Updated weights for policy 0, policy_version 34090 (0.0010) +[2023-10-08 17:05:31,607][21195] Updated weights for policy 0, policy_version 34100 (0.0008) +[2023-10-08 17:05:31,985][21195] Updated weights for policy 0, policy_version 34110 (0.0011) +[2023-10-08 17:05:33,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 69599232. Throughput: 0: 1731.6, 1: 1702.8. Samples: 17407374. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:05:33,803][19739] Avg episode reward: [(0, '780.160'), (1, '950.340')] +[2023-10-08 17:05:34,922][21194] Updated weights for policy 1, policy_version 33860 (0.0009) +[2023-10-08 17:05:35,294][21194] Updated weights for policy 1, policy_version 33870 (0.0007) +[2023-10-08 17:05:35,652][21194] Updated weights for policy 1, policy_version 33880 (0.0007) +[2023-10-08 17:05:35,679][21195] Updated weights for policy 0, policy_version 34120 (0.0009) +[2023-10-08 17:05:36,050][21195] Updated weights for policy 0, policy_version 34130 (0.0007) +[2023-10-08 17:05:36,406][21195] Updated weights for policy 0, policy_version 34140 (0.0007) +[2023-10-08 17:05:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69664768. Throughput: 0: 1727.7, 1: 1709.3. Samples: 17422706. Policy #0 lag: (min: 1.0, avg: 5.1, max: 33.0) +[2023-10-08 17:05:38,803][19739] Avg episode reward: [(0, '766.060'), (1, '950.340')] +[2023-10-08 17:05:39,631][21194] Updated weights for policy 1, policy_version 33890 (0.0007) +[2023-10-08 17:05:39,994][21194] Updated weights for policy 1, policy_version 33900 (0.0008) +[2023-10-08 17:05:40,358][21194] Updated weights for policy 1, policy_version 33910 (0.0008) +[2023-10-08 17:05:40,536][21195] Updated weights for policy 0, policy_version 34150 (0.0008) +[2023-10-08 17:05:40,716][21194] Updated weights for policy 1, policy_version 33920 (0.0008) +[2023-10-08 17:05:40,916][21195] Updated weights for policy 0, policy_version 34160 (0.0009) +[2023-10-08 17:05:41,277][21195] Updated weights for policy 0, policy_version 34170 (0.0009) +[2023-10-08 17:05:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 69730304. Throughput: 0: 1725.0, 1: 1727.6. Samples: 17443832. Policy #0 lag: (min: 1.0, avg: 5.1, max: 33.0) +[2023-10-08 17:05:43,803][19739] Avg episode reward: [(0, '766.060'), (1, '950.340')] +[2023-10-08 17:05:44,738][21194] Updated weights for policy 1, policy_version 33930 (0.0007) +[2023-10-08 17:05:45,064][21195] Updated weights for policy 0, policy_version 34180 (0.0008) +[2023-10-08 17:05:45,107][21194] Updated weights for policy 1, policy_version 33940 (0.0007) +[2023-10-08 17:05:45,431][21195] Updated weights for policy 0, policy_version 34190 (0.0007) +[2023-10-08 17:05:45,471][21194] Updated weights for policy 1, policy_version 33950 (0.0008) +[2023-10-08 17:05:45,797][21195] Updated weights for policy 0, policy_version 34200 (0.0010) +[2023-10-08 17:05:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69795840. Throughput: 0: 1750.1, 1: 1701.8. Samples: 17459162. Policy #0 lag: (min: 1.0, avg: 5.1, max: 33.0) +[2023-10-08 17:05:48,803][19739] Avg episode reward: [(0, '766.060'), (1, '950.140')] +[2023-10-08 17:05:49,431][21194] Updated weights for policy 1, policy_version 33960 (0.0008) +[2023-10-08 17:05:49,803][21195] Updated weights for policy 0, policy_version 34210 (0.0010) +[2023-10-08 17:05:49,804][21194] Updated weights for policy 1, policy_version 33970 (0.0008) +[2023-10-08 17:05:50,169][21194] Updated weights for policy 1, policy_version 33980 (0.0007) +[2023-10-08 17:05:50,169][21195] Updated weights for policy 0, policy_version 34220 (0.0009) +[2023-10-08 17:05:50,536][21195] Updated weights for policy 0, policy_version 34230 (0.0010) +[2023-10-08 17:05:50,901][21195] Updated weights for policy 0, policy_version 34240 (0.0010) +[2023-10-08 17:05:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69861376. Throughput: 0: 1720.0, 1: 1719.7. Samples: 17474350. Policy #0 lag: (min: 1.0, avg: 5.1, max: 33.0) +[2023-10-08 17:05:53,803][19739] Avg episode reward: [(0, '766.060'), (1, '950.140')] +[2023-10-08 17:05:54,106][21194] Updated weights for policy 1, policy_version 33990 (0.0008) +[2023-10-08 17:05:54,494][21194] Updated weights for policy 1, policy_version 34000 (0.0011) +[2023-10-08 17:05:54,862][21194] Updated weights for policy 1, policy_version 34010 (0.0007) +[2023-10-08 17:05:54,888][21195] Updated weights for policy 0, policy_version 34250 (0.0007) +[2023-10-08 17:05:55,255][21195] Updated weights for policy 0, policy_version 34260 (0.0007) +[2023-10-08 17:05:55,629][21195] Updated weights for policy 0, policy_version 34270 (0.0010) +[2023-10-08 17:05:58,775][21194] Updated weights for policy 1, policy_version 34020 (0.0008) +[2023-10-08 17:05:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 69926912. Throughput: 0: 1738.9, 1: 1730.3. Samples: 17495836. Policy #0 lag: (min: 1.0, avg: 5.1, max: 33.0) +[2023-10-08 17:05:58,803][19739] Avg episode reward: [(0, '766.060'), (1, '935.520')] +[2023-10-08 17:05:59,142][21194] Updated weights for policy 1, policy_version 34030 (0.0009) +[2023-10-08 17:05:59,522][21194] Updated weights for policy 1, policy_version 34040 (0.0008) +[2023-10-08 17:05:59,543][21195] Updated weights for policy 0, policy_version 34280 (0.0010) +[2023-10-08 17:05:59,910][21195] Updated weights for policy 0, policy_version 34290 (0.0007) +[2023-10-08 17:06:00,285][21195] Updated weights for policy 0, policy_version 34300 (0.0007) +[2023-10-08 17:06:03,498][21194] Updated weights for policy 1, policy_version 34050 (0.0008) +[2023-10-08 17:06:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 69992448. Throughput: 0: 1751.3, 1: 1708.1. Samples: 17511316. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:06:03,804][19739] Avg episode reward: [(0, '766.160'), (1, '935.520')] +[2023-10-08 17:06:03,859][21194] Updated weights for policy 1, policy_version 34060 (0.0008) +[2023-10-08 17:06:04,226][21194] Updated weights for policy 1, policy_version 34070 (0.0008) +[2023-10-08 17:06:04,318][21195] Updated weights for policy 0, policy_version 34310 (0.0009) +[2023-10-08 17:06:04,581][21194] Updated weights for policy 1, policy_version 34080 (0.0010) +[2023-10-08 17:06:04,687][21195] Updated weights for policy 0, policy_version 34320 (0.0009) +[2023-10-08 17:06:05,058][21195] Updated weights for policy 0, policy_version 34330 (0.0008) +[2023-10-08 17:06:08,615][21194] Updated weights for policy 1, policy_version 34090 (0.0008) +[2023-10-08 17:06:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 70057984. Throughput: 0: 1728.9, 1: 1734.0. Samples: 17526698. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:06:08,803][19739] Avg episode reward: [(0, '766.160'), (1, '941.210')] +[2023-10-08 17:06:08,894][21195] Updated weights for policy 0, policy_version 34340 (0.0008) +[2023-10-08 17:06:08,976][21194] Updated weights for policy 1, policy_version 34100 (0.0008) +[2023-10-08 17:06:09,265][21195] Updated weights for policy 0, policy_version 34350 (0.0007) +[2023-10-08 17:06:09,337][21194] Updated weights for policy 1, policy_version 34110 (0.0008) +[2023-10-08 17:06:09,630][21195] Updated weights for policy 0, policy_version 34360 (0.0007) +[2023-10-08 17:06:13,319][21194] Updated weights for policy 1, policy_version 34120 (0.0009) +[2023-10-08 17:06:13,429][21195] Updated weights for policy 0, policy_version 34370 (0.0009) +[2023-10-08 17:06:13,695][21194] Updated weights for policy 1, policy_version 34130 (0.0010) +[2023-10-08 17:06:13,790][21195] Updated weights for policy 0, policy_version 34380 (0.0008) +[2023-10-08 17:06:13,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 70123520. Throughput: 0: 1753.5, 1: 1725.0. Samples: 17548104. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:06:13,803][19739] Avg episode reward: [(0, '760.490'), (1, '941.210')] +[2023-10-08 17:06:14,055][21194] Updated weights for policy 1, policy_version 34140 (0.0009) +[2023-10-08 17:06:14,164][21195] Updated weights for policy 0, policy_version 34390 (0.0008) +[2023-10-08 17:06:14,539][21195] Updated weights for policy 0, policy_version 34400 (0.0008) +[2023-10-08 17:06:17,917][21194] Updated weights for policy 1, policy_version 34150 (0.0008) +[2023-10-08 17:06:18,281][21194] Updated weights for policy 1, policy_version 34160 (0.0008) +[2023-10-08 17:06:18,612][21195] Updated weights for policy 0, policy_version 34410 (0.0007) +[2023-10-08 17:06:18,649][21194] Updated weights for policy 1, policy_version 34170 (0.0007) +[2023-10-08 17:06:18,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 70189056. Throughput: 0: 1735.8, 1: 1721.6. Samples: 17562956. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:06:18,803][19739] Avg episode reward: [(0, '774.710'), (1, '938.990')] +[2023-10-08 17:06:18,980][21195] Updated weights for policy 0, policy_version 34420 (0.0009) +[2023-10-08 17:06:19,350][21195] Updated weights for policy 0, policy_version 34430 (0.0008) +[2023-10-08 17:06:22,625][21194] Updated weights for policy 1, policy_version 34180 (0.0008) +[2023-10-08 17:06:22,987][21194] Updated weights for policy 1, policy_version 34190 (0.0010) +[2023-10-08 17:06:23,284][21195] Updated weights for policy 0, policy_version 34440 (0.0007) +[2023-10-08 17:06:23,359][21194] Updated weights for policy 1, policy_version 34200 (0.0008) +[2023-10-08 17:06:23,639][21195] Updated weights for policy 0, policy_version 34450 (0.0007) +[2023-10-08 17:06:23,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 70287360. Throughput: 0: 1747.0, 1: 1727.9. Samples: 17579076. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:06:23,804][19739] Avg episode reward: [(0, '774.710'), (1, '938.990')] +[2023-10-08 17:06:24,010][21195] Updated weights for policy 0, policy_version 34460 (0.0007) +[2023-10-08 17:06:27,336][21194] Updated weights for policy 1, policy_version 34210 (0.0009) +[2023-10-08 17:06:27,700][21194] Updated weights for policy 1, policy_version 34220 (0.0008) +[2023-10-08 17:06:27,923][21195] Updated weights for policy 0, policy_version 34470 (0.0008) +[2023-10-08 17:06:28,073][21194] Updated weights for policy 1, policy_version 34230 (0.0007) +[2023-10-08 17:06:28,316][21195] Updated weights for policy 0, policy_version 34480 (0.0009) +[2023-10-08 17:06:28,438][21194] Updated weights for policy 1, policy_version 34240 (0.0008) +[2023-10-08 17:06:28,690][21195] Updated weights for policy 0, policy_version 34490 (0.0008) +[2023-10-08 17:06:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 70352896. Throughput: 0: 1742.0, 1: 1714.9. Samples: 17599396. Policy #0 lag: (min: 20.0, avg: 23.0, max: 52.0) +[2023-10-08 17:06:28,803][19739] Avg episode reward: [(0, '774.710'), (1, '944.270')] +[2023-10-08 17:06:32,351][21194] Updated weights for policy 1, policy_version 34250 (0.0009) +[2023-10-08 17:06:32,621][21195] Updated weights for policy 0, policy_version 34500 (0.0008) +[2023-10-08 17:06:32,727][21194] Updated weights for policy 1, policy_version 34260 (0.0008) +[2023-10-08 17:06:32,990][21195] Updated weights for policy 0, policy_version 34510 (0.0007) +[2023-10-08 17:06:33,096][21194] Updated weights for policy 1, policy_version 34270 (0.0007) +[2023-10-08 17:06:33,369][21195] Updated weights for policy 0, policy_version 34520 (0.0007) +[2023-10-08 17:06:33,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 70451200. Throughput: 0: 1715.1, 1: 1732.1. Samples: 17614288. Policy #0 lag: (min: 20.0, avg: 23.0, max: 52.0) +[2023-10-08 17:06:33,803][19739] Avg episode reward: [(0, '774.710'), (1, '945.020')] +[2023-10-08 17:06:37,102][21194] Updated weights for policy 1, policy_version 34280 (0.0007) +[2023-10-08 17:06:37,213][21195] Updated weights for policy 0, policy_version 34530 (0.0007) +[2023-10-08 17:06:37,465][21194] Updated weights for policy 1, policy_version 34290 (0.0007) +[2023-10-08 17:06:37,588][21195] Updated weights for policy 0, policy_version 34540 (0.0008) +[2023-10-08 17:06:37,828][21194] Updated weights for policy 1, policy_version 34300 (0.0007) +[2023-10-08 17:06:37,954][21195] Updated weights for policy 0, policy_version 34550 (0.0008) +[2023-10-08 17:06:38,319][21195] Updated weights for policy 0, policy_version 34560 (0.0009) +[2023-10-08 17:06:38,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 70516736. Throughput: 0: 1747.0, 1: 1726.5. Samples: 17630660. Policy #0 lag: (min: 20.0, avg: 23.0, max: 52.0) +[2023-10-08 17:06:38,804][19739] Avg episode reward: [(0, '774.710'), (1, '940.010')] +[2023-10-08 17:06:41,884][21194] Updated weights for policy 1, policy_version 34310 (0.0009) +[2023-10-08 17:06:42,256][21195] Updated weights for policy 0, policy_version 34570 (0.0008) +[2023-10-08 17:06:42,257][21194] Updated weights for policy 1, policy_version 34320 (0.0008) +[2023-10-08 17:06:42,622][21195] Updated weights for policy 0, policy_version 34580 (0.0007) +[2023-10-08 17:06:42,628][21194] Updated weights for policy 1, policy_version 34330 (0.0009) +[2023-10-08 17:06:42,994][21195] Updated weights for policy 0, policy_version 34590 (0.0008) +[2023-10-08 17:06:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 70582272. Throughput: 0: 1724.4, 1: 1699.7. Samples: 17649920. Policy #0 lag: (min: 20.0, avg: 23.0, max: 52.0) +[2023-10-08 17:06:43,803][19739] Avg episode reward: [(0, '774.710'), (1, '937.170')] +[2023-10-08 17:06:46,522][21194] Updated weights for policy 1, policy_version 34340 (0.0008) +[2023-10-08 17:06:46,896][21194] Updated weights for policy 1, policy_version 34350 (0.0008) +[2023-10-08 17:06:46,898][21195] Updated weights for policy 0, policy_version 34600 (0.0008) +[2023-10-08 17:06:47,263][21194] Updated weights for policy 1, policy_version 34360 (0.0009) +[2023-10-08 17:06:47,266][21195] Updated weights for policy 0, policy_version 34610 (0.0007) +[2023-10-08 17:06:47,628][21195] Updated weights for policy 0, policy_version 34620 (0.0009) +[2023-10-08 17:06:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 70647808. Throughput: 0: 1714.1, 1: 1731.2. Samples: 17666354. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 17:06:48,803][19739] Avg episode reward: [(0, '774.710'), (1, '943.960')] +[2023-10-08 17:06:51,331][21194] Updated weights for policy 1, policy_version 34370 (0.0009) +[2023-10-08 17:06:51,585][21195] Updated weights for policy 0, policy_version 34630 (0.0008) +[2023-10-08 17:06:51,693][21194] Updated weights for policy 1, policy_version 34380 (0.0008) +[2023-10-08 17:06:51,961][21195] Updated weights for policy 0, policy_version 34640 (0.0008) +[2023-10-08 17:06:52,062][21194] Updated weights for policy 1, policy_version 34390 (0.0007) +[2023-10-08 17:06:52,323][21195] Updated weights for policy 0, policy_version 34650 (0.0007) +[2023-10-08 17:06:52,427][21194] Updated weights for policy 1, policy_version 34400 (0.0010) +[2023-10-08 17:06:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 70713344. Throughput: 0: 1730.1, 1: 1706.8. Samples: 17681360. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 17:06:53,804][19739] Avg episode reward: [(0, '747.540'), (1, '943.960')] +[2023-10-08 17:06:56,338][21195] Updated weights for policy 0, policy_version 34660 (0.0009) +[2023-10-08 17:06:56,348][21194] Updated weights for policy 1, policy_version 34410 (0.0009) +[2023-10-08 17:06:56,704][21195] Updated weights for policy 0, policy_version 34670 (0.0009) +[2023-10-08 17:06:56,712][21194] Updated weights for policy 1, policy_version 34420 (0.0007) +[2023-10-08 17:06:57,067][21195] Updated weights for policy 0, policy_version 34680 (0.0009) +[2023-10-08 17:06:57,078][21194] Updated weights for policy 1, policy_version 34430 (0.0008) +[2023-10-08 17:06:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 70778880. Throughput: 0: 1708.0, 1: 1698.9. Samples: 17701414. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 17:06:58,803][19739] Avg episode reward: [(0, '747.540'), (1, '943.960')] +[2023-10-08 17:07:01,094][21194] Updated weights for policy 1, policy_version 34440 (0.0009) +[2023-10-08 17:07:01,190][21195] Updated weights for policy 0, policy_version 34690 (0.0008) +[2023-10-08 17:07:01,450][21194] Updated weights for policy 1, policy_version 34450 (0.0008) +[2023-10-08 17:07:01,569][21195] Updated weights for policy 0, policy_version 34700 (0.0008) +[2023-10-08 17:07:01,816][21194] Updated weights for policy 1, policy_version 34460 (0.0010) +[2023-10-08 17:07:01,924][21195] Updated weights for policy 0, policy_version 34710 (0.0010) +[2023-10-08 17:07:02,297][21195] Updated weights for policy 0, policy_version 34720 (0.0007) +[2023-10-08 17:07:03,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 70844416. Throughput: 0: 1717.9, 1: 1718.2. Samples: 17717580. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 17:07:03,803][19739] Avg episode reward: [(0, '734.970'), (1, '943.960')] +[2023-10-08 17:07:05,750][21194] Updated weights for policy 1, policy_version 34470 (0.0009) +[2023-10-08 17:07:06,121][21194] Updated weights for policy 1, policy_version 34480 (0.0007) +[2023-10-08 17:07:06,182][21195] Updated weights for policy 0, policy_version 34730 (0.0007) +[2023-10-08 17:07:06,480][21194] Updated weights for policy 1, policy_version 34490 (0.0007) +[2023-10-08 17:07:06,559][21195] Updated weights for policy 0, policy_version 34740 (0.0008) +[2023-10-08 17:07:06,927][21195] Updated weights for policy 0, policy_version 34750 (0.0009) +[2023-10-08 17:07:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 70909952. Throughput: 0: 1709.5, 1: 1697.3. Samples: 17732380. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 17:07:08,804][19739] Avg episode reward: [(0, '731.180'), (1, '935.880')] +[2023-10-08 17:07:10,411][21194] Updated weights for policy 1, policy_version 34500 (0.0007) +[2023-10-08 17:07:10,781][21194] Updated weights for policy 1, policy_version 34510 (0.0007) +[2023-10-08 17:07:10,956][21195] Updated weights for policy 0, policy_version 34760 (0.0008) +[2023-10-08 17:07:11,145][21194] Updated weights for policy 1, policy_version 34520 (0.0008) +[2023-10-08 17:07:11,335][21195] Updated weights for policy 0, policy_version 34770 (0.0007) +[2023-10-08 17:07:11,708][21195] Updated weights for policy 0, policy_version 34780 (0.0009) +[2023-10-08 17:07:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 70975488. Throughput: 0: 1705.8, 1: 1715.9. Samples: 17753372. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:07:13,803][19739] Avg episode reward: [(0, '731.180'), (1, '935.980')] +[2023-10-08 17:07:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000034784_35618816.pth... +[2023-10-08 17:07:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000034528_35356672.pth... +[2023-10-08 17:07:13,850][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000032928_33718272.pth +[2023-10-08 17:07:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000033152_33947648.pth +[2023-10-08 17:07:15,041][21194] Updated weights for policy 1, policy_version 34530 (0.0009) +[2023-10-08 17:07:15,409][21194] Updated weights for policy 1, policy_version 34540 (0.0009) +[2023-10-08 17:07:15,530][21195] Updated weights for policy 0, policy_version 34790 (0.0008) +[2023-10-08 17:07:15,778][21194] Updated weights for policy 1, policy_version 34550 (0.0009) +[2023-10-08 17:07:15,903][21195] Updated weights for policy 0, policy_version 34800 (0.0008) +[2023-10-08 17:07:16,137][21194] Updated weights for policy 1, policy_version 34560 (0.0009) +[2023-10-08 17:07:16,266][21195] Updated weights for policy 0, policy_version 34810 (0.0008) +[2023-10-08 17:07:18,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 71041024. Throughput: 0: 1737.7, 1: 1703.0. Samples: 17769118. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:07:18,803][19739] Avg episode reward: [(0, '731.180'), (1, '935.980')] +[2023-10-08 17:07:20,030][21195] Updated weights for policy 0, policy_version 34820 (0.0007) +[2023-10-08 17:07:20,337][21194] Updated weights for policy 1, policy_version 34570 (0.0009) +[2023-10-08 17:07:20,399][21195] Updated weights for policy 0, policy_version 34830 (0.0007) +[2023-10-08 17:07:20,700][21194] Updated weights for policy 1, policy_version 34580 (0.0009) +[2023-10-08 17:07:20,763][21195] Updated weights for policy 0, policy_version 34840 (0.0008) +[2023-10-08 17:07:21,066][21194] Updated weights for policy 1, policy_version 34590 (0.0007) +[2023-10-08 17:07:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 71106560. Throughput: 0: 1707.3, 1: 1703.2. Samples: 17784130. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:07:23,803][19739] Avg episode reward: [(0, '731.180'), (1, '935.980')] +[2023-10-08 17:07:24,865][21195] Updated weights for policy 0, policy_version 34850 (0.0008) +[2023-10-08 17:07:25,099][21194] Updated weights for policy 1, policy_version 34600 (0.0007) +[2023-10-08 17:07:25,234][21195] Updated weights for policy 0, policy_version 34860 (0.0007) +[2023-10-08 17:07:25,469][21194] Updated weights for policy 1, policy_version 34610 (0.0007) +[2023-10-08 17:07:25,604][21195] Updated weights for policy 0, policy_version 34870 (0.0008) +[2023-10-08 17:07:25,826][21194] Updated weights for policy 1, policy_version 34620 (0.0008) +[2023-10-08 17:07:25,965][21195] Updated weights for policy 0, policy_version 34880 (0.0007) +[2023-10-08 17:07:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 71172096. Throughput: 0: 1727.4, 1: 1731.0. Samples: 17805548. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:07:28,803][19739] Avg episode reward: [(0, '731.180'), (1, '950.980')] +[2023-10-08 17:07:29,754][21195] Updated weights for policy 0, policy_version 34890 (0.0008) +[2023-10-08 17:07:29,868][21194] Updated weights for policy 1, policy_version 34630 (0.0009) +[2023-10-08 17:07:30,127][21195] Updated weights for policy 0, policy_version 34900 (0.0008) +[2023-10-08 17:07:30,257][21194] Updated weights for policy 1, policy_version 34640 (0.0007) +[2023-10-08 17:07:30,500][21195] Updated weights for policy 0, policy_version 34910 (0.0010) +[2023-10-08 17:07:30,622][21194] Updated weights for policy 1, policy_version 34650 (0.0007) +[2023-10-08 17:07:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 71237632. Throughput: 0: 1742.2, 1: 1697.6. Samples: 17821146. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 17:07:33,803][19739] Avg episode reward: [(0, '745.660'), (1, '950.980')] +[2023-10-08 17:07:34,299][21195] Updated weights for policy 0, policy_version 34920 (0.0009) +[2023-10-08 17:07:34,455][21194] Updated weights for policy 1, policy_version 34660 (0.0009) +[2023-10-08 17:07:34,666][21195] Updated weights for policy 0, policy_version 34930 (0.0008) +[2023-10-08 17:07:34,817][21194] Updated weights for policy 1, policy_version 34670 (0.0007) +[2023-10-08 17:07:35,028][21195] Updated weights for policy 0, policy_version 34940 (0.0007) +[2023-10-08 17:07:35,182][21194] Updated weights for policy 1, policy_version 34680 (0.0008) +[2023-10-08 17:07:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 71303168. Throughput: 0: 1726.1, 1: 1718.7. Samples: 17836374. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:07:38,803][19739] Avg episode reward: [(0, '745.660'), (1, '950.980')] +[2023-10-08 17:07:39,059][21195] Updated weights for policy 0, policy_version 34950 (0.0008) +[2023-10-08 17:07:39,191][21194] Updated weights for policy 1, policy_version 34690 (0.0008) +[2023-10-08 17:07:39,434][21195] Updated weights for policy 0, policy_version 34960 (0.0008) +[2023-10-08 17:07:39,568][21194] Updated weights for policy 1, policy_version 34700 (0.0007) +[2023-10-08 17:07:39,800][21195] Updated weights for policy 0, policy_version 34970 (0.0010) +[2023-10-08 17:07:39,938][21194] Updated weights for policy 1, policy_version 34710 (0.0008) +[2023-10-08 17:07:40,295][21194] Updated weights for policy 1, policy_version 34720 (0.0009) +[2023-10-08 17:07:43,656][21195] Updated weights for policy 0, policy_version 34980 (0.0008) +[2023-10-08 17:07:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 71368704. Throughput: 0: 1748.7, 1: 1731.6. Samples: 17858026. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:07:43,804][19739] Avg episode reward: [(0, '745.660'), (1, '950.980')] +[2023-10-08 17:07:44,020][21195] Updated weights for policy 0, policy_version 34990 (0.0009) +[2023-10-08 17:07:44,115][21194] Updated weights for policy 1, policy_version 34730 (0.0007) +[2023-10-08 17:07:44,389][21195] Updated weights for policy 0, policy_version 35000 (0.0007) +[2023-10-08 17:07:44,485][21194] Updated weights for policy 1, policy_version 34740 (0.0008) +[2023-10-08 17:07:44,845][21194] Updated weights for policy 1, policy_version 34750 (0.0008) +[2023-10-08 17:07:48,270][21195] Updated weights for policy 0, policy_version 35010 (0.0007) +[2023-10-08 17:07:48,637][21195] Updated weights for policy 0, policy_version 35020 (0.0008) +[2023-10-08 17:07:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 71434240. Throughput: 0: 1735.2, 1: 1710.7. Samples: 17872644. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:07:48,803][19739] Avg episode reward: [(0, '759.560'), (1, '960.970')] +[2023-10-08 17:07:48,842][21194] Updated weights for policy 1, policy_version 34760 (0.0009) +[2023-10-08 17:07:48,999][21195] Updated weights for policy 0, policy_version 35030 (0.0009) +[2023-10-08 17:07:49,200][21194] Updated weights for policy 1, policy_version 34770 (0.0009) +[2023-10-08 17:07:49,375][21195] Updated weights for policy 0, policy_version 35040 (0.0008) +[2023-10-08 17:07:49,577][21194] Updated weights for policy 1, policy_version 34780 (0.0007) +[2023-10-08 17:07:53,356][21195] Updated weights for policy 0, policy_version 35050 (0.0007) +[2023-10-08 17:07:53,635][21194] Updated weights for policy 1, policy_version 34790 (0.0009) +[2023-10-08 17:07:53,723][21195] Updated weights for policy 0, policy_version 35060 (0.0008) +[2023-10-08 17:07:53,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 71499776. Throughput: 0: 1742.8, 1: 1722.7. Samples: 17888328. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:07:53,803][19739] Avg episode reward: [(0, '759.560'), (1, '950.560')] +[2023-10-08 17:07:54,009][21194] Updated weights for policy 1, policy_version 34800 (0.0008) +[2023-10-08 17:07:54,091][21195] Updated weights for policy 0, policy_version 35070 (0.0009) +[2023-10-08 17:07:54,371][21194] Updated weights for policy 1, policy_version 34810 (0.0007) +[2023-10-08 17:07:57,941][21195] Updated weights for policy 0, policy_version 35080 (0.0009) +[2023-10-08 17:07:58,307][21195] Updated weights for policy 0, policy_version 35090 (0.0007) +[2023-10-08 17:07:58,380][21194] Updated weights for policy 1, policy_version 34820 (0.0010) +[2023-10-08 17:07:58,680][21195] Updated weights for policy 0, policy_version 35100 (0.0007) +[2023-10-08 17:07:58,735][21194] Updated weights for policy 1, policy_version 34830 (0.0007) +[2023-10-08 17:07:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 71565312. Throughput: 0: 1754.8, 1: 1720.8. Samples: 17909778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:07:58,804][19739] Avg episode reward: [(0, '759.560'), (1, '950.560')] +[2023-10-08 17:07:59,102][21194] Updated weights for policy 1, policy_version 34840 (0.0009) +[2023-10-08 17:08:02,698][21195] Updated weights for policy 0, policy_version 35110 (0.0007) +[2023-10-08 17:08:03,026][21194] Updated weights for policy 1, policy_version 34850 (0.0010) +[2023-10-08 17:08:03,088][21195] Updated weights for policy 0, policy_version 35120 (0.0008) +[2023-10-08 17:08:03,404][21194] Updated weights for policy 1, policy_version 34860 (0.0008) +[2023-10-08 17:08:03,453][21195] Updated weights for policy 0, policy_version 35130 (0.0007) +[2023-10-08 17:08:03,759][21194] Updated weights for policy 1, policy_version 34870 (0.0008) +[2023-10-08 17:08:03,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 71663616. Throughput: 0: 1724.3, 1: 1717.1. Samples: 17923978. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:08:03,804][19739] Avg episode reward: [(0, '760.180'), (1, '905.850')] +[2023-10-08 17:08:04,135][21194] Updated weights for policy 1, policy_version 34880 (0.0010) +[2023-10-08 17:08:07,352][21195] Updated weights for policy 0, policy_version 35140 (0.0007) +[2023-10-08 17:08:07,725][21195] Updated weights for policy 0, policy_version 35150 (0.0007) +[2023-10-08 17:08:08,054][21194] Updated weights for policy 1, policy_version 34890 (0.0007) +[2023-10-08 17:08:08,087][21195] Updated weights for policy 0, policy_version 35160 (0.0008) +[2023-10-08 17:08:08,415][21194] Updated weights for policy 1, policy_version 34900 (0.0009) +[2023-10-08 17:08:08,790][21194] Updated weights for policy 1, policy_version 34910 (0.0008) +[2023-10-08 17:08:08,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 71729152. Throughput: 0: 1754.0, 1: 1727.3. Samples: 17940790. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:08:08,804][19739] Avg episode reward: [(0, '760.040'), (1, '905.850')] +[2023-10-08 17:08:12,020][21195] Updated weights for policy 0, policy_version 35170 (0.0008) +[2023-10-08 17:08:12,398][21195] Updated weights for policy 0, policy_version 35180 (0.0007) +[2023-10-08 17:08:12,645][21194] Updated weights for policy 1, policy_version 34920 (0.0009) +[2023-10-08 17:08:12,771][21195] Updated weights for policy 0, policy_version 35190 (0.0007) +[2023-10-08 17:08:13,012][21194] Updated weights for policy 1, policy_version 34930 (0.0009) +[2023-10-08 17:08:13,149][21195] Updated weights for policy 0, policy_version 35200 (0.0007) +[2023-10-08 17:08:13,377][21194] Updated weights for policy 1, policy_version 34940 (0.0008) +[2023-10-08 17:08:13,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 71827456. Throughput: 0: 1734.0, 1: 1713.4. Samples: 17960682. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:08:13,803][19739] Avg episode reward: [(0, '760.040'), (1, '905.850')] +[2023-10-08 17:08:17,158][21195] Updated weights for policy 0, policy_version 35210 (0.0007) +[2023-10-08 17:08:17,494][21194] Updated weights for policy 1, policy_version 34950 (0.0008) +[2023-10-08 17:08:17,527][21195] Updated weights for policy 0, policy_version 35220 (0.0008) +[2023-10-08 17:08:17,878][21194] Updated weights for policy 1, policy_version 34960 (0.0009) +[2023-10-08 17:08:17,887][21195] Updated weights for policy 0, policy_version 35230 (0.0009) +[2023-10-08 17:08:18,235][21194] Updated weights for policy 1, policy_version 34970 (0.0009) +[2023-10-08 17:08:18,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 71892992. Throughput: 0: 1716.8, 1: 1729.0. Samples: 17976208. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:08:18,803][19739] Avg episode reward: [(0, '760.040'), (1, '898.980')] +[2023-10-08 17:08:21,774][21195] Updated weights for policy 0, policy_version 35240 (0.0009) +[2023-10-08 17:08:22,139][21195] Updated weights for policy 0, policy_version 35250 (0.0007) +[2023-10-08 17:08:22,356][21194] Updated weights for policy 1, policy_version 34980 (0.0007) +[2023-10-08 17:08:22,511][21195] Updated weights for policy 0, policy_version 35260 (0.0009) +[2023-10-08 17:08:22,723][21194] Updated weights for policy 1, policy_version 34990 (0.0008) +[2023-10-08 17:08:23,092][21194] Updated weights for policy 1, policy_version 35000 (0.0008) +[2023-10-08 17:08:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 71958528. Throughput: 0: 1736.9, 1: 1725.6. Samples: 17992188. Policy #0 lag: (min: 31.0, avg: 33.1, max: 63.0) +[2023-10-08 17:08:23,803][19739] Avg episode reward: [(0, '760.040'), (1, '898.980')] +[2023-10-08 17:08:26,489][21195] Updated weights for policy 0, policy_version 35270 (0.0008) +[2023-10-08 17:08:26,862][21195] Updated weights for policy 0, policy_version 35280 (0.0007) +[2023-10-08 17:08:27,109][21194] Updated weights for policy 1, policy_version 35010 (0.0007) +[2023-10-08 17:08:27,229][21195] Updated weights for policy 0, policy_version 35290 (0.0007) +[2023-10-08 17:08:27,472][21194] Updated weights for policy 1, policy_version 35020 (0.0007) +[2023-10-08 17:08:27,843][21194] Updated weights for policy 1, policy_version 35030 (0.0009) +[2023-10-08 17:08:28,209][21194] Updated weights for policy 1, policy_version 35040 (0.0010) +[2023-10-08 17:08:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 72024064. Throughput: 0: 1712.3, 1: 1693.5. Samples: 18011286. Policy #0 lag: (min: 31.0, avg: 33.1, max: 63.0) +[2023-10-08 17:08:28,803][19739] Avg episode reward: [(0, '753.810'), (1, '890.650')] +[2023-10-08 17:08:31,051][21195] Updated weights for policy 0, policy_version 35300 (0.0008) +[2023-10-08 17:08:31,424][21195] Updated weights for policy 0, policy_version 35310 (0.0007) +[2023-10-08 17:08:31,778][21195] Updated weights for policy 0, policy_version 35320 (0.0009) +[2023-10-08 17:08:32,008][21194] Updated weights for policy 1, policy_version 35050 (0.0010) +[2023-10-08 17:08:32,377][21194] Updated weights for policy 1, policy_version 35060 (0.0011) +[2023-10-08 17:08:32,740][21194] Updated weights for policy 1, policy_version 35070 (0.0008) +[2023-10-08 17:08:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 72089600. Throughput: 0: 1734.3, 1: 1717.6. Samples: 18027978. Policy #0 lag: (min: 31.0, avg: 33.1, max: 63.0) +[2023-10-08 17:08:33,803][19739] Avg episode reward: [(0, '748.300'), (1, '890.650')] +[2023-10-08 17:08:35,596][21195] Updated weights for policy 0, policy_version 35330 (0.0009) +[2023-10-08 17:08:35,972][21195] Updated weights for policy 0, policy_version 35340 (0.0010) +[2023-10-08 17:08:36,338][21195] Updated weights for policy 0, policy_version 35350 (0.0007) +[2023-10-08 17:08:36,611][21194] Updated weights for policy 1, policy_version 35080 (0.0009) +[2023-10-08 17:08:36,707][21195] Updated weights for policy 0, policy_version 35360 (0.0007) +[2023-10-08 17:08:36,978][21194] Updated weights for policy 1, policy_version 35090 (0.0007) +[2023-10-08 17:08:37,341][21194] Updated weights for policy 1, policy_version 35100 (0.0008) +[2023-10-08 17:08:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 72155136. Throughput: 0: 1720.3, 1: 1708.8. Samples: 18042634. Policy #0 lag: (min: 31.0, avg: 33.1, max: 63.0) +[2023-10-08 17:08:38,803][19739] Avg episode reward: [(0, '765.020'), (1, '890.650')] +[2023-10-08 17:08:40,621][21195] Updated weights for policy 0, policy_version 35370 (0.0009) +[2023-10-08 17:08:40,998][21195] Updated weights for policy 0, policy_version 35380 (0.0008) +[2023-10-08 17:08:41,281][21194] Updated weights for policy 1, policy_version 35110 (0.0007) +[2023-10-08 17:08:41,359][21195] Updated weights for policy 0, policy_version 35390 (0.0008) +[2023-10-08 17:08:41,647][21194] Updated weights for policy 1, policy_version 35120 (0.0007) +[2023-10-08 17:08:42,006][21194] Updated weights for policy 1, policy_version 35130 (0.0011) +[2023-10-08 17:08:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 72220672. Throughput: 0: 1720.4, 1: 1700.8. Samples: 18063730. Policy #0 lag: (min: 31.0, avg: 33.1, max: 63.0) +[2023-10-08 17:08:43,804][19739] Avg episode reward: [(0, '765.020'), (1, '890.050')] +[2023-10-08 17:08:45,379][21195] Updated weights for policy 0, policy_version 35400 (0.0008) +[2023-10-08 17:08:45,745][21195] Updated weights for policy 0, policy_version 35410 (0.0009) +[2023-10-08 17:08:46,092][21194] Updated weights for policy 1, policy_version 35140 (0.0008) +[2023-10-08 17:08:46,122][21195] Updated weights for policy 0, policy_version 35420 (0.0009) +[2023-10-08 17:08:46,455][21194] Updated weights for policy 1, policy_version 35150 (0.0008) +[2023-10-08 17:08:46,826][21194] Updated weights for policy 1, policy_version 35160 (0.0008) +[2023-10-08 17:08:48,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 72286208. Throughput: 0: 1746.9, 1: 1730.1. Samples: 18080442. Policy #0 lag: (min: 31.0, avg: 33.1, max: 63.0) +[2023-10-08 17:08:48,803][19739] Avg episode reward: [(0, '765.020'), (1, '890.050')] +[2023-10-08 17:08:49,990][21195] Updated weights for policy 0, policy_version 35430 (0.0009) +[2023-10-08 17:08:50,349][21195] Updated weights for policy 0, policy_version 35440 (0.0008) +[2023-10-08 17:08:50,720][21195] Updated weights for policy 0, policy_version 35450 (0.0009) +[2023-10-08 17:08:50,733][21194] Updated weights for policy 1, policy_version 35170 (0.0008) +[2023-10-08 17:08:51,101][21194] Updated weights for policy 1, policy_version 35180 (0.0008) +[2023-10-08 17:08:51,473][21194] Updated weights for policy 1, policy_version 35190 (0.0009) +[2023-10-08 17:08:51,834][21194] Updated weights for policy 1, policy_version 35200 (0.0008) +[2023-10-08 17:08:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 72351744. Throughput: 0: 1716.8, 1: 1697.8. Samples: 18094446. Policy #0 lag: (min: 4.0, avg: 9.7, max: 36.0) +[2023-10-08 17:08:53,803][19739] Avg episode reward: [(0, '765.020'), (1, '890.050')] +[2023-10-08 17:08:54,752][21195] Updated weights for policy 0, policy_version 35460 (0.0008) +[2023-10-08 17:08:55,132][21195] Updated weights for policy 0, policy_version 35470 (0.0007) +[2023-10-08 17:08:55,508][21195] Updated weights for policy 0, policy_version 35480 (0.0009) +[2023-10-08 17:08:55,810][21194] Updated weights for policy 1, policy_version 35210 (0.0009) +[2023-10-08 17:08:56,179][21194] Updated weights for policy 1, policy_version 35220 (0.0010) +[2023-10-08 17:08:56,543][21194] Updated weights for policy 1, policy_version 35230 (0.0007) +[2023-10-08 17:08:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 72417280. Throughput: 0: 1737.9, 1: 1712.4. Samples: 18115944. Policy #0 lag: (min: 4.0, avg: 9.7, max: 36.0) +[2023-10-08 17:08:58,803][19739] Avg episode reward: [(0, '765.020'), (1, '890.050')] +[2023-10-08 17:08:59,269][21195] Updated weights for policy 0, policy_version 35490 (0.0007) +[2023-10-08 17:08:59,635][21195] Updated weights for policy 0, policy_version 35500 (0.0007) +[2023-10-08 17:09:00,007][21195] Updated weights for policy 0, policy_version 35510 (0.0007) +[2023-10-08 17:09:00,365][21195] Updated weights for policy 0, policy_version 35520 (0.0009) +[2023-10-08 17:09:00,538][21194] Updated weights for policy 1, policy_version 35240 (0.0007) +[2023-10-08 17:09:00,913][21194] Updated weights for policy 1, policy_version 35250 (0.0011) +[2023-10-08 17:09:01,279][21194] Updated weights for policy 1, policy_version 35260 (0.0007) +[2023-10-08 17:09:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 72482816. Throughput: 0: 1749.9, 1: 1709.3. Samples: 18131870. Policy #0 lag: (min: 4.0, avg: 9.7, max: 36.0) +[2023-10-08 17:09:03,804][19739] Avg episode reward: [(0, '766.060'), (1, '890.050')] +[2023-10-08 17:09:04,191][21195] Updated weights for policy 0, policy_version 35530 (0.0010) +[2023-10-08 17:09:04,561][21195] Updated weights for policy 0, policy_version 35540 (0.0010) +[2023-10-08 17:09:04,921][21195] Updated weights for policy 0, policy_version 35550 (0.0008) +[2023-10-08 17:09:05,222][21194] Updated weights for policy 1, policy_version 35270 (0.0008) +[2023-10-08 17:09:05,597][21194] Updated weights for policy 1, policy_version 35280 (0.0009) +[2023-10-08 17:09:05,971][21194] Updated weights for policy 1, policy_version 35290 (0.0010) +[2023-10-08 17:09:08,725][21195] Updated weights for policy 0, policy_version 35560 (0.0009) +[2023-10-08 17:09:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 72548352. Throughput: 0: 1730.8, 1: 1700.5. Samples: 18146596. Policy #0 lag: (min: 4.0, avg: 9.7, max: 36.0) +[2023-10-08 17:09:08,803][19739] Avg episode reward: [(0, '766.060'), (1, '890.050')] +[2023-10-08 17:09:09,097][21195] Updated weights for policy 0, policy_version 35570 (0.0009) +[2023-10-08 17:09:09,478][21195] Updated weights for policy 0, policy_version 35580 (0.0009) +[2023-10-08 17:09:09,937][21194] Updated weights for policy 1, policy_version 35300 (0.0010) +[2023-10-08 17:09:10,301][21194] Updated weights for policy 1, policy_version 35310 (0.0009) +[2023-10-08 17:09:10,659][21194] Updated weights for policy 1, policy_version 35320 (0.0007) +[2023-10-08 17:09:13,329][21195] Updated weights for policy 0, policy_version 35590 (0.0007) +[2023-10-08 17:09:13,696][21195] Updated weights for policy 0, policy_version 35600 (0.0007) +[2023-10-08 17:09:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 72613888. Throughput: 0: 1753.1, 1: 1731.4. Samples: 18168088. Policy #0 lag: (min: 4.0, avg: 9.7, max: 36.0) +[2023-10-08 17:09:13,803][19739] Avg episode reward: [(0, '766.060'), (1, '881.100')] +[2023-10-08 17:09:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000035328_36175872.pth... +[2023-10-08 17:09:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000033728_34537472.pth +[2023-10-08 17:09:14,059][21195] Updated weights for policy 0, policy_version 35610 (0.0010) +[2023-10-08 17:09:14,281][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000035616_36470784.pth... +[2023-10-08 17:09:14,313][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000033984_34799616.pth +[2023-10-08 17:09:14,432][21194] Updated weights for policy 1, policy_version 35330 (0.0008) +[2023-10-08 17:09:14,812][21194] Updated weights for policy 1, policy_version 35340 (0.0007) +[2023-10-08 17:09:15,182][21194] Updated weights for policy 1, policy_version 35350 (0.0008) +[2023-10-08 17:09:15,548][21194] Updated weights for policy 1, policy_version 35360 (0.0008) +[2023-10-08 17:09:18,004][21195] Updated weights for policy 0, policy_version 35620 (0.0008) +[2023-10-08 17:09:18,375][21195] Updated weights for policy 0, policy_version 35630 (0.0009) +[2023-10-08 17:09:18,741][21195] Updated weights for policy 0, policy_version 35640 (0.0009) +[2023-10-08 17:09:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 72679424. Throughput: 0: 1724.1, 1: 1707.6. Samples: 18182406. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:09:18,803][19739] Avg episode reward: [(0, '766.060'), (1, '890.300')] +[2023-10-08 17:09:19,421][21194] Updated weights for policy 1, policy_version 35370 (0.0011) +[2023-10-08 17:09:19,796][21194] Updated weights for policy 1, policy_version 35380 (0.0009) +[2023-10-08 17:09:20,162][21194] Updated weights for policy 1, policy_version 35390 (0.0011) +[2023-10-08 17:09:22,883][21195] Updated weights for policy 0, policy_version 35650 (0.0010) +[2023-10-08 17:09:23,247][21195] Updated weights for policy 0, policy_version 35660 (0.0007) +[2023-10-08 17:09:23,615][21195] Updated weights for policy 0, policy_version 35670 (0.0007) +[2023-10-08 17:09:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 72744960. Throughput: 0: 1743.1, 1: 1725.8. Samples: 18198734. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:09:23,803][19739] Avg episode reward: [(0, '769.840'), (1, '890.300')] +[2023-10-08 17:09:23,985][21195] Updated weights for policy 0, policy_version 35680 (0.0008) +[2023-10-08 17:09:24,141][21194] Updated weights for policy 1, policy_version 35400 (0.0008) +[2023-10-08 17:09:24,510][21194] Updated weights for policy 1, policy_version 35410 (0.0011) +[2023-10-08 17:09:24,862][21194] Updated weights for policy 1, policy_version 35420 (0.0011) +[2023-10-08 17:09:28,008][21195] Updated weights for policy 0, policy_version 35690 (0.0008) +[2023-10-08 17:09:28,369][21195] Updated weights for policy 0, policy_version 35700 (0.0009) +[2023-10-08 17:09:28,746][21195] Updated weights for policy 0, policy_version 35710 (0.0008) +[2023-10-08 17:09:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 72810496. Throughput: 0: 1734.9, 1: 1731.2. Samples: 18219702. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:09:28,803][19739] Avg episode reward: [(0, '769.840'), (1, '890.300')] +[2023-10-08 17:09:28,922][21194] Updated weights for policy 1, policy_version 35430 (0.0009) +[2023-10-08 17:09:29,285][21194] Updated weights for policy 1, policy_version 35440 (0.0007) +[2023-10-08 17:09:29,656][21194] Updated weights for policy 1, policy_version 35450 (0.0007) +[2023-10-08 17:09:32,725][21195] Updated weights for policy 0, policy_version 35720 (0.0011) +[2023-10-08 17:09:33,105][21195] Updated weights for policy 0, policy_version 35730 (0.0011) +[2023-10-08 17:09:33,475][21195] Updated weights for policy 0, policy_version 35740 (0.0009) +[2023-10-08 17:09:33,596][21194] Updated weights for policy 1, policy_version 35460 (0.0009) +[2023-10-08 17:09:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 72908800. Throughput: 0: 1710.7, 1: 1700.3. Samples: 18233938. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:09:33,803][19739] Avg episode reward: [(0, '769.370'), (1, '890.300')] +[2023-10-08 17:09:33,963][21194] Updated weights for policy 1, policy_version 35470 (0.0009) +[2023-10-08 17:09:34,336][21194] Updated weights for policy 1, policy_version 35480 (0.0007) +[2023-10-08 17:09:37,575][21195] Updated weights for policy 0, policy_version 35750 (0.0007) +[2023-10-08 17:09:37,953][21195] Updated weights for policy 0, policy_version 35760 (0.0010) +[2023-10-08 17:09:38,259][21194] Updated weights for policy 1, policy_version 35490 (0.0008) +[2023-10-08 17:09:38,325][21195] Updated weights for policy 0, policy_version 35770 (0.0008) +[2023-10-08 17:09:38,621][21194] Updated weights for policy 1, policy_version 35500 (0.0007) +[2023-10-08 17:09:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 72974336. Throughput: 0: 1741.7, 1: 1732.5. Samples: 18250786. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:09:38,803][19739] Avg episode reward: [(0, '755.490'), (1, '890.370')] +[2023-10-08 17:09:38,990][21194] Updated weights for policy 1, policy_version 35510 (0.0008) +[2023-10-08 17:09:39,368][21194] Updated weights for policy 1, policy_version 35520 (0.0009) +[2023-10-08 17:09:42,283][21195] Updated weights for policy 0, policy_version 35780 (0.0008) +[2023-10-08 17:09:42,667][21195] Updated weights for policy 0, policy_version 35790 (0.0008) +[2023-10-08 17:09:43,037][21195] Updated weights for policy 0, policy_version 35800 (0.0009) +[2023-10-08 17:09:43,251][21194] Updated weights for policy 1, policy_version 35530 (0.0007) +[2023-10-08 17:09:43,610][21194] Updated weights for policy 1, policy_version 35540 (0.0007) +[2023-10-08 17:09:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 73039872. Throughput: 0: 1718.4, 1: 1731.6. Samples: 18271194. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:09:43,803][19739] Avg episode reward: [(0, '759.700'), (1, '890.300')] +[2023-10-08 17:09:43,978][21194] Updated weights for policy 1, policy_version 35550 (0.0010) +[2023-10-08 17:09:46,968][21195] Updated weights for policy 0, policy_version 35810 (0.0008) +[2023-10-08 17:09:47,340][21195] Updated weights for policy 0, policy_version 35820 (0.0009) +[2023-10-08 17:09:47,711][21195] Updated weights for policy 0, policy_version 35830 (0.0008) +[2023-10-08 17:09:47,874][21194] Updated weights for policy 1, policy_version 35560 (0.0008) +[2023-10-08 17:09:48,079][21195] Updated weights for policy 0, policy_version 35840 (0.0007) +[2023-10-08 17:09:48,233][21194] Updated weights for policy 1, policy_version 35570 (0.0007) +[2023-10-08 17:09:48,601][21194] Updated weights for policy 1, policy_version 35580 (0.0010) +[2023-10-08 17:09:48,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 73138176. Throughput: 0: 1697.0, 1: 1727.1. Samples: 18285956. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:09:48,803][19739] Avg episode reward: [(0, '745.580'), (1, '890.300')] +[2023-10-08 17:09:51,799][21195] Updated weights for policy 0, policy_version 35850 (0.0008) +[2023-10-08 17:09:52,167][21195] Updated weights for policy 0, policy_version 35860 (0.0010) +[2023-10-08 17:09:52,541][21195] Updated weights for policy 0, policy_version 35870 (0.0008) +[2023-10-08 17:09:52,724][21194] Updated weights for policy 1, policy_version 35590 (0.0007) +[2023-10-08 17:09:53,084][21194] Updated weights for policy 1, policy_version 35600 (0.0007) +[2023-10-08 17:09:53,449][21194] Updated weights for policy 1, policy_version 35610 (0.0009) +[2023-10-08 17:09:53,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 73203712. Throughput: 0: 1718.9, 1: 1741.4. Samples: 18302310. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:09:53,803][19739] Avg episode reward: [(0, '745.580'), (1, '890.300')] +[2023-10-08 17:09:56,647][21195] Updated weights for policy 0, policy_version 35880 (0.0008) +[2023-10-08 17:09:57,030][21195] Updated weights for policy 0, policy_version 35890 (0.0009) +[2023-10-08 17:09:57,361][21194] Updated weights for policy 1, policy_version 35620 (0.0007) +[2023-10-08 17:09:57,393][21195] Updated weights for policy 0, policy_version 35900 (0.0009) +[2023-10-08 17:09:57,724][21194] Updated weights for policy 1, policy_version 35630 (0.0008) +[2023-10-08 17:09:58,089][21194] Updated weights for policy 1, policy_version 35640 (0.0009) +[2023-10-08 17:09:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 73269248. Throughput: 0: 1691.7, 1: 1722.1. Samples: 18321712. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:09:58,803][19739] Avg episode reward: [(0, '745.580'), (1, '890.300')] +[2023-10-08 17:10:01,209][21195] Updated weights for policy 0, policy_version 35910 (0.0008) +[2023-10-08 17:10:01,582][21195] Updated weights for policy 0, policy_version 35920 (0.0007) +[2023-10-08 17:10:01,948][21195] Updated weights for policy 0, policy_version 35930 (0.0007) +[2023-10-08 17:10:02,129][21194] Updated weights for policy 1, policy_version 35650 (0.0009) +[2023-10-08 17:10:02,488][21194] Updated weights for policy 1, policy_version 35660 (0.0011) +[2023-10-08 17:10:02,849][21194] Updated weights for policy 1, policy_version 35670 (0.0010) +[2023-10-08 17:10:03,207][21194] Updated weights for policy 1, policy_version 35680 (0.0010) +[2023-10-08 17:10:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 73334784. Throughput: 0: 1723.8, 1: 1739.4. Samples: 18338252. Policy #0 lag: (min: 8.0, avg: 33.4, max: 40.0) +[2023-10-08 17:10:03,803][19739] Avg episode reward: [(0, '745.580'), (1, '890.030')] +[2023-10-08 17:10:05,894][21195] Updated weights for policy 0, policy_version 35940 (0.0007) +[2023-10-08 17:10:06,271][21195] Updated weights for policy 0, policy_version 35950 (0.0009) +[2023-10-08 17:10:06,631][21195] Updated weights for policy 0, policy_version 35960 (0.0007) +[2023-10-08 17:10:07,309][21194] Updated weights for policy 1, policy_version 35690 (0.0010) +[2023-10-08 17:10:07,679][21194] Updated weights for policy 1, policy_version 35700 (0.0010) +[2023-10-08 17:10:08,043][21194] Updated weights for policy 1, policy_version 35710 (0.0008) +[2023-10-08 17:10:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 73400320. Throughput: 0: 1710.9, 1: 1729.3. Samples: 18353542. Policy #0 lag: (min: 8.0, avg: 33.4, max: 40.0) +[2023-10-08 17:10:08,803][19739] Avg episode reward: [(0, '745.580'), (1, '890.030')] +[2023-10-08 17:10:10,535][21195] Updated weights for policy 0, policy_version 35970 (0.0009) +[2023-10-08 17:10:10,904][21195] Updated weights for policy 0, policy_version 35980 (0.0011) +[2023-10-08 17:10:11,271][21195] Updated weights for policy 0, policy_version 35990 (0.0009) +[2023-10-08 17:10:11,637][21195] Updated weights for policy 0, policy_version 36000 (0.0007) +[2023-10-08 17:10:12,012][21194] Updated weights for policy 1, policy_version 35720 (0.0008) +[2023-10-08 17:10:12,391][21194] Updated weights for policy 1, policy_version 35730 (0.0010) +[2023-10-08 17:10:12,753][21194] Updated weights for policy 1, policy_version 35740 (0.0009) +[2023-10-08 17:10:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 73465856. Throughput: 0: 1709.6, 1: 1705.1. Samples: 18373360. Policy #0 lag: (min: 8.0, avg: 33.4, max: 40.0) +[2023-10-08 17:10:13,803][19739] Avg episode reward: [(0, '751.300'), (1, '890.030')] +[2023-10-08 17:10:15,600][21195] Updated weights for policy 0, policy_version 36010 (0.0010) +[2023-10-08 17:10:15,973][21195] Updated weights for policy 0, policy_version 36020 (0.0008) +[2023-10-08 17:10:16,334][21195] Updated weights for policy 0, policy_version 36030 (0.0007) +[2023-10-08 17:10:16,599][21194] Updated weights for policy 1, policy_version 35750 (0.0008) +[2023-10-08 17:10:16,961][21194] Updated weights for policy 1, policy_version 35760 (0.0009) +[2023-10-08 17:10:17,331][21194] Updated weights for policy 1, policy_version 35770 (0.0009) +[2023-10-08 17:10:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 73531392. Throughput: 0: 1733.6, 1: 1739.0. Samples: 18390204. Policy #0 lag: (min: 8.0, avg: 33.4, max: 40.0) +[2023-10-08 17:10:18,803][19739] Avg episode reward: [(0, '748.420'), (1, '890.030')] +[2023-10-08 17:10:20,383][21195] Updated weights for policy 0, policy_version 36040 (0.0007) +[2023-10-08 17:10:20,759][21195] Updated weights for policy 0, policy_version 36050 (0.0008) +[2023-10-08 17:10:21,076][21194] Updated weights for policy 1, policy_version 35780 (0.0008) +[2023-10-08 17:10:21,130][21195] Updated weights for policy 0, policy_version 36060 (0.0008) +[2023-10-08 17:10:21,441][21194] Updated weights for policy 1, policy_version 35790 (0.0009) +[2023-10-08 17:10:21,808][21194] Updated weights for policy 1, policy_version 35800 (0.0009) +[2023-10-08 17:10:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 73596928. Throughput: 0: 1705.7, 1: 1714.0. Samples: 18404672. Policy #0 lag: (min: 8.0, avg: 33.4, max: 40.0) +[2023-10-08 17:10:23,803][19739] Avg episode reward: [(0, '748.420'), (1, '882.140')] +[2023-10-08 17:10:24,879][21195] Updated weights for policy 0, policy_version 36070 (0.0008) +[2023-10-08 17:10:25,245][21195] Updated weights for policy 0, policy_version 36080 (0.0009) +[2023-10-08 17:10:25,615][21195] Updated weights for policy 0, policy_version 36090 (0.0009) +[2023-10-08 17:10:25,772][21194] Updated weights for policy 1, policy_version 35810 (0.0010) +[2023-10-08 17:10:26,139][21194] Updated weights for policy 1, policy_version 35820 (0.0007) +[2023-10-08 17:10:26,507][21194] Updated weights for policy 1, policy_version 35830 (0.0009) +[2023-10-08 17:10:26,873][21194] Updated weights for policy 1, policy_version 35840 (0.0009) +[2023-10-08 17:10:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 73662464. Throughput: 0: 1733.8, 1: 1709.4. Samples: 18426136. Policy #0 lag: (min: 17.0, avg: 23.4, max: 49.0) +[2023-10-08 17:10:28,803][19739] Avg episode reward: [(0, '748.420'), (1, '882.140')] +[2023-10-08 17:10:29,500][21195] Updated weights for policy 0, policy_version 36100 (0.0008) +[2023-10-08 17:10:29,887][21195] Updated weights for policy 0, policy_version 36110 (0.0008) +[2023-10-08 17:10:30,254][21195] Updated weights for policy 0, policy_version 36120 (0.0009) +[2023-10-08 17:10:30,672][21194] Updated weights for policy 1, policy_version 35850 (0.0009) +[2023-10-08 17:10:31,033][21194] Updated weights for policy 1, policy_version 35860 (0.0011) +[2023-10-08 17:10:31,403][21194] Updated weights for policy 1, policy_version 35870 (0.0009) +[2023-10-08 17:10:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 73728000. Throughput: 0: 1752.9, 1: 1719.2. Samples: 18442202. Policy #0 lag: (min: 17.0, avg: 23.4, max: 49.0) +[2023-10-08 17:10:33,803][19739] Avg episode reward: [(0, '741.660'), (1, '882.140')] +[2023-10-08 17:10:34,094][21195] Updated weights for policy 0, policy_version 36130 (0.0008) +[2023-10-08 17:10:34,467][21195] Updated weights for policy 0, policy_version 36140 (0.0010) +[2023-10-08 17:10:34,835][21195] Updated weights for policy 0, policy_version 36150 (0.0010) +[2023-10-08 17:10:35,203][21195] Updated weights for policy 0, policy_version 36160 (0.0008) +[2023-10-08 17:10:35,352][21194] Updated weights for policy 1, policy_version 35880 (0.0008) +[2023-10-08 17:10:35,721][21194] Updated weights for policy 1, policy_version 35890 (0.0007) +[2023-10-08 17:10:36,100][21194] Updated weights for policy 1, policy_version 35900 (0.0008) +[2023-10-08 17:10:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 73793536. Throughput: 0: 1733.3, 1: 1701.2. Samples: 18456864. Policy #0 lag: (min: 17.0, avg: 23.4, max: 49.0) +[2023-10-08 17:10:38,803][19739] Avg episode reward: [(0, '741.660'), (1, '882.140')] +[2023-10-08 17:10:38,985][21195] Updated weights for policy 0, policy_version 36170 (0.0007) +[2023-10-08 17:10:39,358][21195] Updated weights for policy 0, policy_version 36180 (0.0007) +[2023-10-08 17:10:39,730][21195] Updated weights for policy 0, policy_version 36190 (0.0007) +[2023-10-08 17:10:40,216][21194] Updated weights for policy 1, policy_version 35910 (0.0010) +[2023-10-08 17:10:40,606][21194] Updated weights for policy 1, policy_version 35920 (0.0008) +[2023-10-08 17:10:40,966][21194] Updated weights for policy 1, policy_version 35930 (0.0008) +[2023-10-08 17:10:43,515][21195] Updated weights for policy 0, policy_version 36200 (0.0008) +[2023-10-08 17:10:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 73859072. Throughput: 0: 1765.1, 1: 1711.4. Samples: 18478152. Policy #0 lag: (min: 17.0, avg: 23.4, max: 49.0) +[2023-10-08 17:10:43,803][19739] Avg episode reward: [(0, '741.660'), (1, '894.060')] +[2023-10-08 17:10:43,890][21195] Updated weights for policy 0, policy_version 36210 (0.0008) +[2023-10-08 17:10:44,250][21195] Updated weights for policy 0, policy_version 36220 (0.0009) +[2023-10-08 17:10:45,023][21194] Updated weights for policy 1, policy_version 35940 (0.0008) +[2023-10-08 17:10:45,393][21194] Updated weights for policy 1, policy_version 35950 (0.0008) +[2023-10-08 17:10:45,756][21194] Updated weights for policy 1, policy_version 35960 (0.0009) +[2023-10-08 17:10:48,145][21195] Updated weights for policy 0, policy_version 36230 (0.0008) +[2023-10-08 17:10:48,514][21195] Updated weights for policy 0, policy_version 36240 (0.0010) +[2023-10-08 17:10:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 73924608. Throughput: 0: 1736.8, 1: 1695.8. Samples: 18492722. Policy #0 lag: (min: 17.0, avg: 23.4, max: 49.0) +[2023-10-08 17:10:48,803][19739] Avg episode reward: [(0, '741.660'), (1, '894.290')] +[2023-10-08 17:10:48,885][21195] Updated weights for policy 0, policy_version 36250 (0.0011) +[2023-10-08 17:10:49,791][21194] Updated weights for policy 1, policy_version 35970 (0.0009) +[2023-10-08 17:10:50,160][21194] Updated weights for policy 1, policy_version 35980 (0.0008) +[2023-10-08 17:10:50,534][21194] Updated weights for policy 1, policy_version 35990 (0.0008) +[2023-10-08 17:10:50,897][21194] Updated weights for policy 1, policy_version 36000 (0.0010) +[2023-10-08 17:10:52,739][21195] Updated weights for policy 0, policy_version 36260 (0.0011) +[2023-10-08 17:10:53,105][21195] Updated weights for policy 0, policy_version 36270 (0.0007) +[2023-10-08 17:10:53,473][21195] Updated weights for policy 0, policy_version 36280 (0.0007) +[2023-10-08 17:10:53,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 74022912. Throughput: 0: 1753.7, 1: 1696.4. Samples: 18508794. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:10:53,803][19739] Avg episode reward: [(0, '741.660'), (1, '891.580')] +[2023-10-08 17:10:54,953][21194] Updated weights for policy 1, policy_version 36010 (0.0010) +[2023-10-08 17:10:55,316][21194] Updated weights for policy 1, policy_version 36020 (0.0010) +[2023-10-08 17:10:55,681][21194] Updated weights for policy 1, policy_version 36030 (0.0008) +[2023-10-08 17:10:57,532][21195] Updated weights for policy 0, policy_version 36290 (0.0008) +[2023-10-08 17:10:57,900][21195] Updated weights for policy 0, policy_version 36300 (0.0009) +[2023-10-08 17:10:58,275][21195] Updated weights for policy 0, policy_version 36310 (0.0010) +[2023-10-08 17:10:58,649][21195] Updated weights for policy 0, policy_version 36320 (0.0009) +[2023-10-08 17:10:58,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 74088448. Throughput: 0: 1753.1, 1: 1723.3. Samples: 18529796. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:10:58,804][19739] Avg episode reward: [(0, '741.660'), (1, '892.160')] +[2023-10-08 17:10:59,680][21194] Updated weights for policy 1, policy_version 36040 (0.0007) +[2023-10-08 17:11:00,042][21194] Updated weights for policy 1, policy_version 36050 (0.0008) +[2023-10-08 17:11:00,406][21194] Updated weights for policy 1, policy_version 36060 (0.0007) +[2023-10-08 17:11:02,684][21195] Updated weights for policy 0, policy_version 36330 (0.0008) +[2023-10-08 17:11:03,061][21195] Updated weights for policy 0, policy_version 36340 (0.0008) +[2023-10-08 17:11:03,416][21195] Updated weights for policy 0, policy_version 36350 (0.0007) +[2023-10-08 17:11:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 74153984. Throughput: 0: 1731.4, 1: 1687.8. Samples: 18544068. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:11:03,803][19739] Avg episode reward: [(0, '755.980'), (1, '876.960')] +[2023-10-08 17:11:04,342][21194] Updated weights for policy 1, policy_version 36070 (0.0008) +[2023-10-08 17:11:04,714][21194] Updated weights for policy 1, policy_version 36080 (0.0007) +[2023-10-08 17:11:05,088][21194] Updated weights for policy 1, policy_version 36090 (0.0007) +[2023-10-08 17:11:07,147][21195] Updated weights for policy 0, policy_version 36360 (0.0008) +[2023-10-08 17:11:07,513][21195] Updated weights for policy 0, policy_version 36370 (0.0007) +[2023-10-08 17:11:07,888][21195] Updated weights for policy 0, policy_version 36380 (0.0007) +[2023-10-08 17:11:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 74219520. Throughput: 0: 1757.8, 1: 1710.4. Samples: 18560742. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:11:08,803][19739] Avg episode reward: [(0, '755.980'), (1, '876.960')] +[2023-10-08 17:11:08,923][21194] Updated weights for policy 1, policy_version 36100 (0.0010) +[2023-10-08 17:11:09,291][21194] Updated weights for policy 1, policy_version 36110 (0.0008) +[2023-10-08 17:11:09,656][21194] Updated weights for policy 1, policy_version 36120 (0.0009) +[2023-10-08 17:11:11,866][21195] Updated weights for policy 0, policy_version 36390 (0.0007) +[2023-10-08 17:11:12,235][21195] Updated weights for policy 0, policy_version 36400 (0.0008) +[2023-10-08 17:11:12,600][21195] Updated weights for policy 0, policy_version 36410 (0.0007) +[2023-10-08 17:11:13,531][21194] Updated weights for policy 1, policy_version 36130 (0.0008) +[2023-10-08 17:11:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 74285056. Throughput: 0: 1724.5, 1: 1722.6. Samples: 18581254. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:11:13,803][19739] Avg episode reward: [(0, '769.900'), (1, '839.210')] +[2023-10-08 17:11:13,810][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000036416_37289984.pth... +[2023-10-08 17:11:13,839][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000034784_35618816.pth +[2023-10-08 17:11:13,900][21194] Updated weights for policy 1, policy_version 36140 (0.0009) +[2023-10-08 17:11:14,266][21194] Updated weights for policy 1, policy_version 36150 (0.0008) +[2023-10-08 17:11:14,627][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000036160_37027840.pth... +[2023-10-08 17:11:14,627][21194] Updated weights for policy 1, policy_version 36160 (0.0007) +[2023-10-08 17:11:14,666][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000034528_35356672.pth +[2023-10-08 17:11:16,546][21195] Updated weights for policy 0, policy_version 36420 (0.0010) +[2023-10-08 17:11:16,912][21195] Updated weights for policy 0, policy_version 36430 (0.0007) +[2023-10-08 17:11:17,281][21195] Updated weights for policy 0, policy_version 36440 (0.0008) +[2023-10-08 17:11:18,431][21194] Updated weights for policy 1, policy_version 36170 (0.0009) +[2023-10-08 17:11:18,789][21194] Updated weights for policy 1, policy_version 36180 (0.0007) +[2023-10-08 17:11:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 74350592. Throughput: 0: 1723.2, 1: 1706.4. Samples: 18596534. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:11:18,803][19739] Avg episode reward: [(0, '769.900'), (1, '839.210')] +[2023-10-08 17:11:19,158][21194] Updated weights for policy 1, policy_version 36190 (0.0010) +[2023-10-08 17:11:21,364][21195] Updated weights for policy 0, policy_version 36450 (0.0009) +[2023-10-08 17:11:21,733][21195] Updated weights for policy 0, policy_version 36460 (0.0008) +[2023-10-08 17:11:22,094][21195] Updated weights for policy 0, policy_version 36470 (0.0008) +[2023-10-08 17:11:22,463][21195] Updated weights for policy 0, policy_version 36480 (0.0009) +[2023-10-08 17:11:23,232][21194] Updated weights for policy 1, policy_version 36200 (0.0008) +[2023-10-08 17:11:23,605][21194] Updated weights for policy 1, policy_version 36210 (0.0010) +[2023-10-08 17:11:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 74416128. Throughput: 0: 1737.1, 1: 1727.0. Samples: 18612746. Policy #0 lag: (min: 8.0, avg: 32.8, max: 40.0) +[2023-10-08 17:11:23,803][19739] Avg episode reward: [(0, '775.670'), (1, '798.670')] +[2023-10-08 17:11:23,965][21194] Updated weights for policy 1, policy_version 36220 (0.0007) +[2023-10-08 17:11:26,441][21195] Updated weights for policy 0, policy_version 36490 (0.0010) +[2023-10-08 17:11:26,807][21195] Updated weights for policy 0, policy_version 36500 (0.0008) +[2023-10-08 17:11:27,177][21195] Updated weights for policy 0, policy_version 36510 (0.0007) +[2023-10-08 17:11:28,044][21194] Updated weights for policy 1, policy_version 36230 (0.0009) +[2023-10-08 17:11:28,418][21194] Updated weights for policy 1, policy_version 36240 (0.0009) +[2023-10-08 17:11:28,788][21194] Updated weights for policy 1, policy_version 36250 (0.0010) +[2023-10-08 17:11:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 74481664. Throughput: 0: 1713.8, 1: 1729.3. Samples: 18633094. Policy #0 lag: (min: 8.0, avg: 32.8, max: 40.0) +[2023-10-08 17:11:28,803][19739] Avg episode reward: [(0, '775.670'), (1, '795.390')] +[2023-10-08 17:11:31,096][21195] Updated weights for policy 0, policy_version 36520 (0.0009) +[2023-10-08 17:11:31,459][21195] Updated weights for policy 0, policy_version 36530 (0.0007) +[2023-10-08 17:11:31,838][21195] Updated weights for policy 0, policy_version 36540 (0.0009) +[2023-10-08 17:11:32,783][21194] Updated weights for policy 1, policy_version 36260 (0.0009) +[2023-10-08 17:11:33,144][21194] Updated weights for policy 1, policy_version 36270 (0.0008) +[2023-10-08 17:11:33,513][21194] Updated weights for policy 1, policy_version 36280 (0.0010) +[2023-10-08 17:11:33,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 74579968. Throughput: 0: 1737.9, 1: 1729.2. Samples: 18648738. Policy #0 lag: (min: 8.0, avg: 32.8, max: 40.0) +[2023-10-08 17:11:33,803][19739] Avg episode reward: [(0, '770.620'), (1, '795.390')] +[2023-10-08 17:11:35,799][21195] Updated weights for policy 0, policy_version 36550 (0.0008) +[2023-10-08 17:11:36,169][21195] Updated weights for policy 0, policy_version 36560 (0.0008) +[2023-10-08 17:11:36,543][21195] Updated weights for policy 0, policy_version 36570 (0.0010) +[2023-10-08 17:11:37,536][21194] Updated weights for policy 1, policy_version 36290 (0.0010) +[2023-10-08 17:11:37,903][21194] Updated weights for policy 1, policy_version 36300 (0.0008) +[2023-10-08 17:11:38,269][21194] Updated weights for policy 1, policy_version 36310 (0.0010) +[2023-10-08 17:11:38,638][21194] Updated weights for policy 1, policy_version 36320 (0.0009) +[2023-10-08 17:11:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 74645504. Throughput: 0: 1712.2, 1: 1736.4. Samples: 18663978. Policy #0 lag: (min: 8.0, avg: 32.8, max: 40.0) +[2023-10-08 17:11:38,803][19739] Avg episode reward: [(0, '770.740'), (1, '795.390')] +[2023-10-08 17:11:40,424][21195] Updated weights for policy 0, policy_version 36580 (0.0007) +[2023-10-08 17:11:40,793][21195] Updated weights for policy 0, policy_version 36590 (0.0007) +[2023-10-08 17:11:41,168][21195] Updated weights for policy 0, policy_version 36600 (0.0008) +[2023-10-08 17:11:42,671][21194] Updated weights for policy 1, policy_version 36330 (0.0008) +[2023-10-08 17:11:43,029][21194] Updated weights for policy 1, policy_version 36340 (0.0008) +[2023-10-08 17:11:43,392][21194] Updated weights for policy 1, policy_version 36350 (0.0009) +[2023-10-08 17:11:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 74711040. Throughput: 0: 1721.9, 1: 1720.3. Samples: 18684696. Policy #0 lag: (min: 8.0, avg: 32.8, max: 40.0) +[2023-10-08 17:11:43,803][19739] Avg episode reward: [(0, '770.740'), (1, '794.780')] +[2023-10-08 17:11:45,049][21195] Updated weights for policy 0, policy_version 36610 (0.0008) +[2023-10-08 17:11:45,412][21195] Updated weights for policy 0, policy_version 36620 (0.0009) +[2023-10-08 17:11:45,781][21195] Updated weights for policy 0, policy_version 36630 (0.0007) +[2023-10-08 17:11:46,147][21195] Updated weights for policy 0, policy_version 36640 (0.0009) +[2023-10-08 17:11:47,217][21194] Updated weights for policy 1, policy_version 36360 (0.0008) +[2023-10-08 17:11:47,582][21194] Updated weights for policy 1, policy_version 36370 (0.0007) +[2023-10-08 17:11:47,955][21194] Updated weights for policy 1, policy_version 36380 (0.0008) +[2023-10-08 17:11:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 74776576. Throughput: 0: 1750.8, 1: 1744.3. Samples: 18701346. Policy #0 lag: (min: 2.0, avg: 2.0, max: 3.0) +[2023-10-08 17:11:48,803][19739] Avg episode reward: [(0, '770.740'), (1, '794.780')] +[2023-10-08 17:11:49,895][21195] Updated weights for policy 0, policy_version 36650 (0.0007) +[2023-10-08 17:11:50,261][21195] Updated weights for policy 0, policy_version 36660 (0.0008) +[2023-10-08 17:11:50,626][21195] Updated weights for policy 0, policy_version 36670 (0.0011) +[2023-10-08 17:11:51,975][21194] Updated weights for policy 1, policy_version 36390 (0.0007) +[2023-10-08 17:11:52,343][21194] Updated weights for policy 1, policy_version 36400 (0.0008) +[2023-10-08 17:11:52,701][21194] Updated weights for policy 1, policy_version 36410 (0.0008) +[2023-10-08 17:11:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 74842112. Throughput: 0: 1719.9, 1: 1737.8. Samples: 18716338. Policy #0 lag: (min: 2.0, avg: 2.0, max: 3.0) +[2023-10-08 17:11:53,804][19739] Avg episode reward: [(0, '770.740'), (1, '794.780')] +[2023-10-08 17:11:54,556][21195] Updated weights for policy 0, policy_version 36680 (0.0008) +[2023-10-08 17:11:54,927][21195] Updated weights for policy 0, policy_version 36690 (0.0007) +[2023-10-08 17:11:55,292][21195] Updated weights for policy 0, policy_version 36700 (0.0007) +[2023-10-08 17:11:56,512][21194] Updated weights for policy 1, policy_version 36420 (0.0009) +[2023-10-08 17:11:56,877][21194] Updated weights for policy 1, policy_version 36430 (0.0007) +[2023-10-08 17:11:57,249][21194] Updated weights for policy 1, policy_version 36440 (0.0009) +[2023-10-08 17:11:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 74907648. Throughput: 0: 1750.7, 1: 1708.9. Samples: 18736936. Policy #0 lag: (min: 2.0, avg: 2.0, max: 3.0) +[2023-10-08 17:11:58,803][19739] Avg episode reward: [(0, '770.120'), (1, '794.780')] +[2023-10-08 17:11:59,167][21195] Updated weights for policy 0, policy_version 36710 (0.0009) +[2023-10-08 17:11:59,535][21195] Updated weights for policy 0, policy_version 36720 (0.0008) +[2023-10-08 17:11:59,912][21195] Updated weights for policy 0, policy_version 36730 (0.0008) +[2023-10-08 17:12:01,126][21194] Updated weights for policy 1, policy_version 36450 (0.0009) +[2023-10-08 17:12:01,492][21194] Updated weights for policy 1, policy_version 36460 (0.0007) +[2023-10-08 17:12:01,858][21194] Updated weights for policy 1, policy_version 36470 (0.0009) +[2023-10-08 17:12:02,227][21194] Updated weights for policy 1, policy_version 36480 (0.0010) +[2023-10-08 17:12:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 74973184. Throughput: 0: 1744.6, 1: 1739.3. Samples: 18753308. Policy #0 lag: (min: 2.0, avg: 2.0, max: 3.0) +[2023-10-08 17:12:03,804][19739] Avg episode reward: [(0, '770.120'), (1, '803.020')] +[2023-10-08 17:12:03,932][21195] Updated weights for policy 0, policy_version 36740 (0.0009) +[2023-10-08 17:12:04,310][21195] Updated weights for policy 0, policy_version 36750 (0.0010) +[2023-10-08 17:12:04,674][21195] Updated weights for policy 0, policy_version 36760 (0.0011) +[2023-10-08 17:12:05,989][21194] Updated weights for policy 1, policy_version 36490 (0.0011) +[2023-10-08 17:12:06,355][21194] Updated weights for policy 1, policy_version 36500 (0.0009) +[2023-10-08 17:12:06,727][21194] Updated weights for policy 1, policy_version 36510 (0.0007) +[2023-10-08 17:12:08,597][21195] Updated weights for policy 0, policy_version 36770 (0.0009) +[2023-10-08 17:12:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 75038720. Throughput: 0: 1728.2, 1: 1708.6. Samples: 18767402. Policy #0 lag: (min: 2.0, avg: 2.0, max: 3.0) +[2023-10-08 17:12:08,803][19739] Avg episode reward: [(0, '770.120'), (1, '802.850')] +[2023-10-08 17:12:08,969][21195] Updated weights for policy 0, policy_version 36780 (0.0008) +[2023-10-08 17:12:09,335][21195] Updated weights for policy 0, policy_version 36790 (0.0008) +[2023-10-08 17:12:09,701][21195] Updated weights for policy 0, policy_version 36800 (0.0007) +[2023-10-08 17:12:10,694][21194] Updated weights for policy 1, policy_version 36520 (0.0008) +[2023-10-08 17:12:11,058][21194] Updated weights for policy 1, policy_version 36530 (0.0008) +[2023-10-08 17:12:11,437][21194] Updated weights for policy 1, policy_version 36540 (0.0009) +[2023-10-08 17:12:13,531][21195] Updated weights for policy 0, policy_version 36810 (0.0007) +[2023-10-08 17:12:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 75104256. Throughput: 0: 1752.0, 1: 1715.0. Samples: 18789110. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:12:13,803][19739] Avg episode reward: [(0, '770.120'), (1, '791.840')] +[2023-10-08 17:12:13,909][21195] Updated weights for policy 0, policy_version 36820 (0.0009) +[2023-10-08 17:12:14,271][21195] Updated weights for policy 0, policy_version 36830 (0.0008) +[2023-10-08 17:12:15,731][21194] Updated weights for policy 1, policy_version 36550 (0.0009) +[2023-10-08 17:12:16,116][21194] Updated weights for policy 1, policy_version 36560 (0.0010) +[2023-10-08 17:12:16,475][21194] Updated weights for policy 1, policy_version 36570 (0.0010) +[2023-10-08 17:12:18,148][21195] Updated weights for policy 0, policy_version 36840 (0.0008) +[2023-10-08 17:12:18,512][21195] Updated weights for policy 0, policy_version 36850 (0.0008) +[2023-10-08 17:12:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 75169792. Throughput: 0: 1725.6, 1: 1725.3. Samples: 18804028. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:12:18,803][19739] Avg episode reward: [(0, '779.480'), (1, '791.840')] +[2023-10-08 17:12:18,891][21195] Updated weights for policy 0, policy_version 36860 (0.0009) +[2023-10-08 17:12:20,382][21194] Updated weights for policy 1, policy_version 36580 (0.0010) +[2023-10-08 17:12:20,752][21194] Updated weights for policy 1, policy_version 36590 (0.0009) +[2023-10-08 17:12:21,118][21194] Updated weights for policy 1, policy_version 36600 (0.0008) +[2023-10-08 17:12:22,764][21195] Updated weights for policy 0, policy_version 36870 (0.0008) +[2023-10-08 17:12:23,141][21195] Updated weights for policy 0, policy_version 36880 (0.0007) +[2023-10-08 17:12:23,508][21195] Updated weights for policy 0, policy_version 36890 (0.0007) +[2023-10-08 17:12:23,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 75268096. Throughput: 0: 1754.2, 1: 1708.3. Samples: 18819790. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:12:23,803][19739] Avg episode reward: [(0, '779.550'), (1, '791.840')] +[2023-10-08 17:12:25,082][21194] Updated weights for policy 1, policy_version 36610 (0.0010) +[2023-10-08 17:12:25,455][21194] Updated weights for policy 1, policy_version 36620 (0.0010) +[2023-10-08 17:12:25,828][21194] Updated weights for policy 1, policy_version 36630 (0.0008) +[2023-10-08 17:12:26,189][21194] Updated weights for policy 1, policy_version 36640 (0.0007) +[2023-10-08 17:12:27,506][21195] Updated weights for policy 0, policy_version 36900 (0.0008) +[2023-10-08 17:12:27,875][21195] Updated weights for policy 0, policy_version 36910 (0.0008) +[2023-10-08 17:12:28,252][21195] Updated weights for policy 0, policy_version 36920 (0.0007) +[2023-10-08 17:12:28,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 75333632. Throughput: 0: 1743.6, 1: 1725.9. Samples: 18840822. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:12:28,803][19739] Avg episode reward: [(0, '751.170'), (1, '791.840')] +[2023-10-08 17:12:30,289][21194] Updated weights for policy 1, policy_version 36650 (0.0011) +[2023-10-08 17:12:30,655][21194] Updated weights for policy 1, policy_version 36660 (0.0009) +[2023-10-08 17:12:31,015][21194] Updated weights for policy 1, policy_version 36670 (0.0009) +[2023-10-08 17:12:31,899][21195] Updated weights for policy 0, policy_version 36930 (0.0008) +[2023-10-08 17:12:32,271][21195] Updated weights for policy 0, policy_version 36940 (0.0009) +[2023-10-08 17:12:32,633][21195] Updated weights for policy 0, policy_version 36950 (0.0009) +[2023-10-08 17:12:33,008][21195] Updated weights for policy 0, policy_version 36960 (0.0009) +[2023-10-08 17:12:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 75399168. Throughput: 0: 1726.4, 1: 1702.4. Samples: 18855644. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:12:33,803][19739] Avg episode reward: [(0, '738.830'), (1, '778.250')] +[2023-10-08 17:12:34,919][21194] Updated weights for policy 1, policy_version 36680 (0.0009) +[2023-10-08 17:12:35,277][21194] Updated weights for policy 1, policy_version 36690 (0.0009) +[2023-10-08 17:12:35,640][21194] Updated weights for policy 1, policy_version 36700 (0.0008) +[2023-10-08 17:12:36,942][21195] Updated weights for policy 0, policy_version 36970 (0.0009) +[2023-10-08 17:12:37,306][21195] Updated weights for policy 0, policy_version 36980 (0.0009) +[2023-10-08 17:12:37,678][21195] Updated weights for policy 0, policy_version 36990 (0.0008) +[2023-10-08 17:12:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 75464704. Throughput: 0: 1754.8, 1: 1711.2. Samples: 18872308. Policy #0 lag: (min: 7.0, avg: 14.9, max: 39.0) +[2023-10-08 17:12:38,803][19739] Avg episode reward: [(0, '753.350'), (1, '778.250')] +[2023-10-08 17:12:39,465][21194] Updated weights for policy 1, policy_version 36710 (0.0008) +[2023-10-08 17:12:39,822][21194] Updated weights for policy 1, policy_version 36720 (0.0007) +[2023-10-08 17:12:40,192][21194] Updated weights for policy 1, policy_version 36730 (0.0010) +[2023-10-08 17:12:41,652][21195] Updated weights for policy 0, policy_version 37000 (0.0007) +[2023-10-08 17:12:42,026][21195] Updated weights for policy 0, policy_version 37010 (0.0007) +[2023-10-08 17:12:42,395][21195] Updated weights for policy 0, policy_version 37020 (0.0007) +[2023-10-08 17:12:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 75530240. Throughput: 0: 1729.9, 1: 1729.2. Samples: 18892598. Policy #0 lag: (min: 7.0, avg: 14.9, max: 39.0) +[2023-10-08 17:12:43,803][19739] Avg episode reward: [(0, '767.190'), (1, '778.250')] +[2023-10-08 17:12:44,252][21194] Updated weights for policy 1, policy_version 36740 (0.0009) +[2023-10-08 17:12:44,621][21194] Updated weights for policy 1, policy_version 36750 (0.0007) +[2023-10-08 17:12:44,984][21194] Updated weights for policy 1, policy_version 36760 (0.0007) +[2023-10-08 17:12:46,116][21195] Updated weights for policy 0, policy_version 37030 (0.0008) +[2023-10-08 17:12:46,491][21195] Updated weights for policy 0, policy_version 37040 (0.0009) +[2023-10-08 17:12:46,863][21195] Updated weights for policy 0, policy_version 37050 (0.0009) +[2023-10-08 17:12:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 75595776. Throughput: 0: 1741.5, 1: 1696.0. Samples: 18907992. Policy #0 lag: (min: 7.0, avg: 14.9, max: 39.0) +[2023-10-08 17:12:48,803][19739] Avg episode reward: [(0, '753.030'), (1, '778.250')] +[2023-10-08 17:12:49,033][21194] Updated weights for policy 1, policy_version 36770 (0.0009) +[2023-10-08 17:12:49,400][21194] Updated weights for policy 1, policy_version 36780 (0.0007) +[2023-10-08 17:12:49,760][21194] Updated weights for policy 1, policy_version 36790 (0.0009) +[2023-10-08 17:12:50,117][21194] Updated weights for policy 1, policy_version 36800 (0.0008) +[2023-10-08 17:12:50,798][21195] Updated weights for policy 0, policy_version 37060 (0.0008) +[2023-10-08 17:12:51,162][21195] Updated weights for policy 0, policy_version 37070 (0.0008) +[2023-10-08 17:12:51,542][21195] Updated weights for policy 0, policy_version 37080 (0.0009) +[2023-10-08 17:12:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 75661312. Throughput: 0: 1743.7, 1: 1722.0. Samples: 18923356. Policy #0 lag: (min: 7.0, avg: 14.9, max: 39.0) +[2023-10-08 17:12:53,803][19739] Avg episode reward: [(0, '753.030'), (1, '784.400')] +[2023-10-08 17:12:53,871][21194] Updated weights for policy 1, policy_version 36810 (0.0008) +[2023-10-08 17:12:54,238][21194] Updated weights for policy 1, policy_version 36820 (0.0009) +[2023-10-08 17:12:54,611][21194] Updated weights for policy 1, policy_version 36830 (0.0007) +[2023-10-08 17:12:55,274][21195] Updated weights for policy 0, policy_version 37090 (0.0009) +[2023-10-08 17:12:55,657][21195] Updated weights for policy 0, policy_version 37100 (0.0007) +[2023-10-08 17:12:56,021][21195] Updated weights for policy 0, policy_version 37110 (0.0010) +[2023-10-08 17:12:56,390][21195] Updated weights for policy 0, policy_version 37120 (0.0009) +[2023-10-08 17:12:58,634][21194] Updated weights for policy 1, policy_version 36840 (0.0008) +[2023-10-08 17:12:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 75726848. Throughput: 0: 1742.8, 1: 1725.2. Samples: 18945166. Policy #0 lag: (min: 7.0, avg: 14.9, max: 39.0) +[2023-10-08 17:12:58,803][19739] Avg episode reward: [(0, '737.450'), (1, '784.400')] +[2023-10-08 17:12:58,998][21194] Updated weights for policy 1, policy_version 36850 (0.0008) +[2023-10-08 17:12:59,374][21194] Updated weights for policy 1, policy_version 36860 (0.0007) +[2023-10-08 17:13:00,341][21195] Updated weights for policy 0, policy_version 37130 (0.0007) +[2023-10-08 17:13:00,706][21195] Updated weights for policy 0, policy_version 37140 (0.0008) +[2023-10-08 17:13:01,072][21195] Updated weights for policy 0, policy_version 37150 (0.0010) +[2023-10-08 17:13:03,370][21194] Updated weights for policy 1, policy_version 36870 (0.0008) +[2023-10-08 17:13:03,754][21194] Updated weights for policy 1, policy_version 36880 (0.0011) +[2023-10-08 17:13:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 75792384. Throughput: 0: 1764.5, 1: 1712.6. Samples: 18960496. Policy #0 lag: (min: 7.0, avg: 14.9, max: 39.0) +[2023-10-08 17:13:03,804][19739] Avg episode reward: [(0, '737.450'), (1, '784.400')] +[2023-10-08 17:13:04,125][21194] Updated weights for policy 1, policy_version 36890 (0.0010) +[2023-10-08 17:13:05,012][21195] Updated weights for policy 0, policy_version 37160 (0.0009) +[2023-10-08 17:13:05,385][21195] Updated weights for policy 0, policy_version 37170 (0.0010) +[2023-10-08 17:13:05,756][21195] Updated weights for policy 0, policy_version 37180 (0.0011) +[2023-10-08 17:13:08,175][21194] Updated weights for policy 1, policy_version 36900 (0.0008) +[2023-10-08 17:13:08,541][21194] Updated weights for policy 1, policy_version 36910 (0.0008) +[2023-10-08 17:13:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 75857920. Throughput: 0: 1737.8, 1: 1722.1. Samples: 18975486. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:13:08,803][19739] Avg episode reward: [(0, '711.870'), (1, '784.400')] +[2023-10-08 17:13:08,898][21194] Updated weights for policy 1, policy_version 36920 (0.0007) +[2023-10-08 17:13:09,612][21195] Updated weights for policy 0, policy_version 37190 (0.0010) +[2023-10-08 17:13:09,981][21195] Updated weights for policy 0, policy_version 37200 (0.0007) +[2023-10-08 17:13:10,352][21195] Updated weights for policy 0, policy_version 37210 (0.0007) +[2023-10-08 17:13:12,811][21194] Updated weights for policy 1, policy_version 36930 (0.0007) +[2023-10-08 17:13:13,178][21194] Updated weights for policy 1, policy_version 36940 (0.0007) +[2023-10-08 17:13:13,548][21194] Updated weights for policy 1, policy_version 36950 (0.0009) +[2023-10-08 17:13:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 75923456. Throughput: 0: 1746.9, 1: 1715.3. Samples: 18996624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:13:13,804][19739] Avg episode reward: [(0, '711.870'), (1, '784.400')] +[2023-10-08 17:13:13,815][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000037216_38109184.pth... +[2023-10-08 17:13:13,846][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000035616_36470784.pth +[2023-10-08 17:13:13,907][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000036960_37847040.pth... +[2023-10-08 17:13:13,910][21194] Updated weights for policy 1, policy_version 36960 (0.0007) +[2023-10-08 17:13:13,937][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000035328_36175872.pth +[2023-10-08 17:13:14,224][21195] Updated weights for policy 0, policy_version 37220 (0.0007) +[2023-10-08 17:13:14,597][21195] Updated weights for policy 0, policy_version 37230 (0.0010) +[2023-10-08 17:13:14,971][21195] Updated weights for policy 0, policy_version 37240 (0.0009) +[2023-10-08 17:13:17,775][21194] Updated weights for policy 1, policy_version 36970 (0.0008) +[2023-10-08 17:13:18,140][21194] Updated weights for policy 1, policy_version 36980 (0.0007) +[2023-10-08 17:13:18,504][21194] Updated weights for policy 1, policy_version 36990 (0.0007) +[2023-10-08 17:13:18,770][21195] Updated weights for policy 0, policy_version 37250 (0.0008) +[2023-10-08 17:13:18,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 76021760. Throughput: 0: 1760.8, 1: 1726.8. Samples: 19012582. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:13:18,803][19739] Avg episode reward: [(0, '711.870'), (1, '790.360')] +[2023-10-08 17:13:19,142][21195] Updated weights for policy 0, policy_version 37260 (0.0009) +[2023-10-08 17:13:19,514][21195] Updated weights for policy 0, policy_version 37270 (0.0010) +[2023-10-08 17:13:19,876][21195] Updated weights for policy 0, policy_version 37280 (0.0010) +[2023-10-08 17:13:22,684][21194] Updated weights for policy 1, policy_version 37000 (0.0009) +[2023-10-08 17:13:23,048][21194] Updated weights for policy 1, policy_version 37010 (0.0008) +[2023-10-08 17:13:23,417][21194] Updated weights for policy 1, policy_version 37020 (0.0007) +[2023-10-08 17:13:23,770][21195] Updated weights for policy 0, policy_version 37290 (0.0009) +[2023-10-08 17:13:23,802][19739] Fps is (10 sec: 16384.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 76087296. Throughput: 0: 1736.3, 1: 1727.2. Samples: 19028164. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:13:23,803][19739] Avg episode reward: [(0, '711.870'), (1, '785.100')] +[2023-10-08 17:13:24,138][21195] Updated weights for policy 0, policy_version 37300 (0.0010) +[2023-10-08 17:13:24,513][21195] Updated weights for policy 0, policy_version 37310 (0.0008) +[2023-10-08 17:13:27,361][21194] Updated weights for policy 1, policy_version 37030 (0.0009) +[2023-10-08 17:13:27,733][21194] Updated weights for policy 1, policy_version 37040 (0.0009) +[2023-10-08 17:13:28,099][21194] Updated weights for policy 1, policy_version 37050 (0.0009) +[2023-10-08 17:13:28,463][21195] Updated weights for policy 0, policy_version 37320 (0.0007) +[2023-10-08 17:13:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 76152832. Throughput: 0: 1757.2, 1: 1706.5. Samples: 19048466. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:13:28,803][19739] Avg episode reward: [(0, '711.870'), (1, '768.100')] +[2023-10-08 17:13:28,828][21195] Updated weights for policy 0, policy_version 37330 (0.0009) +[2023-10-08 17:13:29,204][21195] Updated weights for policy 0, policy_version 37340 (0.0011) +[2023-10-08 17:13:31,963][21194] Updated weights for policy 1, policy_version 37060 (0.0007) +[2023-10-08 17:13:32,331][21194] Updated weights for policy 1, policy_version 37070 (0.0008) +[2023-10-08 17:13:32,701][21194] Updated weights for policy 1, policy_version 37080 (0.0007) +[2023-10-08 17:13:33,215][21195] Updated weights for policy 0, policy_version 37350 (0.0010) +[2023-10-08 17:13:33,585][21195] Updated weights for policy 0, policy_version 37360 (0.0010) +[2023-10-08 17:13:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 76218368. Throughput: 0: 1728.9, 1: 1732.2. Samples: 19063744. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:13:33,803][19739] Avg episode reward: [(0, '711.870'), (1, '753.520')] +[2023-10-08 17:13:33,954][21195] Updated weights for policy 0, policy_version 37370 (0.0011) +[2023-10-08 17:13:36,668][21194] Updated weights for policy 1, policy_version 37090 (0.0011) +[2023-10-08 17:13:37,039][21194] Updated weights for policy 1, policy_version 37100 (0.0009) +[2023-10-08 17:13:37,397][21194] Updated weights for policy 1, policy_version 37110 (0.0012) +[2023-10-08 17:13:37,767][21194] Updated weights for policy 1, policy_version 37120 (0.0009) +[2023-10-08 17:13:37,906][21195] Updated weights for policy 0, policy_version 37380 (0.0010) +[2023-10-08 17:13:38,281][21195] Updated weights for policy 0, policy_version 37390 (0.0008) +[2023-10-08 17:13:38,646][21195] Updated weights for policy 0, policy_version 37400 (0.0008) +[2023-10-08 17:13:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 76283904. Throughput: 0: 1744.4, 1: 1726.1. Samples: 19079530. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:13:38,803][19739] Avg episode reward: [(0, '725.080'), (1, '753.520')] +[2023-10-08 17:13:41,814][21194] Updated weights for policy 1, policy_version 37130 (0.0007) +[2023-10-08 17:13:42,171][21194] Updated weights for policy 1, policy_version 37140 (0.0011) +[2023-10-08 17:13:42,539][21194] Updated weights for policy 1, policy_version 37150 (0.0009) +[2023-10-08 17:13:42,668][21195] Updated weights for policy 0, policy_version 37410 (0.0009) +[2023-10-08 17:13:43,072][21195] Updated weights for policy 0, policy_version 37420 (0.0008) +[2023-10-08 17:13:43,442][21195] Updated weights for policy 0, policy_version 37430 (0.0007) +[2023-10-08 17:13:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 76382208. Throughput: 0: 1734.2, 1: 1699.3. Samples: 19099674. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:13:43,803][19739] Avg episode reward: [(0, '746.670'), (1, '753.660')] +[2023-10-08 17:13:43,804][21195] Updated weights for policy 0, policy_version 37440 (0.0007) +[2023-10-08 17:13:46,603][21194] Updated weights for policy 1, policy_version 37160 (0.0007) +[2023-10-08 17:13:46,965][21194] Updated weights for policy 1, policy_version 37170 (0.0007) +[2023-10-08 17:13:47,331][21194] Updated weights for policy 1, policy_version 37180 (0.0010) +[2023-10-08 17:13:47,682][21195] Updated weights for policy 0, policy_version 37450 (0.0009) +[2023-10-08 17:13:48,040][21195] Updated weights for policy 0, policy_version 37460 (0.0009) +[2023-10-08 17:13:48,412][21195] Updated weights for policy 0, policy_version 37470 (0.0009) +[2023-10-08 17:13:48,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 76447744. Throughput: 0: 1710.2, 1: 1728.2. Samples: 19115222. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:13:48,803][19739] Avg episode reward: [(0, '746.670'), (1, '768.780')] +[2023-10-08 17:13:51,323][21194] Updated weights for policy 1, policy_version 37190 (0.0007) +[2023-10-08 17:13:51,685][21194] Updated weights for policy 1, policy_version 37200 (0.0007) +[2023-10-08 17:13:52,044][21194] Updated weights for policy 1, policy_version 37210 (0.0010) +[2023-10-08 17:13:52,451][21195] Updated weights for policy 0, policy_version 37480 (0.0009) +[2023-10-08 17:13:52,834][21195] Updated weights for policy 0, policy_version 37490 (0.0009) +[2023-10-08 17:13:53,208][21195] Updated weights for policy 0, policy_version 37500 (0.0010) +[2023-10-08 17:13:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 76513280. Throughput: 0: 1741.1, 1: 1708.1. Samples: 19130702. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:13:53,803][19739] Avg episode reward: [(0, '747.060'), (1, '766.860')] +[2023-10-08 17:13:55,925][21194] Updated weights for policy 1, policy_version 37220 (0.0007) +[2023-10-08 17:13:56,323][21194] Updated weights for policy 1, policy_version 37230 (0.0007) +[2023-10-08 17:13:56,694][21194] Updated weights for policy 1, policy_version 37240 (0.0007) +[2023-10-08 17:13:57,227][21195] Updated weights for policy 0, policy_version 37510 (0.0009) +[2023-10-08 17:13:57,603][21195] Updated weights for policy 0, policy_version 37520 (0.0007) +[2023-10-08 17:13:57,978][21195] Updated weights for policy 0, policy_version 37530 (0.0007) +[2023-10-08 17:13:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 76578816. Throughput: 0: 1717.9, 1: 1713.2. Samples: 19151022. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 17:13:58,803][19739] Avg episode reward: [(0, '742.550'), (1, '766.860')] +[2023-10-08 17:14:00,597][21194] Updated weights for policy 1, policy_version 37250 (0.0007) +[2023-10-08 17:14:00,963][21194] Updated weights for policy 1, policy_version 37260 (0.0009) +[2023-10-08 17:14:01,330][21194] Updated weights for policy 1, policy_version 37270 (0.0007) +[2023-10-08 17:14:01,687][21194] Updated weights for policy 1, policy_version 37280 (0.0007) +[2023-10-08 17:14:01,888][21195] Updated weights for policy 0, policy_version 37540 (0.0008) +[2023-10-08 17:14:02,260][21195] Updated weights for policy 0, policy_version 37550 (0.0010) +[2023-10-08 17:14:02,630][21195] Updated weights for policy 0, policy_version 37560 (0.0009) +[2023-10-08 17:14:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 76644352. Throughput: 0: 1704.4, 1: 1716.5. Samples: 19166522. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 17:14:03,804][19739] Avg episode reward: [(0, '713.770'), (1, '766.860')] +[2023-10-08 17:14:05,793][21194] Updated weights for policy 1, policy_version 37290 (0.0010) +[2023-10-08 17:14:06,156][21194] Updated weights for policy 1, policy_version 37300 (0.0011) +[2023-10-08 17:14:06,498][21195] Updated weights for policy 0, policy_version 37570 (0.0008) +[2023-10-08 17:14:06,521][21194] Updated weights for policy 1, policy_version 37310 (0.0007) +[2023-10-08 17:14:06,860][21195] Updated weights for policy 0, policy_version 37580 (0.0008) +[2023-10-08 17:14:07,237][21195] Updated weights for policy 0, policy_version 37590 (0.0007) +[2023-10-08 17:14:07,614][21195] Updated weights for policy 0, policy_version 37600 (0.0007) +[2023-10-08 17:14:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 76709888. Throughput: 0: 1723.2, 1: 1694.7. Samples: 19181968. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 17:14:08,803][19739] Avg episode reward: [(0, '713.770'), (1, '766.860')] +[2023-10-08 17:14:10,344][21194] Updated weights for policy 1, policy_version 37320 (0.0008) +[2023-10-08 17:14:10,716][21194] Updated weights for policy 1, policy_version 37330 (0.0009) +[2023-10-08 17:14:11,075][21194] Updated weights for policy 1, policy_version 37340 (0.0009) +[2023-10-08 17:14:11,545][21195] Updated weights for policy 0, policy_version 37610 (0.0007) +[2023-10-08 17:14:11,918][21195] Updated weights for policy 0, policy_version 37620 (0.0010) +[2023-10-08 17:14:12,297][21195] Updated weights for policy 0, policy_version 37630 (0.0009) +[2023-10-08 17:14:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 76775424. Throughput: 0: 1700.9, 1: 1720.7. Samples: 19202436. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 17:14:13,804][19739] Avg episode reward: [(0, '713.770'), (1, '781.840')] +[2023-10-08 17:14:15,140][21194] Updated weights for policy 1, policy_version 37350 (0.0008) +[2023-10-08 17:14:15,502][21194] Updated weights for policy 1, policy_version 37360 (0.0009) +[2023-10-08 17:14:15,874][21194] Updated weights for policy 1, policy_version 37370 (0.0008) +[2023-10-08 17:14:16,310][21195] Updated weights for policy 0, policy_version 37640 (0.0008) +[2023-10-08 17:14:16,679][21195] Updated weights for policy 0, policy_version 37650 (0.0008) +[2023-10-08 17:14:17,043][21195] Updated weights for policy 0, policy_version 37660 (0.0008) +[2023-10-08 17:14:18,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 76840960. Throughput: 0: 1722.5, 1: 1700.4. Samples: 19217776. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 17:14:18,804][19739] Avg episode reward: [(0, '713.770'), (1, '781.840')] +[2023-10-08 17:14:19,738][21194] Updated weights for policy 1, policy_version 37380 (0.0007) +[2023-10-08 17:14:20,100][21194] Updated weights for policy 1, policy_version 37390 (0.0008) +[2023-10-08 17:14:20,470][21194] Updated weights for policy 1, policy_version 37400 (0.0009) +[2023-10-08 17:14:20,862][21195] Updated weights for policy 0, policy_version 37670 (0.0008) +[2023-10-08 17:14:21,240][21195] Updated weights for policy 0, policy_version 37680 (0.0009) +[2023-10-08 17:14:21,610][21195] Updated weights for policy 0, policy_version 37690 (0.0009) +[2023-10-08 17:14:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 76906496. Throughput: 0: 1706.0, 1: 1709.5. Samples: 19233226. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 17:14:23,804][19739] Avg episode reward: [(0, '728.400'), (1, '781.840')] +[2023-10-08 17:14:24,458][21194] Updated weights for policy 1, policy_version 37410 (0.0008) +[2023-10-08 17:14:24,841][21194] Updated weights for policy 1, policy_version 37420 (0.0009) +[2023-10-08 17:14:25,211][21194] Updated weights for policy 1, policy_version 37430 (0.0009) +[2023-10-08 17:14:25,582][21194] Updated weights for policy 1, policy_version 37440 (0.0008) +[2023-10-08 17:14:25,629][21195] Updated weights for policy 0, policy_version 37700 (0.0007) +[2023-10-08 17:14:26,003][21195] Updated weights for policy 0, policy_version 37710 (0.0007) +[2023-10-08 17:14:26,366][21195] Updated weights for policy 0, policy_version 37720 (0.0008) +[2023-10-08 17:14:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 76972032. Throughput: 0: 1707.9, 1: 1730.7. Samples: 19254408. Policy #0 lag: (min: 24.0, avg: 46.1, max: 56.0) +[2023-10-08 17:14:28,803][19739] Avg episode reward: [(0, '742.390'), (1, '781.840')] +[2023-10-08 17:14:29,368][21194] Updated weights for policy 1, policy_version 37450 (0.0007) +[2023-10-08 17:14:29,734][21194] Updated weights for policy 1, policy_version 37460 (0.0008) +[2023-10-08 17:14:30,104][21194] Updated weights for policy 1, policy_version 37470 (0.0009) +[2023-10-08 17:14:30,317][21195] Updated weights for policy 0, policy_version 37730 (0.0007) +[2023-10-08 17:14:30,713][21195] Updated weights for policy 0, policy_version 37740 (0.0009) +[2023-10-08 17:14:31,084][21195] Updated weights for policy 0, policy_version 37750 (0.0009) +[2023-10-08 17:14:31,451][21195] Updated weights for policy 0, policy_version 37760 (0.0008) +[2023-10-08 17:14:33,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 77037568. Throughput: 0: 1728.3, 1: 1703.6. Samples: 19269660. Policy #0 lag: (min: 13.0, avg: 16.4, max: 45.0) +[2023-10-08 17:14:33,803][19739] Avg episode reward: [(0, '742.390'), (1, '782.020')] +[2023-10-08 17:14:34,042][21194] Updated weights for policy 1, policy_version 37480 (0.0009) +[2023-10-08 17:14:34,416][21194] Updated weights for policy 1, policy_version 37490 (0.0008) +[2023-10-08 17:14:34,791][21194] Updated weights for policy 1, policy_version 37500 (0.0010) +[2023-10-08 17:14:35,406][21195] Updated weights for policy 0, policy_version 37770 (0.0010) +[2023-10-08 17:14:35,776][21195] Updated weights for policy 0, policy_version 37780 (0.0008) +[2023-10-08 17:14:36,145][21195] Updated weights for policy 0, policy_version 37790 (0.0011) +[2023-10-08 17:14:38,623][21194] Updated weights for policy 1, policy_version 37510 (0.0011) +[2023-10-08 17:14:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 77103104. Throughput: 0: 1699.9, 1: 1730.8. Samples: 19285084. Policy #0 lag: (min: 13.0, avg: 16.4, max: 45.0) +[2023-10-08 17:14:38,803][19739] Avg episode reward: [(0, '742.390'), (1, '782.020')] +[2023-10-08 17:14:38,985][21194] Updated weights for policy 1, policy_version 37520 (0.0010) +[2023-10-08 17:14:39,353][21194] Updated weights for policy 1, policy_version 37530 (0.0010) +[2023-10-08 17:14:40,327][21195] Updated weights for policy 0, policy_version 37800 (0.0009) +[2023-10-08 17:14:40,697][21195] Updated weights for policy 0, policy_version 37810 (0.0009) +[2023-10-08 17:14:41,068][21195] Updated weights for policy 0, policy_version 37820 (0.0009) +[2023-10-08 17:14:43,517][21194] Updated weights for policy 1, policy_version 37540 (0.0009) +[2023-10-08 17:14:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 77168640. Throughput: 0: 1719.2, 1: 1732.7. Samples: 19306358. Policy #0 lag: (min: 13.0, avg: 16.4, max: 45.0) +[2023-10-08 17:14:43,803][19739] Avg episode reward: [(0, '757.340'), (1, '782.020')] +[2023-10-08 17:14:43,907][21194] Updated weights for policy 1, policy_version 37550 (0.0007) +[2023-10-08 17:14:44,281][21194] Updated weights for policy 1, policy_version 37560 (0.0010) +[2023-10-08 17:14:45,025][21195] Updated weights for policy 0, policy_version 37830 (0.0008) +[2023-10-08 17:14:45,401][21195] Updated weights for policy 0, policy_version 37840 (0.0009) +[2023-10-08 17:14:45,762][21195] Updated weights for policy 0, policy_version 37850 (0.0008) +[2023-10-08 17:14:48,416][21194] Updated weights for policy 1, policy_version 37570 (0.0008) +[2023-10-08 17:14:48,779][21194] Updated weights for policy 1, policy_version 37580 (0.0007) +[2023-10-08 17:14:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 77234176. Throughput: 0: 1735.8, 1: 1717.2. Samples: 19321906. Policy #0 lag: (min: 13.0, avg: 16.4, max: 45.0) +[2023-10-08 17:14:48,804][19739] Avg episode reward: [(0, '757.340'), (1, '782.020')] +[2023-10-08 17:14:49,141][21194] Updated weights for policy 1, policy_version 37590 (0.0008) +[2023-10-08 17:14:49,501][21194] Updated weights for policy 1, policy_version 37600 (0.0008) +[2023-10-08 17:14:49,719][21195] Updated weights for policy 0, policy_version 37860 (0.0008) +[2023-10-08 17:14:50,081][21195] Updated weights for policy 0, policy_version 37870 (0.0007) +[2023-10-08 17:14:50,453][21195] Updated weights for policy 0, policy_version 37880 (0.0009) +[2023-10-08 17:14:53,477][21194] Updated weights for policy 1, policy_version 37610 (0.0009) +[2023-10-08 17:14:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 77299712. Throughput: 0: 1712.0, 1: 1733.3. Samples: 19337010. Policy #0 lag: (min: 13.0, avg: 16.4, max: 45.0) +[2023-10-08 17:14:53,803][19739] Avg episode reward: [(0, '757.340'), (1, '781.470')] +[2023-10-08 17:14:53,848][21194] Updated weights for policy 1, policy_version 37620 (0.0008) +[2023-10-08 17:14:54,219][21194] Updated weights for policy 1, policy_version 37630 (0.0010) +[2023-10-08 17:14:54,304][21195] Updated weights for policy 0, policy_version 37890 (0.0009) +[2023-10-08 17:14:54,677][21195] Updated weights for policy 0, policy_version 37900 (0.0008) +[2023-10-08 17:14:55,046][21195] Updated weights for policy 0, policy_version 37910 (0.0010) +[2023-10-08 17:14:55,415][21195] Updated weights for policy 0, policy_version 37920 (0.0007) +[2023-10-08 17:14:58,021][21194] Updated weights for policy 1, policy_version 37640 (0.0009) +[2023-10-08 17:14:58,385][21194] Updated weights for policy 1, policy_version 37650 (0.0009) +[2023-10-08 17:14:58,753][21194] Updated weights for policy 1, policy_version 37660 (0.0011) +[2023-10-08 17:14:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 77365248. Throughput: 0: 1739.5, 1: 1725.6. Samples: 19358366. Policy #0 lag: (min: 13.0, avg: 16.4, max: 45.0) +[2023-10-08 17:14:58,803][19739] Avg episode reward: [(0, '757.340'), (1, '779.590')] +[2023-10-08 17:14:59,143][21195] Updated weights for policy 0, policy_version 37930 (0.0008) +[2023-10-08 17:14:59,524][21195] Updated weights for policy 0, policy_version 37940 (0.0010) +[2023-10-08 17:14:59,892][21195] Updated weights for policy 0, policy_version 37950 (0.0009) +[2023-10-08 17:15:02,740][21194] Updated weights for policy 1, policy_version 37670 (0.0008) +[2023-10-08 17:15:03,104][21194] Updated weights for policy 1, policy_version 37680 (0.0007) +[2023-10-08 17:15:03,465][21194] Updated weights for policy 1, policy_version 37690 (0.0007) +[2023-10-08 17:15:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 77463552. Throughput: 0: 1734.6, 1: 1730.7. Samples: 19373712. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 17:15:03,803][19739] Avg episode reward: [(0, '761.100'), (1, '775.160')] +[2023-10-08 17:15:03,863][21195] Updated weights for policy 0, policy_version 37960 (0.0009) +[2023-10-08 17:15:04,235][21195] Updated weights for policy 0, policy_version 37970 (0.0011) +[2023-10-08 17:15:04,606][21195] Updated weights for policy 0, policy_version 37980 (0.0008) +[2023-10-08 17:15:07,567][21194] Updated weights for policy 1, policy_version 37700 (0.0009) +[2023-10-08 17:15:07,934][21194] Updated weights for policy 1, policy_version 37710 (0.0007) +[2023-10-08 17:15:08,287][21194] Updated weights for policy 1, policy_version 37720 (0.0008) +[2023-10-08 17:15:08,609][21195] Updated weights for policy 0, policy_version 37990 (0.0008) +[2023-10-08 17:15:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 77529088. Throughput: 0: 1736.1, 1: 1728.3. Samples: 19389122. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 17:15:08,803][19739] Avg episode reward: [(0, '761.300'), (1, '708.390')] +[2023-10-08 17:15:08,979][21195] Updated weights for policy 0, policy_version 38000 (0.0007) +[2023-10-08 17:15:09,353][21195] Updated weights for policy 0, policy_version 38010 (0.0008) +[2023-10-08 17:15:12,229][21194] Updated weights for policy 1, policy_version 37730 (0.0007) +[2023-10-08 17:15:12,600][21194] Updated weights for policy 1, policy_version 37740 (0.0008) +[2023-10-08 17:15:12,967][21194] Updated weights for policy 1, policy_version 37750 (0.0008) +[2023-10-08 17:15:13,277][21195] Updated weights for policy 0, policy_version 38020 (0.0009) +[2023-10-08 17:15:13,333][21194] Updated weights for policy 1, policy_version 37760 (0.0007) +[2023-10-08 17:15:13,642][21195] Updated weights for policy 0, policy_version 38030 (0.0008) +[2023-10-08 17:15:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 77594624. Throughput: 0: 1738.9, 1: 1705.5. Samples: 19409408. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 17:15:13,803][19739] Avg episode reward: [(0, '761.300'), (1, '692.700')] +[2023-10-08 17:15:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000037760_38666240.pth... +[2023-10-08 17:15:13,844][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000036160_37027840.pth +[2023-10-08 17:15:14,007][21195] Updated weights for policy 0, policy_version 38040 (0.0010) +[2023-10-08 17:15:14,304][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000038048_38961152.pth... +[2023-10-08 17:15:14,333][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000036416_37289984.pth +[2023-10-08 17:15:17,103][21194] Updated weights for policy 1, policy_version 37770 (0.0009) +[2023-10-08 17:15:17,462][21194] Updated weights for policy 1, policy_version 37780 (0.0007) +[2023-10-08 17:15:17,833][21194] Updated weights for policy 1, policy_version 37790 (0.0008) +[2023-10-08 17:15:18,116][21195] Updated weights for policy 0, policy_version 38050 (0.0008) +[2023-10-08 17:15:18,535][21195] Updated weights for policy 0, policy_version 38060 (0.0008) +[2023-10-08 17:15:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 77660160. Throughput: 0: 1718.8, 1: 1728.9. Samples: 19424810. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 17:15:18,803][19739] Avg episode reward: [(0, '761.300'), (1, '692.700')] +[2023-10-08 17:15:18,909][21195] Updated weights for policy 0, policy_version 38070 (0.0009) +[2023-10-08 17:15:19,278][21195] Updated weights for policy 0, policy_version 38080 (0.0007) +[2023-10-08 17:15:21,947][21194] Updated weights for policy 1, policy_version 37800 (0.0011) +[2023-10-08 17:15:22,308][21194] Updated weights for policy 1, policy_version 37810 (0.0009) +[2023-10-08 17:15:22,678][21194] Updated weights for policy 1, policy_version 37820 (0.0010) +[2023-10-08 17:15:23,077][21195] Updated weights for policy 0, policy_version 38090 (0.0008) +[2023-10-08 17:15:23,446][21195] Updated weights for policy 0, policy_version 38100 (0.0009) +[2023-10-08 17:15:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 77725696. Throughput: 0: 1736.8, 1: 1714.4. Samples: 19440390. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 17:15:23,804][19739] Avg episode reward: [(0, '761.760'), (1, '692.700')] +[2023-10-08 17:15:23,814][21195] Updated weights for policy 0, policy_version 38110 (0.0009) +[2023-10-08 17:15:26,706][21194] Updated weights for policy 1, policy_version 37830 (0.0007) +[2023-10-08 17:15:27,075][21194] Updated weights for policy 1, policy_version 37840 (0.0007) +[2023-10-08 17:15:27,436][21194] Updated weights for policy 1, policy_version 37850 (0.0008) +[2023-10-08 17:15:27,742][21195] Updated weights for policy 0, policy_version 38120 (0.0008) +[2023-10-08 17:15:28,112][21195] Updated weights for policy 0, policy_version 38130 (0.0009) +[2023-10-08 17:15:28,483][21195] Updated weights for policy 0, policy_version 38140 (0.0008) +[2023-10-08 17:15:28,803][19739] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 77824000. Throughput: 0: 1733.4, 1: 1694.0. Samples: 19460592. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:15:28,804][19739] Avg episode reward: [(0, '761.760'), (1, '692.700')] +[2023-10-08 17:15:31,465][21194] Updated weights for policy 1, policy_version 37860 (0.0008) +[2023-10-08 17:15:31,850][21194] Updated weights for policy 1, policy_version 37870 (0.0009) +[2023-10-08 17:15:32,224][21194] Updated weights for policy 1, policy_version 37880 (0.0009) +[2023-10-08 17:15:32,443][21195] Updated weights for policy 0, policy_version 38150 (0.0008) +[2023-10-08 17:15:32,802][21195] Updated weights for policy 0, policy_version 38160 (0.0010) +[2023-10-08 17:15:33,174][21195] Updated weights for policy 0, policy_version 38170 (0.0009) +[2023-10-08 17:15:33,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 77889536. Throughput: 0: 1703.4, 1: 1723.6. Samples: 19476120. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:15:33,803][19739] Avg episode reward: [(0, '761.760'), (1, '692.700')] +[2023-10-08 17:15:36,067][21194] Updated weights for policy 1, policy_version 37890 (0.0007) +[2023-10-08 17:15:36,430][21194] Updated weights for policy 1, policy_version 37900 (0.0007) +[2023-10-08 17:15:36,792][21194] Updated weights for policy 1, policy_version 37910 (0.0007) +[2023-10-08 17:15:37,125][21195] Updated weights for policy 0, policy_version 38180 (0.0008) +[2023-10-08 17:15:37,160][21194] Updated weights for policy 1, policy_version 37920 (0.0007) +[2023-10-08 17:15:37,491][21195] Updated weights for policy 0, policy_version 38190 (0.0010) +[2023-10-08 17:15:37,859][21195] Updated weights for policy 0, policy_version 38200 (0.0008) +[2023-10-08 17:15:38,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 77955072. Throughput: 0: 1736.3, 1: 1701.3. Samples: 19491704. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:15:38,803][19739] Avg episode reward: [(0, '761.760'), (1, '686.550')] +[2023-10-08 17:15:41,165][21194] Updated weights for policy 1, policy_version 37930 (0.0008) +[2023-10-08 17:15:41,533][21194] Updated weights for policy 1, policy_version 37940 (0.0008) +[2023-10-08 17:15:41,798][21195] Updated weights for policy 0, policy_version 38210 (0.0008) +[2023-10-08 17:15:41,896][21194] Updated weights for policy 1, policy_version 37950 (0.0009) +[2023-10-08 17:15:42,163][21195] Updated weights for policy 0, policy_version 38220 (0.0010) +[2023-10-08 17:15:42,540][21195] Updated weights for policy 0, policy_version 38230 (0.0008) +[2023-10-08 17:15:42,903][21195] Updated weights for policy 0, policy_version 38240 (0.0008) +[2023-10-08 17:15:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 78020608. Throughput: 0: 1703.5, 1: 1705.8. Samples: 19511786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:15:43,803][19739] Avg episode reward: [(0, '761.760'), (1, '686.550')] +[2023-10-08 17:15:45,680][21194] Updated weights for policy 1, policy_version 37960 (0.0010) +[2023-10-08 17:15:46,060][21194] Updated weights for policy 1, policy_version 37970 (0.0008) +[2023-10-08 17:15:46,422][21194] Updated weights for policy 1, policy_version 37980 (0.0008) +[2023-10-08 17:15:46,746][21195] Updated weights for policy 0, policy_version 38250 (0.0007) +[2023-10-08 17:15:47,118][21195] Updated weights for policy 0, policy_version 38260 (0.0008) +[2023-10-08 17:15:47,477][21195] Updated weights for policy 0, policy_version 38270 (0.0007) +[2023-10-08 17:15:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 78086144. Throughput: 0: 1709.6, 1: 1713.8. Samples: 19527766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:15:48,803][19739] Avg episode reward: [(0, '761.820'), (1, '686.550')] +[2023-10-08 17:15:50,323][21194] Updated weights for policy 1, policy_version 37990 (0.0010) +[2023-10-08 17:15:50,690][21194] Updated weights for policy 1, policy_version 38000 (0.0011) +[2023-10-08 17:15:51,066][21194] Updated weights for policy 1, policy_version 38010 (0.0009) +[2023-10-08 17:15:51,430][21195] Updated weights for policy 0, policy_version 38280 (0.0008) +[2023-10-08 17:15:51,806][21195] Updated weights for policy 0, policy_version 38290 (0.0009) +[2023-10-08 17:15:52,171][21195] Updated weights for policy 0, policy_version 38300 (0.0007) +[2023-10-08 17:15:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 78151680. Throughput: 0: 1720.3, 1: 1702.4. Samples: 19543144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:15:53,804][19739] Avg episode reward: [(0, '761.820'), (1, '701.460')] +[2023-10-08 17:15:55,157][21194] Updated weights for policy 1, policy_version 38020 (0.0008) +[2023-10-08 17:15:55,525][21194] Updated weights for policy 1, policy_version 38030 (0.0008) +[2023-10-08 17:15:55,869][21195] Updated weights for policy 0, policy_version 38310 (0.0007) +[2023-10-08 17:15:55,891][21194] Updated weights for policy 1, policy_version 38040 (0.0008) +[2023-10-08 17:15:56,243][21195] Updated weights for policy 0, policy_version 38320 (0.0010) +[2023-10-08 17:15:56,617][21195] Updated weights for policy 0, policy_version 38330 (0.0007) +[2023-10-08 17:15:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 78217216. Throughput: 0: 1708.7, 1: 1727.9. Samples: 19564056. Policy #0 lag: (min: 24.0, avg: 49.2, max: 56.0) +[2023-10-08 17:15:58,803][19739] Avg episode reward: [(0, '761.820'), (1, '701.460')] +[2023-10-08 17:15:59,945][21194] Updated weights for policy 1, policy_version 38050 (0.0007) +[2023-10-08 17:16:00,305][21194] Updated weights for policy 1, policy_version 38060 (0.0007) +[2023-10-08 17:16:00,404][21195] Updated weights for policy 0, policy_version 38340 (0.0007) +[2023-10-08 17:16:00,675][21194] Updated weights for policy 1, policy_version 38070 (0.0007) +[2023-10-08 17:16:00,774][21195] Updated weights for policy 0, policy_version 38350 (0.0009) +[2023-10-08 17:16:01,038][21194] Updated weights for policy 1, policy_version 38080 (0.0008) +[2023-10-08 17:16:01,148][21195] Updated weights for policy 0, policy_version 38360 (0.0008) +[2023-10-08 17:16:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78282752. Throughput: 0: 1730.6, 1: 1702.3. Samples: 19579290. Policy #0 lag: (min: 24.0, avg: 49.2, max: 56.0) +[2023-10-08 17:16:03,804][19739] Avg episode reward: [(0, '773.350'), (1, '701.460')] +[2023-10-08 17:16:04,851][21194] Updated weights for policy 1, policy_version 38090 (0.0010) +[2023-10-08 17:16:05,222][21194] Updated weights for policy 1, policy_version 38100 (0.0009) +[2023-10-08 17:16:05,331][21195] Updated weights for policy 0, policy_version 38370 (0.0008) +[2023-10-08 17:16:05,587][21194] Updated weights for policy 1, policy_version 38110 (0.0008) +[2023-10-08 17:16:05,738][21195] Updated weights for policy 0, policy_version 38380 (0.0008) +[2023-10-08 17:16:06,112][21195] Updated weights for policy 0, policy_version 38390 (0.0010) +[2023-10-08 17:16:06,479][21195] Updated weights for policy 0, policy_version 38400 (0.0011) +[2023-10-08 17:16:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78348288. Throughput: 0: 1707.8, 1: 1725.0. Samples: 19594864. Policy #0 lag: (min: 24.0, avg: 49.2, max: 56.0) +[2023-10-08 17:16:08,803][19739] Avg episode reward: [(0, '773.350'), (1, '710.110')] +[2023-10-08 17:16:09,190][21194] Updated weights for policy 1, policy_version 38120 (0.0008) +[2023-10-08 17:16:09,558][21194] Updated weights for policy 1, policy_version 38130 (0.0007) +[2023-10-08 17:16:09,929][21194] Updated weights for policy 1, policy_version 38140 (0.0009) +[2023-10-08 17:16:10,348][21195] Updated weights for policy 0, policy_version 38410 (0.0009) +[2023-10-08 17:16:10,709][21195] Updated weights for policy 0, policy_version 38420 (0.0008) +[2023-10-08 17:16:11,080][21195] Updated weights for policy 0, policy_version 38430 (0.0009) +[2023-10-08 17:16:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78413824. Throughput: 0: 1715.7, 1: 1745.3. Samples: 19616340. Policy #0 lag: (min: 24.0, avg: 49.2, max: 56.0) +[2023-10-08 17:16:13,803][19739] Avg episode reward: [(0, '773.350'), (1, '710.340')] +[2023-10-08 17:16:13,920][21194] Updated weights for policy 1, policy_version 38150 (0.0009) +[2023-10-08 17:16:14,298][21194] Updated weights for policy 1, policy_version 38160 (0.0008) +[2023-10-08 17:16:14,651][21194] Updated weights for policy 1, policy_version 38170 (0.0010) +[2023-10-08 17:16:14,891][21195] Updated weights for policy 0, policy_version 38440 (0.0008) +[2023-10-08 17:16:15,265][21195] Updated weights for policy 0, policy_version 38450 (0.0007) +[2023-10-08 17:16:15,637][21195] Updated weights for policy 0, policy_version 38460 (0.0009) +[2023-10-08 17:16:18,617][21194] Updated weights for policy 1, policy_version 38180 (0.0008) +[2023-10-08 17:16:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78479360. Throughput: 0: 1741.6, 1: 1716.8. Samples: 19631746. Policy #0 lag: (min: 24.0, avg: 49.2, max: 56.0) +[2023-10-08 17:16:18,803][19739] Avg episode reward: [(0, '773.350'), (1, '697.850')] +[2023-10-08 17:16:19,000][21194] Updated weights for policy 1, policy_version 38190 (0.0008) +[2023-10-08 17:16:19,365][21194] Updated weights for policy 1, policy_version 38200 (0.0007) +[2023-10-08 17:16:19,743][21195] Updated weights for policy 0, policy_version 38470 (0.0008) +[2023-10-08 17:16:20,112][21195] Updated weights for policy 0, policy_version 38480 (0.0011) +[2023-10-08 17:16:20,485][21195] Updated weights for policy 0, policy_version 38490 (0.0009) +[2023-10-08 17:16:23,333][21194] Updated weights for policy 1, policy_version 38210 (0.0008) +[2023-10-08 17:16:23,694][21194] Updated weights for policy 1, policy_version 38220 (0.0007) +[2023-10-08 17:16:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 78544896. Throughput: 0: 1710.6, 1: 1743.2. Samples: 19647126. Policy #0 lag: (min: 24.0, avg: 49.2, max: 56.0) +[2023-10-08 17:16:23,803][19739] Avg episode reward: [(0, '773.350'), (1, '714.830')] +[2023-10-08 17:16:24,064][21194] Updated weights for policy 1, policy_version 38230 (0.0009) +[2023-10-08 17:16:24,438][21194] Updated weights for policy 1, policy_version 38240 (0.0007) +[2023-10-08 17:16:24,463][21195] Updated weights for policy 0, policy_version 38500 (0.0008) +[2023-10-08 17:16:24,841][21195] Updated weights for policy 0, policy_version 38510 (0.0009) +[2023-10-08 17:16:25,209][21195] Updated weights for policy 0, policy_version 38520 (0.0007) +[2023-10-08 17:16:28,489][21194] Updated weights for policy 1, policy_version 38250 (0.0010) +[2023-10-08 17:16:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.3, 300 sec: 13662.6). Total num frames: 78610432. Throughput: 0: 1741.7, 1: 1746.6. Samples: 19668762. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:16:28,803][19739] Avg episode reward: [(0, '772.830'), (1, '714.830')] +[2023-10-08 17:16:28,852][21194] Updated weights for policy 1, policy_version 38260 (0.0007) +[2023-10-08 17:16:29,149][21195] Updated weights for policy 0, policy_version 38530 (0.0007) +[2023-10-08 17:16:29,227][21194] Updated weights for policy 1, policy_version 38270 (0.0008) +[2023-10-08 17:16:29,514][21195] Updated weights for policy 0, policy_version 38540 (0.0008) +[2023-10-08 17:16:29,894][21195] Updated weights for policy 0, policy_version 38550 (0.0009) +[2023-10-08 17:16:30,255][21195] Updated weights for policy 0, policy_version 38560 (0.0009) +[2023-10-08 17:16:33,010][21194] Updated weights for policy 1, policy_version 38280 (0.0010) +[2023-10-08 17:16:33,368][21194] Updated weights for policy 1, policy_version 38290 (0.0011) +[2023-10-08 17:16:33,736][21194] Updated weights for policy 1, policy_version 38300 (0.0007) +[2023-10-08 17:16:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 78675968. Throughput: 0: 1740.2, 1: 1734.6. Samples: 19684134. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:16:33,803][19739] Avg episode reward: [(0, '772.830'), (1, '714.830')] +[2023-10-08 17:16:34,046][21195] Updated weights for policy 0, policy_version 38570 (0.0010) +[2023-10-08 17:16:34,417][21195] Updated weights for policy 0, policy_version 38580 (0.0010) +[2023-10-08 17:16:34,793][21195] Updated weights for policy 0, policy_version 38590 (0.0009) +[2023-10-08 17:16:37,615][21194] Updated weights for policy 1, policy_version 38310 (0.0009) +[2023-10-08 17:16:37,982][21194] Updated weights for policy 1, policy_version 38320 (0.0011) +[2023-10-08 17:16:38,357][21194] Updated weights for policy 1, policy_version 38330 (0.0009) +[2023-10-08 17:16:38,773][21195] Updated weights for policy 0, policy_version 38600 (0.0008) +[2023-10-08 17:16:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78774272. Throughput: 0: 1733.5, 1: 1749.3. Samples: 19699868. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:16:38,803][19739] Avg episode reward: [(0, '772.830'), (1, '714.830')] +[2023-10-08 17:16:39,143][21195] Updated weights for policy 0, policy_version 38610 (0.0010) +[2023-10-08 17:16:39,505][21195] Updated weights for policy 0, policy_version 38620 (0.0011) +[2023-10-08 17:16:42,153][21194] Updated weights for policy 1, policy_version 38340 (0.0010) +[2023-10-08 17:16:42,523][21194] Updated weights for policy 1, policy_version 38350 (0.0010) +[2023-10-08 17:16:42,893][21194] Updated weights for policy 1, policy_version 38360 (0.0008) +[2023-10-08 17:16:43,395][21195] Updated weights for policy 0, policy_version 38630 (0.0009) +[2023-10-08 17:16:43,766][21195] Updated weights for policy 0, policy_version 38640 (0.0007) +[2023-10-08 17:16:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78839808. Throughput: 0: 1749.6, 1: 1724.9. Samples: 19720408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:16:43,803][19739] Avg episode reward: [(0, '786.670'), (1, '714.830')] +[2023-10-08 17:16:44,134][21195] Updated weights for policy 0, policy_version 38650 (0.0008) +[2023-10-08 17:16:46,970][21194] Updated weights for policy 1, policy_version 38370 (0.0007) +[2023-10-08 17:16:47,326][21194] Updated weights for policy 1, policy_version 38380 (0.0008) +[2023-10-08 17:16:47,686][21194] Updated weights for policy 1, policy_version 38390 (0.0008) +[2023-10-08 17:16:47,829][21195] Updated weights for policy 0, policy_version 38660 (0.0008) +[2023-10-08 17:16:48,046][21194] Updated weights for policy 1, policy_version 38400 (0.0008) +[2023-10-08 17:16:48,193][21195] Updated weights for policy 0, policy_version 38670 (0.0009) +[2023-10-08 17:16:48,560][21195] Updated weights for policy 0, policy_version 38680 (0.0008) +[2023-10-08 17:16:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 78905344. Throughput: 0: 1732.4, 1: 1746.7. Samples: 19735850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:16:48,803][19739] Avg episode reward: [(0, '801.520'), (1, '714.830')] +[2023-10-08 17:16:51,979][21194] Updated weights for policy 1, policy_version 38410 (0.0010) +[2023-10-08 17:16:52,339][21194] Updated weights for policy 1, policy_version 38420 (0.0011) +[2023-10-08 17:16:52,584][21195] Updated weights for policy 0, policy_version 38690 (0.0008) +[2023-10-08 17:16:52,706][21194] Updated weights for policy 1, policy_version 38430 (0.0009) +[2023-10-08 17:16:52,979][21195] Updated weights for policy 0, policy_version 38700 (0.0008) +[2023-10-08 17:16:53,347][21195] Updated weights for policy 0, policy_version 38710 (0.0007) +[2023-10-08 17:16:53,709][21195] Updated weights for policy 0, policy_version 38720 (0.0008) +[2023-10-08 17:16:53,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 79003648. Throughput: 0: 1759.5, 1: 1731.9. Samples: 19751980. Policy #0 lag: (min: 31.0, avg: 35.9, max: 63.0) +[2023-10-08 17:16:53,804][19739] Avg episode reward: [(0, '762.280'), (1, '714.830')] +[2023-10-08 17:16:56,711][21194] Updated weights for policy 1, policy_version 38440 (0.0008) +[2023-10-08 17:16:57,073][21194] Updated weights for policy 1, policy_version 38450 (0.0008) +[2023-10-08 17:16:57,446][21194] Updated weights for policy 1, policy_version 38460 (0.0008) +[2023-10-08 17:16:57,508][21195] Updated weights for policy 0, policy_version 38730 (0.0007) +[2023-10-08 17:16:57,873][21195] Updated weights for policy 0, policy_version 38740 (0.0009) +[2023-10-08 17:16:58,244][21195] Updated weights for policy 0, policy_version 38750 (0.0009) +[2023-10-08 17:16:58,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 79069184. Throughput: 0: 1742.4, 1: 1712.8. Samples: 19771824. Policy #0 lag: (min: 31.0, avg: 35.9, max: 63.0) +[2023-10-08 17:16:58,803][19739] Avg episode reward: [(0, '761.270'), (1, '735.960')] +[2023-10-08 17:17:01,344][21194] Updated weights for policy 1, policy_version 38470 (0.0008) +[2023-10-08 17:17:01,721][21194] Updated weights for policy 1, policy_version 38480 (0.0007) +[2023-10-08 17:17:02,078][21194] Updated weights for policy 1, policy_version 38490 (0.0009) +[2023-10-08 17:17:02,084][21195] Updated weights for policy 0, policy_version 38760 (0.0010) +[2023-10-08 17:17:02,445][21195] Updated weights for policy 0, policy_version 38770 (0.0009) +[2023-10-08 17:17:02,825][21195] Updated weights for policy 0, policy_version 38780 (0.0009) +[2023-10-08 17:17:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 79134720. Throughput: 0: 1726.6, 1: 1743.4. Samples: 19787894. Policy #0 lag: (min: 31.0, avg: 35.9, max: 63.0) +[2023-10-08 17:17:03,803][19739] Avg episode reward: [(0, '761.270'), (1, '735.960')] +[2023-10-08 17:17:06,150][21194] Updated weights for policy 1, policy_version 38500 (0.0008) +[2023-10-08 17:17:06,531][21194] Updated weights for policy 1, policy_version 38510 (0.0009) +[2023-10-08 17:17:06,893][21194] Updated weights for policy 1, policy_version 38520 (0.0009) +[2023-10-08 17:17:06,937][21195] Updated weights for policy 0, policy_version 38790 (0.0009) +[2023-10-08 17:17:07,312][21195] Updated weights for policy 0, policy_version 38800 (0.0009) +[2023-10-08 17:17:07,681][21195] Updated weights for policy 0, policy_version 38810 (0.0010) +[2023-10-08 17:17:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 79200256. Throughput: 0: 1751.5, 1: 1715.1. Samples: 19803120. Policy #0 lag: (min: 31.0, avg: 35.9, max: 63.0) +[2023-10-08 17:17:08,803][19739] Avg episode reward: [(0, '761.270'), (1, '721.410')] +[2023-10-08 17:17:10,918][21194] Updated weights for policy 1, policy_version 38530 (0.0009) +[2023-10-08 17:17:11,283][21194] Updated weights for policy 1, policy_version 38540 (0.0007) +[2023-10-08 17:17:11,597][21195] Updated weights for policy 0, policy_version 38820 (0.0007) +[2023-10-08 17:17:11,648][21194] Updated weights for policy 1, policy_version 38550 (0.0008) +[2023-10-08 17:17:11,973][21195] Updated weights for policy 0, policy_version 38830 (0.0009) +[2023-10-08 17:17:12,012][21194] Updated weights for policy 1, policy_version 38560 (0.0009) +[2023-10-08 17:17:12,343][21195] Updated weights for policy 0, policy_version 38840 (0.0010) +[2023-10-08 17:17:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 79265792. Throughput: 0: 1720.3, 1: 1706.4. Samples: 19822966. Policy #0 lag: (min: 31.0, avg: 35.9, max: 63.0) +[2023-10-08 17:17:13,803][19739] Avg episode reward: [(0, '761.270'), (1, '721.410')] +[2023-10-08 17:17:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000038848_39780352.pth... +[2023-10-08 17:17:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000038560_39485440.pth... +[2023-10-08 17:17:13,842][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000037216_38109184.pth +[2023-10-08 17:17:13,853][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000036960_37847040.pth +[2023-10-08 17:17:15,947][21194] Updated weights for policy 1, policy_version 38570 (0.0007) +[2023-10-08 17:17:16,317][21194] Updated weights for policy 1, policy_version 38580 (0.0009) +[2023-10-08 17:17:16,354][21195] Updated weights for policy 0, policy_version 38850 (0.0010) +[2023-10-08 17:17:16,685][21194] Updated weights for policy 1, policy_version 38590 (0.0007) +[2023-10-08 17:17:16,721][21195] Updated weights for policy 0, policy_version 38860 (0.0008) +[2023-10-08 17:17:17,103][21195] Updated weights for policy 0, policy_version 38870 (0.0010) +[2023-10-08 17:17:17,475][21195] Updated weights for policy 0, policy_version 38880 (0.0010) +[2023-10-08 17:17:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 79331328. Throughput: 0: 1722.5, 1: 1722.5. Samples: 19839158. Policy #0 lag: (min: 31.0, avg: 35.9, max: 63.0) +[2023-10-08 17:17:18,803][19739] Avg episode reward: [(0, '761.270'), (1, '721.410')] +[2023-10-08 17:17:20,519][21194] Updated weights for policy 1, policy_version 38600 (0.0008) +[2023-10-08 17:17:20,883][21194] Updated weights for policy 1, policy_version 38610 (0.0008) +[2023-10-08 17:17:21,241][21194] Updated weights for policy 1, policy_version 38620 (0.0008) +[2023-10-08 17:17:21,284][21195] Updated weights for policy 0, policy_version 38890 (0.0008) +[2023-10-08 17:17:21,666][21195] Updated weights for policy 0, policy_version 38900 (0.0009) +[2023-10-08 17:17:22,035][21195] Updated weights for policy 0, policy_version 38910 (0.0009) +[2023-10-08 17:17:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 79396864. Throughput: 0: 1727.6, 1: 1701.2. Samples: 19854164. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 17:17:23,803][19739] Avg episode reward: [(0, '761.270'), (1, '721.410')] +[2023-10-08 17:17:25,255][21194] Updated weights for policy 1, policy_version 38630 (0.0008) +[2023-10-08 17:17:25,622][21194] Updated weights for policy 1, policy_version 38640 (0.0010) +[2023-10-08 17:17:25,881][21195] Updated weights for policy 0, policy_version 38920 (0.0009) +[2023-10-08 17:17:26,004][21194] Updated weights for policy 1, policy_version 38650 (0.0009) +[2023-10-08 17:17:26,254][21195] Updated weights for policy 0, policy_version 38930 (0.0009) +[2023-10-08 17:17:26,625][21195] Updated weights for policy 0, policy_version 38940 (0.0008) +[2023-10-08 17:17:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 79462400. Throughput: 0: 1718.0, 1: 1717.6. Samples: 19875010. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 17:17:28,803][19739] Avg episode reward: [(0, '761.270'), (1, '721.410')] +[2023-10-08 17:17:30,088][21194] Updated weights for policy 1, policy_version 38660 (0.0007) +[2023-10-08 17:17:30,455][21194] Updated weights for policy 1, policy_version 38670 (0.0008) +[2023-10-08 17:17:30,599][21195] Updated weights for policy 0, policy_version 38950 (0.0007) +[2023-10-08 17:17:30,823][21194] Updated weights for policy 1, policy_version 38680 (0.0008) +[2023-10-08 17:17:30,959][21195] Updated weights for policy 0, policy_version 38960 (0.0010) +[2023-10-08 17:17:31,323][21195] Updated weights for policy 0, policy_version 38970 (0.0010) +[2023-10-08 17:17:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 79527936. Throughput: 0: 1740.1, 1: 1697.9. Samples: 19890558. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 17:17:33,804][19739] Avg episode reward: [(0, '763.140'), (1, '715.940')] +[2023-10-08 17:17:34,746][21194] Updated weights for policy 1, policy_version 38690 (0.0007) +[2023-10-08 17:17:35,114][21194] Updated weights for policy 1, policy_version 38700 (0.0007) +[2023-10-08 17:17:35,257][21195] Updated weights for policy 0, policy_version 38980 (0.0008) +[2023-10-08 17:17:35,472][21194] Updated weights for policy 1, policy_version 38710 (0.0009) +[2023-10-08 17:17:35,619][21195] Updated weights for policy 0, policy_version 38990 (0.0008) +[2023-10-08 17:17:35,832][21194] Updated weights for policy 1, policy_version 38720 (0.0009) +[2023-10-08 17:17:35,998][21195] Updated weights for policy 0, policy_version 39000 (0.0009) +[2023-10-08 17:17:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 79593472. Throughput: 0: 1716.4, 1: 1703.6. Samples: 19905880. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 17:17:38,803][19739] Avg episode reward: [(0, '763.140'), (1, '700.160')] +[2023-10-08 17:17:39,824][21194] Updated weights for policy 1, policy_version 38730 (0.0011) +[2023-10-08 17:17:40,005][21195] Updated weights for policy 0, policy_version 39010 (0.0010) +[2023-10-08 17:17:40,193][21194] Updated weights for policy 1, policy_version 38740 (0.0007) +[2023-10-08 17:17:40,392][21195] Updated weights for policy 0, policy_version 39020 (0.0009) +[2023-10-08 17:17:40,554][21194] Updated weights for policy 1, policy_version 38750 (0.0009) +[2023-10-08 17:17:40,759][21195] Updated weights for policy 0, policy_version 39030 (0.0010) +[2023-10-08 17:17:41,127][21195] Updated weights for policy 0, policy_version 39040 (0.0008) +[2023-10-08 17:17:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 79659008. Throughput: 0: 1727.2, 1: 1713.2. Samples: 19926642. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 17:17:43,804][19739] Avg episode reward: [(0, '763.140'), (1, '714.160')] +[2023-10-08 17:17:44,635][21194] Updated weights for policy 1, policy_version 38760 (0.0009) +[2023-10-08 17:17:44,976][21195] Updated weights for policy 0, policy_version 39050 (0.0008) +[2023-10-08 17:17:45,000][21194] Updated weights for policy 1, policy_version 38770 (0.0008) +[2023-10-08 17:17:45,349][21195] Updated weights for policy 0, policy_version 39060 (0.0008) +[2023-10-08 17:17:45,369][21194] Updated weights for policy 1, policy_version 38780 (0.0007) +[2023-10-08 17:17:45,716][21195] Updated weights for policy 0, policy_version 39070 (0.0007) +[2023-10-08 17:17:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 79724544. Throughput: 0: 1746.9, 1: 1681.4. Samples: 19942166. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 17:17:48,803][19739] Avg episode reward: [(0, '762.000'), (1, '714.160')] +[2023-10-08 17:17:49,419][21194] Updated weights for policy 1, policy_version 38790 (0.0007) +[2023-10-08 17:17:49,615][21195] Updated weights for policy 0, policy_version 39080 (0.0009) +[2023-10-08 17:17:49,782][21194] Updated weights for policy 1, policy_version 38800 (0.0007) +[2023-10-08 17:17:49,978][21195] Updated weights for policy 0, policy_version 39090 (0.0007) +[2023-10-08 17:17:50,149][21194] Updated weights for policy 1, policy_version 38810 (0.0009) +[2023-10-08 17:17:50,346][21195] Updated weights for policy 0, policy_version 39100 (0.0008) +[2023-10-08 17:17:53,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 79790080. Throughput: 0: 1720.5, 1: 1705.6. Samples: 19957296. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 17:17:53,803][19739] Avg episode reward: [(0, '771.600'), (1, '714.200')] +[2023-10-08 17:17:54,167][21195] Updated weights for policy 0, policy_version 39110 (0.0010) +[2023-10-08 17:17:54,327][21194] Updated weights for policy 1, policy_version 38820 (0.0009) +[2023-10-08 17:17:54,535][21195] Updated weights for policy 0, policy_version 39120 (0.0009) +[2023-10-08 17:17:54,722][21194] Updated weights for policy 1, policy_version 38830 (0.0008) +[2023-10-08 17:17:54,910][21195] Updated weights for policy 0, policy_version 39130 (0.0007) +[2023-10-08 17:17:55,089][21194] Updated weights for policy 1, policy_version 38840 (0.0008) +[2023-10-08 17:17:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 79855616. Throughput: 0: 1751.7, 1: 1710.0. Samples: 19978744. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 17:17:58,803][19739] Avg episode reward: [(0, '755.420'), (1, '714.330')] +[2023-10-08 17:17:58,891][21195] Updated weights for policy 0, policy_version 39140 (0.0008) +[2023-10-08 17:17:58,943][21194] Updated weights for policy 1, policy_version 38850 (0.0009) +[2023-10-08 17:17:59,257][21195] Updated weights for policy 0, policy_version 39150 (0.0008) +[2023-10-08 17:17:59,313][21194] Updated weights for policy 1, policy_version 38860 (0.0008) +[2023-10-08 17:17:59,629][21195] Updated weights for policy 0, policy_version 39160 (0.0008) +[2023-10-08 17:17:59,671][21194] Updated weights for policy 1, policy_version 38870 (0.0008) +[2023-10-08 17:18:00,040][21194] Updated weights for policy 1, policy_version 38880 (0.0007) +[2023-10-08 17:18:03,530][21195] Updated weights for policy 0, policy_version 39170 (0.0007) +[2023-10-08 17:18:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 79921152. Throughput: 0: 1748.7, 1: 1691.1. Samples: 19993950. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 17:18:03,803][19739] Avg episode reward: [(0, '755.600'), (1, '714.330')] +[2023-10-08 17:18:03,903][21195] Updated weights for policy 0, policy_version 39180 (0.0009) +[2023-10-08 17:18:04,057][21194] Updated weights for policy 1, policy_version 38890 (0.0008) +[2023-10-08 17:18:04,279][21195] Updated weights for policy 0, policy_version 39190 (0.0007) +[2023-10-08 17:18:04,423][21194] Updated weights for policy 1, policy_version 38900 (0.0007) +[2023-10-08 17:18:04,644][21195] Updated weights for policy 0, policy_version 39200 (0.0007) +[2023-10-08 17:18:04,788][21194] Updated weights for policy 1, policy_version 38910 (0.0010) +[2023-10-08 17:18:08,596][21195] Updated weights for policy 0, policy_version 39210 (0.0007) +[2023-10-08 17:18:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 79986688. Throughput: 0: 1744.8, 1: 1704.1. Samples: 20009362. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 17:18:08,803][19739] Avg episode reward: [(0, '758.500'), (1, '714.330')] +[2023-10-08 17:18:08,881][21194] Updated weights for policy 1, policy_version 38920 (0.0008) +[2023-10-08 17:18:08,956][21195] Updated weights for policy 0, policy_version 39220 (0.0007) +[2023-10-08 17:18:09,241][21194] Updated weights for policy 1, policy_version 38930 (0.0008) +[2023-10-08 17:18:09,323][21195] Updated weights for policy 0, policy_version 39230 (0.0008) +[2023-10-08 17:18:09,603][21194] Updated weights for policy 1, policy_version 38940 (0.0009) +[2023-10-08 17:18:13,254][21195] Updated weights for policy 0, policy_version 39240 (0.0009) +[2023-10-08 17:18:13,537][21194] Updated weights for policy 1, policy_version 38950 (0.0009) +[2023-10-08 17:18:13,615][21195] Updated weights for policy 0, policy_version 39250 (0.0008) +[2023-10-08 17:18:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 80052224. Throughput: 0: 1752.5, 1: 1711.5. Samples: 20030888. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 17:18:13,804][19739] Avg episode reward: [(0, '773.250'), (1, '714.330')] +[2023-10-08 17:18:13,908][21194] Updated weights for policy 1, policy_version 38960 (0.0008) +[2023-10-08 17:18:13,988][21195] Updated weights for policy 0, policy_version 39260 (0.0009) +[2023-10-08 17:18:14,270][21194] Updated weights for policy 1, policy_version 38970 (0.0007) +[2023-10-08 17:18:17,891][21195] Updated weights for policy 0, policy_version 39270 (0.0007) +[2023-10-08 17:18:18,257][21195] Updated weights for policy 0, policy_version 39280 (0.0009) +[2023-10-08 17:18:18,263][21194] Updated weights for policy 1, policy_version 38980 (0.0009) +[2023-10-08 17:18:18,620][21195] Updated weights for policy 0, policy_version 39290 (0.0008) +[2023-10-08 17:18:18,625][21194] Updated weights for policy 1, policy_version 38990 (0.0007) +[2023-10-08 17:18:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 80117760. Throughput: 0: 1724.3, 1: 1709.5. Samples: 20045078. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 17:18:18,803][19739] Avg episode reward: [(0, '759.910'), (1, '714.330')] +[2023-10-08 17:18:18,983][21194] Updated weights for policy 1, policy_version 39000 (0.0009) +[2023-10-08 17:18:22,321][21195] Updated weights for policy 0, policy_version 39300 (0.0010) +[2023-10-08 17:18:22,690][21195] Updated weights for policy 0, policy_version 39310 (0.0010) +[2023-10-08 17:18:23,008][21194] Updated weights for policy 1, policy_version 39010 (0.0010) +[2023-10-08 17:18:23,073][21195] Updated weights for policy 0, policy_version 39320 (0.0009) +[2023-10-08 17:18:23,382][21194] Updated weights for policy 1, policy_version 39020 (0.0009) +[2023-10-08 17:18:23,745][21194] Updated weights for policy 1, policy_version 39030 (0.0010) +[2023-10-08 17:18:23,803][19739] Fps is (10 sec: 16384.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 80216064. Throughput: 0: 1754.4, 1: 1702.6. Samples: 20061448. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:18:23,803][19739] Avg episode reward: [(0, '759.910'), (1, '729.330')] +[2023-10-08 17:18:24,112][21194] Updated weights for policy 1, policy_version 39040 (0.0010) +[2023-10-08 17:18:27,159][21195] Updated weights for policy 0, policy_version 39330 (0.0008) +[2023-10-08 17:18:27,576][21195] Updated weights for policy 0, policy_version 39340 (0.0008) +[2023-10-08 17:18:27,934][21195] Updated weights for policy 0, policy_version 39350 (0.0008) +[2023-10-08 17:18:28,030][21194] Updated weights for policy 1, policy_version 39050 (0.0007) +[2023-10-08 17:18:28,305][21195] Updated weights for policy 0, policy_version 39360 (0.0008) +[2023-10-08 17:18:28,395][21194] Updated weights for policy 1, policy_version 39060 (0.0007) +[2023-10-08 17:18:28,766][21194] Updated weights for policy 1, policy_version 39070 (0.0009) +[2023-10-08 17:18:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 80281600. Throughput: 0: 1737.7, 1: 1705.0. Samples: 20081566. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:18:28,803][19739] Avg episode reward: [(0, '759.910'), (1, '729.330')] +[2023-10-08 17:18:32,274][21195] Updated weights for policy 0, policy_version 39370 (0.0007) +[2023-10-08 17:18:32,649][21195] Updated weights for policy 0, policy_version 39380 (0.0007) +[2023-10-08 17:18:32,694][21194] Updated weights for policy 1, policy_version 39080 (0.0008) +[2023-10-08 17:18:33,008][21195] Updated weights for policy 0, policy_version 39390 (0.0008) +[2023-10-08 17:18:33,048][21194] Updated weights for policy 1, policy_version 39090 (0.0007) +[2023-10-08 17:18:33,412][21194] Updated weights for policy 1, policy_version 39100 (0.0009) +[2023-10-08 17:18:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 80379904. Throughput: 0: 1715.2, 1: 1717.4. Samples: 20096636. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:18:33,803][19739] Avg episode reward: [(0, '760.000'), (1, '729.330')] +[2023-10-08 17:18:36,859][21195] Updated weights for policy 0, policy_version 39400 (0.0009) +[2023-10-08 17:18:37,224][21195] Updated weights for policy 0, policy_version 39410 (0.0008) +[2023-10-08 17:18:37,278][21194] Updated weights for policy 1, policy_version 39110 (0.0008) +[2023-10-08 17:18:37,590][21195] Updated weights for policy 0, policy_version 39420 (0.0007) +[2023-10-08 17:18:37,638][21194] Updated weights for policy 1, policy_version 39120 (0.0008) +[2023-10-08 17:18:38,011][21194] Updated weights for policy 1, policy_version 39130 (0.0010) +[2023-10-08 17:18:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 80445440. Throughput: 0: 1743.1, 1: 1723.4. Samples: 20113290. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:18:38,803][19739] Avg episode reward: [(0, '746.230'), (1, '729.330')] +[2023-10-08 17:18:41,629][21195] Updated weights for policy 0, policy_version 39430 (0.0008) +[2023-10-08 17:18:41,999][21195] Updated weights for policy 0, policy_version 39440 (0.0009) +[2023-10-08 17:18:42,162][21194] Updated weights for policy 1, policy_version 39140 (0.0009) +[2023-10-08 17:18:42,368][21195] Updated weights for policy 0, policy_version 39450 (0.0008) +[2023-10-08 17:18:42,561][21194] Updated weights for policy 1, policy_version 39150 (0.0008) +[2023-10-08 17:18:42,934][21194] Updated weights for policy 1, policy_version 39160 (0.0009) +[2023-10-08 17:18:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 80510976. Throughput: 0: 1714.6, 1: 1695.7. Samples: 20132208. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:18:43,803][19739] Avg episode reward: [(0, '746.230'), (1, '729.330')] +[2023-10-08 17:18:46,289][21195] Updated weights for policy 0, policy_version 39460 (0.0009) +[2023-10-08 17:18:46,661][21195] Updated weights for policy 0, policy_version 39470 (0.0011) +[2023-10-08 17:18:46,804][21194] Updated weights for policy 1, policy_version 39170 (0.0007) +[2023-10-08 17:18:47,037][21195] Updated weights for policy 0, policy_version 39480 (0.0008) +[2023-10-08 17:18:47,173][21194] Updated weights for policy 1, policy_version 39180 (0.0009) +[2023-10-08 17:18:47,534][21194] Updated weights for policy 1, policy_version 39190 (0.0007) +[2023-10-08 17:18:47,893][21194] Updated weights for policy 1, policy_version 39200 (0.0007) +[2023-10-08 17:18:48,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 80576512. Throughput: 0: 1721.7, 1: 1716.4. Samples: 20148666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:18:48,803][19739] Avg episode reward: [(0, '746.230'), (1, '738.220')] +[2023-10-08 17:18:50,948][21195] Updated weights for policy 0, policy_version 39490 (0.0008) +[2023-10-08 17:18:51,324][21195] Updated weights for policy 0, policy_version 39500 (0.0008) +[2023-10-08 17:18:51,697][21195] Updated weights for policy 0, policy_version 39510 (0.0008) +[2023-10-08 17:18:52,032][21194] Updated weights for policy 1, policy_version 39210 (0.0008) +[2023-10-08 17:18:52,056][21195] Updated weights for policy 0, policy_version 39520 (0.0007) +[2023-10-08 17:18:52,405][21194] Updated weights for policy 1, policy_version 39220 (0.0010) +[2023-10-08 17:18:52,762][21194] Updated weights for policy 1, policy_version 39230 (0.0009) +[2023-10-08 17:18:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 80642048. Throughput: 0: 1723.5, 1: 1709.6. Samples: 20163854. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:18:53,803][19739] Avg episode reward: [(0, '746.040'), (1, '738.220')] +[2023-10-08 17:18:55,898][21195] Updated weights for policy 0, policy_version 39530 (0.0008) +[2023-10-08 17:18:56,266][21195] Updated weights for policy 0, policy_version 39540 (0.0008) +[2023-10-08 17:18:56,635][21195] Updated weights for policy 0, policy_version 39550 (0.0007) +[2023-10-08 17:18:56,890][21194] Updated weights for policy 1, policy_version 39240 (0.0010) +[2023-10-08 17:18:57,251][21194] Updated weights for policy 1, policy_version 39250 (0.0010) +[2023-10-08 17:18:57,618][21194] Updated weights for policy 1, policy_version 39260 (0.0012) +[2023-10-08 17:18:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 80707584. Throughput: 0: 1718.1, 1: 1686.8. Samples: 20184108. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:18:58,803][19739] Avg episode reward: [(0, '746.040'), (1, '726.060')] +[2023-10-08 17:19:00,355][21195] Updated weights for policy 0, policy_version 39560 (0.0009) +[2023-10-08 17:19:00,725][21195] Updated weights for policy 0, policy_version 39570 (0.0010) +[2023-10-08 17:19:01,096][21195] Updated weights for policy 0, policy_version 39580 (0.0009) +[2023-10-08 17:19:01,551][21194] Updated weights for policy 1, policy_version 39270 (0.0008) +[2023-10-08 17:19:01,917][21194] Updated weights for policy 1, policy_version 39280 (0.0009) +[2023-10-08 17:19:02,284][21194] Updated weights for policy 1, policy_version 39290 (0.0007) +[2023-10-08 17:19:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 80773120. Throughput: 0: 1746.6, 1: 1718.9. Samples: 20201026. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:19:03,804][19739] Avg episode reward: [(0, '748.870'), (1, '726.350')] +[2023-10-08 17:19:04,975][21195] Updated weights for policy 0, policy_version 39590 (0.0009) +[2023-10-08 17:19:05,343][21195] Updated weights for policy 0, policy_version 39600 (0.0009) +[2023-10-08 17:19:05,711][21195] Updated weights for policy 0, policy_version 39610 (0.0008) +[2023-10-08 17:19:06,137][21194] Updated weights for policy 1, policy_version 39300 (0.0007) +[2023-10-08 17:19:06,508][21194] Updated weights for policy 1, policy_version 39310 (0.0008) +[2023-10-08 17:19:06,870][21194] Updated weights for policy 1, policy_version 39320 (0.0009) +[2023-10-08 17:19:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 80838656. Throughput: 0: 1719.4, 1: 1703.7. Samples: 20215488. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:19:08,803][19739] Avg episode reward: [(0, '748.870'), (1, '726.350')] +[2023-10-08 17:19:09,594][21195] Updated weights for policy 0, policy_version 39620 (0.0008) +[2023-10-08 17:19:09,966][21195] Updated weights for policy 0, policy_version 39630 (0.0009) +[2023-10-08 17:19:10,341][21195] Updated weights for policy 0, policy_version 39640 (0.0009) +[2023-10-08 17:19:10,701][21194] Updated weights for policy 1, policy_version 39330 (0.0008) +[2023-10-08 17:19:11,063][21194] Updated weights for policy 1, policy_version 39340 (0.0007) +[2023-10-08 17:19:11,433][21194] Updated weights for policy 1, policy_version 39350 (0.0010) +[2023-10-08 17:19:11,796][21194] Updated weights for policy 1, policy_version 39360 (0.0011) +[2023-10-08 17:19:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 80904192. Throughput: 0: 1744.1, 1: 1703.5. Samples: 20236706. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:19:13,803][19739] Avg episode reward: [(0, '750.700'), (1, '726.350')] +[2023-10-08 17:19:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000039360_40304640.pth... +[2023-10-08 17:19:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000039648_40599552.pth... +[2023-10-08 17:19:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000037760_38666240.pth +[2023-10-08 17:19:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000038048_38961152.pth +[2023-10-08 17:19:14,217][21195] Updated weights for policy 0, policy_version 39650 (0.0008) +[2023-10-08 17:19:14,612][21195] Updated weights for policy 0, policy_version 39660 (0.0009) +[2023-10-08 17:19:14,986][21195] Updated weights for policy 0, policy_version 39670 (0.0009) +[2023-10-08 17:19:15,350][21195] Updated weights for policy 0, policy_version 39680 (0.0009) +[2023-10-08 17:19:15,664][21194] Updated weights for policy 1, policy_version 39370 (0.0008) +[2023-10-08 17:19:16,038][21194] Updated weights for policy 1, policy_version 39380 (0.0007) +[2023-10-08 17:19:16,402][21194] Updated weights for policy 1, policy_version 39390 (0.0008) +[2023-10-08 17:19:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 80969728. Throughput: 0: 1759.0, 1: 1709.6. Samples: 20252726. Policy #0 lag: (min: 17.0, avg: 33.2, max: 49.0) +[2023-10-08 17:19:18,803][19739] Avg episode reward: [(0, '750.240'), (1, '726.350')] +[2023-10-08 17:19:19,017][21195] Updated weights for policy 0, policy_version 39690 (0.0009) +[2023-10-08 17:19:19,383][21195] Updated weights for policy 0, policy_version 39700 (0.0008) +[2023-10-08 17:19:19,759][21195] Updated weights for policy 0, policy_version 39710 (0.0007) +[2023-10-08 17:19:20,410][21194] Updated weights for policy 1, policy_version 39400 (0.0009) +[2023-10-08 17:19:20,773][21194] Updated weights for policy 1, policy_version 39410 (0.0008) +[2023-10-08 17:19:21,139][21194] Updated weights for policy 1, policy_version 39420 (0.0009) +[2023-10-08 17:19:23,714][21195] Updated weights for policy 0, policy_version 39720 (0.0008) +[2023-10-08 17:19:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 81035264. Throughput: 0: 1735.6, 1: 1695.1. Samples: 20267672. Policy #0 lag: (min: 17.0, avg: 33.2, max: 49.0) +[2023-10-08 17:19:23,803][19739] Avg episode reward: [(0, '715.450'), (1, '726.610')] +[2023-10-08 17:19:24,085][21195] Updated weights for policy 0, policy_version 39730 (0.0009) +[2023-10-08 17:19:24,455][21195] Updated weights for policy 0, policy_version 39740 (0.0008) +[2023-10-08 17:19:25,151][21194] Updated weights for policy 1, policy_version 39430 (0.0010) +[2023-10-08 17:19:25,518][21194] Updated weights for policy 1, policy_version 39440 (0.0011) +[2023-10-08 17:19:25,872][21194] Updated weights for policy 1, policy_version 39450 (0.0010) +[2023-10-08 17:19:28,240][21195] Updated weights for policy 0, policy_version 39750 (0.0009) +[2023-10-08 17:19:28,608][21195] Updated weights for policy 0, policy_version 39760 (0.0007) +[2023-10-08 17:19:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 81100800. Throughput: 0: 1767.8, 1: 1723.4. Samples: 20289312. Policy #0 lag: (min: 17.0, avg: 33.2, max: 49.0) +[2023-10-08 17:19:28,803][19739] Avg episode reward: [(0, '724.150'), (1, '739.560')] +[2023-10-08 17:19:28,982][21195] Updated weights for policy 0, policy_version 39770 (0.0009) +[2023-10-08 17:19:29,884][21194] Updated weights for policy 1, policy_version 39460 (0.0010) +[2023-10-08 17:19:30,275][21194] Updated weights for policy 1, policy_version 39470 (0.0007) +[2023-10-08 17:19:30,642][21194] Updated weights for policy 1, policy_version 39480 (0.0008) +[2023-10-08 17:19:32,798][21195] Updated weights for policy 0, policy_version 39780 (0.0011) +[2023-10-08 17:19:33,167][21195] Updated weights for policy 0, policy_version 39790 (0.0008) +[2023-10-08 17:19:33,535][21195] Updated weights for policy 0, policy_version 39800 (0.0007) +[2023-10-08 17:19:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 81166336. Throughput: 0: 1738.9, 1: 1702.6. Samples: 20303530. Policy #0 lag: (min: 17.0, avg: 33.2, max: 49.0) +[2023-10-08 17:19:33,803][19739] Avg episode reward: [(0, '724.150'), (1, '739.560')] +[2023-10-08 17:19:34,602][21194] Updated weights for policy 1, policy_version 39490 (0.0008) +[2023-10-08 17:19:34,973][21194] Updated weights for policy 1, policy_version 39500 (0.0009) +[2023-10-08 17:19:35,336][21194] Updated weights for policy 1, policy_version 39510 (0.0009) +[2023-10-08 17:19:35,703][21194] Updated weights for policy 1, policy_version 39520 (0.0010) +[2023-10-08 17:19:37,645][21195] Updated weights for policy 0, policy_version 39810 (0.0009) +[2023-10-08 17:19:38,010][21195] Updated weights for policy 0, policy_version 39820 (0.0009) +[2023-10-08 17:19:38,383][21195] Updated weights for policy 0, policy_version 39830 (0.0007) +[2023-10-08 17:19:38,748][21195] Updated weights for policy 0, policy_version 39840 (0.0009) +[2023-10-08 17:19:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 81264640. Throughput: 0: 1754.3, 1: 1718.2. Samples: 20320116. Policy #0 lag: (min: 17.0, avg: 33.2, max: 49.0) +[2023-10-08 17:19:38,803][19739] Avg episode reward: [(0, '724.150'), (1, '739.560')] +[2023-10-08 17:19:39,589][21194] Updated weights for policy 1, policy_version 39530 (0.0011) +[2023-10-08 17:19:39,961][21194] Updated weights for policy 1, policy_version 39540 (0.0008) +[2023-10-08 17:19:40,319][21194] Updated weights for policy 1, policy_version 39550 (0.0010) +[2023-10-08 17:19:42,753][21195] Updated weights for policy 0, policy_version 39850 (0.0007) +[2023-10-08 17:19:43,116][21195] Updated weights for policy 0, policy_version 39860 (0.0008) +[2023-10-08 17:19:43,490][21195] Updated weights for policy 0, policy_version 39870 (0.0008) +[2023-10-08 17:19:43,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 81330176. Throughput: 0: 1747.9, 1: 1744.1. Samples: 20341246. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 17:19:43,803][19739] Avg episode reward: [(0, '724.150'), (1, '739.560')] +[2023-10-08 17:19:44,357][21194] Updated weights for policy 1, policy_version 39560 (0.0008) +[2023-10-08 17:19:44,725][21194] Updated weights for policy 1, policy_version 39570 (0.0007) +[2023-10-08 17:19:45,088][21194] Updated weights for policy 1, policy_version 39580 (0.0010) +[2023-10-08 17:19:47,411][21195] Updated weights for policy 0, policy_version 39880 (0.0010) +[2023-10-08 17:19:47,774][21195] Updated weights for policy 0, policy_version 39890 (0.0008) +[2023-10-08 17:19:48,143][21195] Updated weights for policy 0, policy_version 39900 (0.0007) +[2023-10-08 17:19:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 81395712. Throughput: 0: 1728.5, 1: 1711.5. Samples: 20355822. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 17:19:48,803][19739] Avg episode reward: [(0, '724.150'), (1, '739.560')] +[2023-10-08 17:19:49,089][21194] Updated weights for policy 1, policy_version 39590 (0.0008) +[2023-10-08 17:19:49,460][21194] Updated weights for policy 1, policy_version 39600 (0.0009) +[2023-10-08 17:19:49,827][21194] Updated weights for policy 1, policy_version 39610 (0.0008) +[2023-10-08 17:19:52,064][21195] Updated weights for policy 0, policy_version 39910 (0.0008) +[2023-10-08 17:19:52,435][21195] Updated weights for policy 0, policy_version 39920 (0.0007) +[2023-10-08 17:19:52,803][21195] Updated weights for policy 0, policy_version 39930 (0.0007) +[2023-10-08 17:19:53,714][21194] Updated weights for policy 1, policy_version 39620 (0.0007) +[2023-10-08 17:19:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 81461248. Throughput: 0: 1757.0, 1: 1732.4. Samples: 20372508. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 17:19:53,803][19739] Avg episode reward: [(0, '724.150'), (1, '739.560')] +[2023-10-08 17:19:54,078][21194] Updated weights for policy 1, policy_version 39630 (0.0008) +[2023-10-08 17:19:54,452][21194] Updated weights for policy 1, policy_version 39640 (0.0008) +[2023-10-08 17:19:56,672][21195] Updated weights for policy 0, policy_version 39940 (0.0008) +[2023-10-08 17:19:57,046][21195] Updated weights for policy 0, policy_version 39950 (0.0010) +[2023-10-08 17:19:57,426][21195] Updated weights for policy 0, policy_version 39960 (0.0011) +[2023-10-08 17:19:58,271][21194] Updated weights for policy 1, policy_version 39650 (0.0008) +[2023-10-08 17:19:58,639][21194] Updated weights for policy 1, policy_version 39660 (0.0008) +[2023-10-08 17:19:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 81526784. Throughput: 0: 1722.9, 1: 1745.3. Samples: 20392776. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 17:19:58,803][19739] Avg episode reward: [(0, '745.630'), (1, '739.830')] +[2023-10-08 17:19:59,007][21194] Updated weights for policy 1, policy_version 39670 (0.0009) +[2023-10-08 17:19:59,373][21194] Updated weights for policy 1, policy_version 39680 (0.0009) +[2023-10-08 17:20:01,426][21195] Updated weights for policy 0, policy_version 39970 (0.0010) +[2023-10-08 17:20:01,832][21195] Updated weights for policy 0, policy_version 39980 (0.0010) +[2023-10-08 17:20:02,203][21195] Updated weights for policy 0, policy_version 39990 (0.0010) +[2023-10-08 17:20:02,581][21195] Updated weights for policy 0, policy_version 40000 (0.0007) +[2023-10-08 17:20:03,326][21194] Updated weights for policy 1, policy_version 39690 (0.0010) +[2023-10-08 17:20:03,696][21194] Updated weights for policy 1, policy_version 39700 (0.0010) +[2023-10-08 17:20:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 81592320. Throughput: 0: 1718.8, 1: 1730.7. Samples: 20407950. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 17:20:03,804][19739] Avg episode reward: [(0, '745.630'), (1, '739.830')] +[2023-10-08 17:20:04,065][21194] Updated weights for policy 1, policy_version 39710 (0.0009) +[2023-10-08 17:20:06,535][21195] Updated weights for policy 0, policy_version 40010 (0.0011) +[2023-10-08 17:20:06,899][21195] Updated weights for policy 0, policy_version 40020 (0.0010) +[2023-10-08 17:20:07,279][21195] Updated weights for policy 0, policy_version 40030 (0.0007) +[2023-10-08 17:20:07,894][21194] Updated weights for policy 1, policy_version 39720 (0.0008) +[2023-10-08 17:20:08,257][21194] Updated weights for policy 1, policy_version 39730 (0.0009) +[2023-10-08 17:20:08,627][21194] Updated weights for policy 1, policy_version 39740 (0.0009) +[2023-10-08 17:20:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 81690624. Throughput: 0: 1730.6, 1: 1742.9. Samples: 20423980. Policy #0 lag: (min: 31.0, avg: 41.6, max: 63.0) +[2023-10-08 17:20:08,803][19739] Avg episode reward: [(0, '749.300'), (1, '740.000')] +[2023-10-08 17:20:11,030][21195] Updated weights for policy 0, policy_version 40040 (0.0008) +[2023-10-08 17:20:11,392][21195] Updated weights for policy 0, policy_version 40050 (0.0009) +[2023-10-08 17:20:11,761][21195] Updated weights for policy 0, policy_version 40060 (0.0009) +[2023-10-08 17:20:12,642][21194] Updated weights for policy 1, policy_version 39750 (0.0009) +[2023-10-08 17:20:13,001][21194] Updated weights for policy 1, policy_version 39760 (0.0008) +[2023-10-08 17:20:13,380][21194] Updated weights for policy 1, policy_version 39770 (0.0008) +[2023-10-08 17:20:13,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 81756160. Throughput: 0: 1712.5, 1: 1729.4. Samples: 20444198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:13,803][19739] Avg episode reward: [(0, '747.160'), (1, '740.000')] +[2023-10-08 17:20:15,629][21195] Updated weights for policy 0, policy_version 40070 (0.0010) +[2023-10-08 17:20:16,001][21195] Updated weights for policy 0, policy_version 40080 (0.0008) +[2023-10-08 17:20:16,372][21195] Updated weights for policy 0, policy_version 40090 (0.0010) +[2023-10-08 17:20:17,356][21194] Updated weights for policy 1, policy_version 39780 (0.0008) +[2023-10-08 17:20:17,731][21194] Updated weights for policy 1, policy_version 39790 (0.0007) +[2023-10-08 17:20:18,089][21194] Updated weights for policy 1, policy_version 39800 (0.0007) +[2023-10-08 17:20:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 81821696. Throughput: 0: 1741.1, 1: 1744.8. Samples: 20460398. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:18,803][19739] Avg episode reward: [(0, '733.250'), (1, '740.000')] +[2023-10-08 17:20:20,354][21195] Updated weights for policy 0, policy_version 40100 (0.0010) +[2023-10-08 17:20:20,721][21195] Updated weights for policy 0, policy_version 40110 (0.0008) +[2023-10-08 17:20:21,077][21195] Updated weights for policy 0, policy_version 40120 (0.0007) +[2023-10-08 17:20:22,156][21194] Updated weights for policy 1, policy_version 39810 (0.0008) +[2023-10-08 17:20:22,528][21194] Updated weights for policy 1, policy_version 39820 (0.0007) +[2023-10-08 17:20:22,885][21194] Updated weights for policy 1, policy_version 39830 (0.0007) +[2023-10-08 17:20:23,249][21194] Updated weights for policy 1, policy_version 39840 (0.0010) +[2023-10-08 17:20:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 81887232. Throughput: 0: 1717.7, 1: 1742.1. Samples: 20475810. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:23,803][19739] Avg episode reward: [(0, '733.250'), (1, '740.000')] +[2023-10-08 17:20:24,974][21195] Updated weights for policy 0, policy_version 40130 (0.0009) +[2023-10-08 17:20:25,339][21195] Updated weights for policy 0, policy_version 40140 (0.0008) +[2023-10-08 17:20:25,706][21195] Updated weights for policy 0, policy_version 40150 (0.0009) +[2023-10-08 17:20:26,077][21195] Updated weights for policy 0, policy_version 40160 (0.0007) +[2023-10-08 17:20:27,087][21194] Updated weights for policy 1, policy_version 39850 (0.0009) +[2023-10-08 17:20:27,455][21194] Updated weights for policy 1, policy_version 39860 (0.0011) +[2023-10-08 17:20:27,818][21194] Updated weights for policy 1, policy_version 39870 (0.0010) +[2023-10-08 17:20:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 81952768. Throughput: 0: 1728.0, 1: 1711.2. Samples: 20496012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:28,803][19739] Avg episode reward: [(0, '733.250'), (1, '747.710')] +[2023-10-08 17:20:30,093][21195] Updated weights for policy 0, policy_version 40170 (0.0010) +[2023-10-08 17:20:30,459][21195] Updated weights for policy 0, policy_version 40180 (0.0011) +[2023-10-08 17:20:30,827][21195] Updated weights for policy 0, policy_version 40190 (0.0008) +[2023-10-08 17:20:31,758][21194] Updated weights for policy 1, policy_version 39880 (0.0009) +[2023-10-08 17:20:32,111][21194] Updated weights for policy 1, policy_version 39890 (0.0011) +[2023-10-08 17:20:32,476][21194] Updated weights for policy 1, policy_version 39900 (0.0008) +[2023-10-08 17:20:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 82018304. Throughput: 0: 1741.5, 1: 1742.2. Samples: 20512588. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:33,803][19739] Avg episode reward: [(0, '733.250'), (1, '747.710')] +[2023-10-08 17:20:34,765][21195] Updated weights for policy 0, policy_version 40200 (0.0008) +[2023-10-08 17:20:35,134][21195] Updated weights for policy 0, policy_version 40210 (0.0008) +[2023-10-08 17:20:35,504][21195] Updated weights for policy 0, policy_version 40220 (0.0010) +[2023-10-08 17:20:36,430][21194] Updated weights for policy 1, policy_version 39910 (0.0008) +[2023-10-08 17:20:36,793][21194] Updated weights for policy 1, policy_version 39920 (0.0009) +[2023-10-08 17:20:37,157][21194] Updated weights for policy 1, policy_version 39930 (0.0010) +[2023-10-08 17:20:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82083840. Throughput: 0: 1708.1, 1: 1725.9. Samples: 20527038. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:38,803][19739] Avg episode reward: [(0, '746.090'), (1, '747.570')] +[2023-10-08 17:20:39,442][21195] Updated weights for policy 0, policy_version 40230 (0.0009) +[2023-10-08 17:20:39,814][21195] Updated weights for policy 0, policy_version 40240 (0.0008) +[2023-10-08 17:20:40,178][21195] Updated weights for policy 0, policy_version 40250 (0.0008) +[2023-10-08 17:20:41,229][21194] Updated weights for policy 1, policy_version 39940 (0.0011) +[2023-10-08 17:20:41,590][21194] Updated weights for policy 1, policy_version 39950 (0.0011) +[2023-10-08 17:20:41,962][21194] Updated weights for policy 1, policy_version 39960 (0.0010) +[2023-10-08 17:20:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82149376. Throughput: 0: 1740.3, 1: 1707.4. Samples: 20547922. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:43,803][19739] Avg episode reward: [(0, '746.090'), (1, '747.570')] +[2023-10-08 17:20:44,067][21195] Updated weights for policy 0, policy_version 40260 (0.0011) +[2023-10-08 17:20:44,437][21195] Updated weights for policy 0, policy_version 40270 (0.0007) +[2023-10-08 17:20:44,802][21195] Updated weights for policy 0, policy_version 40280 (0.0008) +[2023-10-08 17:20:45,828][21194] Updated weights for policy 1, policy_version 39970 (0.0009) +[2023-10-08 17:20:46,198][21194] Updated weights for policy 1, policy_version 39980 (0.0007) +[2023-10-08 17:20:46,564][21194] Updated weights for policy 1, policy_version 39990 (0.0007) +[2023-10-08 17:20:46,925][21194] Updated weights for policy 1, policy_version 40000 (0.0008) +[2023-10-08 17:20:48,656][21195] Updated weights for policy 0, policy_version 40290 (0.0009) +[2023-10-08 17:20:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82214912. Throughput: 0: 1746.7, 1: 1730.0. Samples: 20564398. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:48,803][19739] Avg episode reward: [(0, '733.540'), (1, '747.570')] +[2023-10-08 17:20:49,016][21195] Updated weights for policy 0, policy_version 40300 (0.0007) +[2023-10-08 17:20:49,386][21195] Updated weights for policy 0, policy_version 40310 (0.0008) +[2023-10-08 17:20:49,762][21195] Updated weights for policy 0, policy_version 40320 (0.0008) +[2023-10-08 17:20:50,943][21194] Updated weights for policy 1, policy_version 40010 (0.0007) +[2023-10-08 17:20:51,304][21194] Updated weights for policy 1, policy_version 40020 (0.0007) +[2023-10-08 17:20:51,673][21194] Updated weights for policy 1, policy_version 40030 (0.0008) +[2023-10-08 17:20:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82280448. Throughput: 0: 1736.5, 1: 1703.8. Samples: 20578794. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:53,803][19739] Avg episode reward: [(0, '737.990'), (1, '747.570')] +[2023-10-08 17:20:53,825][21195] Updated weights for policy 0, policy_version 40330 (0.0011) +[2023-10-08 17:20:54,201][21195] Updated weights for policy 0, policy_version 40340 (0.0008) +[2023-10-08 17:20:54,570][21195] Updated weights for policy 0, policy_version 40350 (0.0008) +[2023-10-08 17:20:55,633][21194] Updated weights for policy 1, policy_version 40040 (0.0010) +[2023-10-08 17:20:55,998][21194] Updated weights for policy 1, policy_version 40050 (0.0009) +[2023-10-08 17:20:56,359][21194] Updated weights for policy 1, policy_version 40060 (0.0010) +[2023-10-08 17:20:58,282][21195] Updated weights for policy 0, policy_version 40360 (0.0007) +[2023-10-08 17:20:58,650][21195] Updated weights for policy 0, policy_version 40370 (0.0007) +[2023-10-08 17:20:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82345984. Throughput: 0: 1752.4, 1: 1721.0. Samples: 20600502. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:20:58,803][19739] Avg episode reward: [(0, '737.990'), (1, '747.570')] +[2023-10-08 17:20:59,014][21195] Updated weights for policy 0, policy_version 40380 (0.0009) +[2023-10-08 17:21:00,322][21194] Updated weights for policy 1, policy_version 40070 (0.0009) +[2023-10-08 17:21:00,691][21194] Updated weights for policy 1, policy_version 40080 (0.0008) +[2023-10-08 17:21:01,065][21194] Updated weights for policy 1, policy_version 40090 (0.0008) +[2023-10-08 17:21:02,829][21195] Updated weights for policy 0, policy_version 40390 (0.0008) +[2023-10-08 17:21:03,202][21195] Updated weights for policy 0, policy_version 40400 (0.0009) +[2023-10-08 17:21:03,565][21195] Updated weights for policy 0, policy_version 40410 (0.0009) +[2023-10-08 17:21:03,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 82444288. Throughput: 0: 1723.6, 1: 1709.5. Samples: 20614886. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:21:03,804][19739] Avg episode reward: [(0, '737.990'), (1, '747.570')] +[2023-10-08 17:21:04,854][21194] Updated weights for policy 1, policy_version 40100 (0.0008) +[2023-10-08 17:21:05,250][21194] Updated weights for policy 1, policy_version 40110 (0.0007) +[2023-10-08 17:21:05,611][21194] Updated weights for policy 1, policy_version 40120 (0.0008) +[2023-10-08 17:21:07,465][21195] Updated weights for policy 0, policy_version 40420 (0.0010) +[2023-10-08 17:21:07,834][21195] Updated weights for policy 0, policy_version 40430 (0.0010) +[2023-10-08 17:21:08,186][21195] Updated weights for policy 0, policy_version 40440 (0.0011) +[2023-10-08 17:21:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 82509824. Throughput: 0: 1753.4, 1: 1702.5. Samples: 20631326. Policy #0 lag: (min: 9.0, avg: 21.4, max: 41.0) +[2023-10-08 17:21:08,803][19739] Avg episode reward: [(0, '751.900'), (1, '746.740')] +[2023-10-08 17:21:09,562][21194] Updated weights for policy 1, policy_version 40130 (0.0009) +[2023-10-08 17:21:09,926][21194] Updated weights for policy 1, policy_version 40140 (0.0008) +[2023-10-08 17:21:10,299][21194] Updated weights for policy 1, policy_version 40150 (0.0009) +[2023-10-08 17:21:10,659][21194] Updated weights for policy 1, policy_version 40160 (0.0009) +[2023-10-08 17:21:12,251][21195] Updated weights for policy 0, policy_version 40450 (0.0010) +[2023-10-08 17:21:12,610][21195] Updated weights for policy 0, policy_version 40460 (0.0007) +[2023-10-08 17:21:12,976][21195] Updated weights for policy 0, policy_version 40470 (0.0010) +[2023-10-08 17:21:13,339][21195] Updated weights for policy 0, policy_version 40480 (0.0010) +[2023-10-08 17:21:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 82575360. Throughput: 0: 1737.1, 1: 1726.5. Samples: 20651876. Policy #0 lag: (min: 9.0, avg: 21.4, max: 41.0) +[2023-10-08 17:21:13,803][19739] Avg episode reward: [(0, '751.900'), (1, '726.700')] +[2023-10-08 17:21:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000040160_41123840.pth... +[2023-10-08 17:21:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000040480_41451520.pth... +[2023-10-08 17:21:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000038848_39780352.pth +[2023-10-08 17:21:13,853][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000038560_39485440.pth +[2023-10-08 17:21:13,855][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000040480_41451520.pth +[2023-10-08 17:21:13,857][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000040160_41123840.pth +[2023-10-08 17:21:14,647][21194] Updated weights for policy 1, policy_version 40170 (0.0009) +[2023-10-08 17:21:15,011][21194] Updated weights for policy 1, policy_version 40180 (0.0007) +[2023-10-08 17:21:15,385][21194] Updated weights for policy 1, policy_version 40190 (0.0012) +[2023-10-08 17:21:17,194][21195] Updated weights for policy 0, policy_version 40490 (0.0007) +[2023-10-08 17:21:17,556][21195] Updated weights for policy 0, policy_version 40500 (0.0007) +[2023-10-08 17:21:17,934][21195] Updated weights for policy 0, policy_version 40510 (0.0007) +[2023-10-08 17:21:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 82640896. Throughput: 0: 1721.6, 1: 1698.7. Samples: 20666502. Policy #0 lag: (min: 9.0, avg: 21.4, max: 41.0) +[2023-10-08 17:21:18,803][19739] Avg episode reward: [(0, '751.900'), (1, '726.700')] +[2023-10-08 17:21:19,346][21194] Updated weights for policy 1, policy_version 40200 (0.0008) +[2023-10-08 17:21:19,706][21194] Updated weights for policy 1, policy_version 40210 (0.0007) +[2023-10-08 17:21:20,083][21194] Updated weights for policy 1, policy_version 40220 (0.0008) +[2023-10-08 17:21:21,933][21195] Updated weights for policy 0, policy_version 40520 (0.0009) +[2023-10-08 17:21:22,297][21195] Updated weights for policy 0, policy_version 40530 (0.0010) +[2023-10-08 17:21:22,669][21195] Updated weights for policy 0, policy_version 40540 (0.0008) +[2023-10-08 17:21:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 82706432. Throughput: 0: 1746.8, 1: 1716.0. Samples: 20682860. Policy #0 lag: (min: 9.0, avg: 21.4, max: 41.0) +[2023-10-08 17:21:23,803][19739] Avg episode reward: [(0, '751.900'), (1, '726.700')] +[2023-10-08 17:21:24,002][21194] Updated weights for policy 1, policy_version 40230 (0.0007) +[2023-10-08 17:21:24,379][21194] Updated weights for policy 1, policy_version 40240 (0.0008) +[2023-10-08 17:21:24,747][21194] Updated weights for policy 1, policy_version 40250 (0.0007) +[2023-10-08 17:21:26,567][21195] Updated weights for policy 0, policy_version 40550 (0.0009) +[2023-10-08 17:21:26,934][21195] Updated weights for policy 0, policy_version 40560 (0.0011) +[2023-10-08 17:21:27,312][21195] Updated weights for policy 0, policy_version 40570 (0.0008) +[2023-10-08 17:21:28,798][21194] Updated weights for policy 1, policy_version 40260 (0.0008) +[2023-10-08 17:21:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 82771968. Throughput: 0: 1722.8, 1: 1728.3. Samples: 20703220. Policy #0 lag: (min: 9.0, avg: 21.4, max: 41.0) +[2023-10-08 17:21:28,803][19739] Avg episode reward: [(0, '751.900'), (1, '726.700')] +[2023-10-08 17:21:29,165][21194] Updated weights for policy 1, policy_version 40270 (0.0011) +[2023-10-08 17:21:29,542][21194] Updated weights for policy 1, policy_version 40280 (0.0010) +[2023-10-08 17:21:31,127][21195] Updated weights for policy 0, policy_version 40580 (0.0007) +[2023-10-08 17:21:31,499][21195] Updated weights for policy 0, policy_version 40590 (0.0008) +[2023-10-08 17:21:31,863][21195] Updated weights for policy 0, policy_version 40600 (0.0010) +[2023-10-08 17:21:33,453][21194] Updated weights for policy 1, policy_version 40290 (0.0009) +[2023-10-08 17:21:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82837504. Throughput: 0: 1728.5, 1: 1704.6. Samples: 20718886. Policy #0 lag: (min: 9.0, avg: 21.4, max: 41.0) +[2023-10-08 17:21:33,803][19739] Avg episode reward: [(0, '730.430'), (1, '726.700')] +[2023-10-08 17:21:33,822][21194] Updated weights for policy 1, policy_version 40300 (0.0007) +[2023-10-08 17:21:34,185][21194] Updated weights for policy 1, policy_version 40310 (0.0007) +[2023-10-08 17:21:34,547][21194] Updated weights for policy 1, policy_version 40320 (0.0008) +[2023-10-08 17:21:35,862][21195] Updated weights for policy 0, policy_version 40610 (0.0010) +[2023-10-08 17:21:36,263][21195] Updated weights for policy 0, policy_version 40620 (0.0009) +[2023-10-08 17:21:36,633][21195] Updated weights for policy 0, policy_version 40630 (0.0010) +[2023-10-08 17:21:37,004][21195] Updated weights for policy 0, policy_version 40640 (0.0009) +[2023-10-08 17:21:38,708][21194] Updated weights for policy 1, policy_version 40330 (0.0011) +[2023-10-08 17:21:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82903040. Throughput: 0: 1729.2, 1: 1728.2. Samples: 20734376. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 17:21:38,803][19739] Avg episode reward: [(0, '730.430'), (1, '741.590')] +[2023-10-08 17:21:39,074][21194] Updated weights for policy 1, policy_version 40340 (0.0012) +[2023-10-08 17:21:39,444][21194] Updated weights for policy 1, policy_version 40350 (0.0008) +[2023-10-08 17:21:40,793][21195] Updated weights for policy 0, policy_version 40650 (0.0009) +[2023-10-08 17:21:41,161][21195] Updated weights for policy 0, policy_version 40660 (0.0009) +[2023-10-08 17:21:41,532][21195] Updated weights for policy 0, policy_version 40670 (0.0007) +[2023-10-08 17:21:43,390][21194] Updated weights for policy 1, policy_version 40360 (0.0008) +[2023-10-08 17:21:43,752][21194] Updated weights for policy 1, policy_version 40370 (0.0008) +[2023-10-08 17:21:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 82968576. Throughput: 0: 1718.5, 1: 1724.3. Samples: 20755428. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 17:21:43,803][19739] Avg episode reward: [(0, '730.430'), (1, '741.590')] +[2023-10-08 17:21:44,121][21194] Updated weights for policy 1, policy_version 40380 (0.0007) +[2023-10-08 17:21:45,452][21195] Updated weights for policy 0, policy_version 40680 (0.0010) +[2023-10-08 17:21:45,819][21195] Updated weights for policy 0, policy_version 40690 (0.0008) +[2023-10-08 17:21:46,187][21195] Updated weights for policy 0, policy_version 40700 (0.0009) +[2023-10-08 17:21:47,975][21194] Updated weights for policy 1, policy_version 40390 (0.0007) +[2023-10-08 17:21:48,333][21194] Updated weights for policy 1, policy_version 40400 (0.0007) +[2023-10-08 17:21:48,697][21194] Updated weights for policy 1, policy_version 40410 (0.0009) +[2023-10-08 17:21:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 83034112. Throughput: 0: 1744.7, 1: 1719.9. Samples: 20770790. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 17:21:48,803][19739] Avg episode reward: [(0, '730.430'), (1, '756.720')] +[2023-10-08 17:21:50,198][21195] Updated weights for policy 0, policy_version 40710 (0.0008) +[2023-10-08 17:21:50,564][21195] Updated weights for policy 0, policy_version 40720 (0.0007) +[2023-10-08 17:21:50,938][21195] Updated weights for policy 0, policy_version 40730 (0.0009) +[2023-10-08 17:21:52,742][21194] Updated weights for policy 1, policy_version 40420 (0.0007) +[2023-10-08 17:21:53,128][21194] Updated weights for policy 1, policy_version 40430 (0.0009) +[2023-10-08 17:21:53,487][21194] Updated weights for policy 1, policy_version 40440 (0.0011) +[2023-10-08 17:21:53,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 83132416. Throughput: 0: 1711.2, 1: 1733.2. Samples: 20786324. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 17:21:53,804][19739] Avg episode reward: [(0, '730.430'), (1, '756.720')] +[2023-10-08 17:21:54,741][21195] Updated weights for policy 0, policy_version 40740 (0.0009) +[2023-10-08 17:21:55,117][21195] Updated weights for policy 0, policy_version 40750 (0.0007) +[2023-10-08 17:21:55,480][21195] Updated weights for policy 0, policy_version 40760 (0.0007) +[2023-10-08 17:21:57,331][21194] Updated weights for policy 1, policy_version 40450 (0.0011) +[2023-10-08 17:21:57,695][21194] Updated weights for policy 1, policy_version 40460 (0.0010) +[2023-10-08 17:21:58,067][21194] Updated weights for policy 1, policy_version 40470 (0.0009) +[2023-10-08 17:21:58,424][21194] Updated weights for policy 1, policy_version 40480 (0.0009) +[2023-10-08 17:21:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 83197952. Throughput: 0: 1733.1, 1: 1715.9. Samples: 20807082. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 17:21:58,803][19739] Avg episode reward: [(0, '733.080'), (1, '761.180')] +[2023-10-08 17:21:59,604][21195] Updated weights for policy 0, policy_version 40770 (0.0008) +[2023-10-08 17:21:59,971][21195] Updated weights for policy 0, policy_version 40780 (0.0007) +[2023-10-08 17:22:00,343][21195] Updated weights for policy 0, policy_version 40790 (0.0009) +[2023-10-08 17:22:00,717][21195] Updated weights for policy 0, policy_version 40800 (0.0010) +[2023-10-08 17:22:02,378][21194] Updated weights for policy 1, policy_version 40490 (0.0007) +[2023-10-08 17:22:02,745][21194] Updated weights for policy 1, policy_version 40500 (0.0007) +[2023-10-08 17:22:03,111][21194] Updated weights for policy 1, policy_version 40510 (0.0007) +[2023-10-08 17:22:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 83263488. Throughput: 0: 1754.8, 1: 1735.5. Samples: 20823564. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 17:22:03,803][19739] Avg episode reward: [(0, '733.080'), (1, '768.190')] +[2023-10-08 17:22:04,491][21195] Updated weights for policy 0, policy_version 40810 (0.0009) +[2023-10-08 17:22:04,867][21195] Updated weights for policy 0, policy_version 40820 (0.0007) +[2023-10-08 17:22:05,232][21195] Updated weights for policy 0, policy_version 40830 (0.0008) +[2023-10-08 17:22:07,051][21194] Updated weights for policy 1, policy_version 40520 (0.0009) +[2023-10-08 17:22:07,407][21194] Updated weights for policy 1, policy_version 40530 (0.0009) +[2023-10-08 17:22:07,772][21194] Updated weights for policy 1, policy_version 40540 (0.0008) +[2023-10-08 17:22:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 83329024. Throughput: 0: 1732.4, 1: 1730.9. Samples: 20838708. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 17:22:08,803][19739] Avg episode reward: [(0, '726.140'), (1, '768.190')] +[2023-10-08 17:22:09,108][21195] Updated weights for policy 0, policy_version 40840 (0.0008) +[2023-10-08 17:22:09,485][21195] Updated weights for policy 0, policy_version 40850 (0.0008) +[2023-10-08 17:22:09,847][21195] Updated weights for policy 0, policy_version 40860 (0.0008) +[2023-10-08 17:22:11,732][21194] Updated weights for policy 1, policy_version 40550 (0.0009) +[2023-10-08 17:22:12,105][21194] Updated weights for policy 1, policy_version 40560 (0.0008) +[2023-10-08 17:22:12,470][21194] Updated weights for policy 1, policy_version 40570 (0.0008) +[2023-10-08 17:22:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 83394560. Throughput: 0: 1754.5, 1: 1705.4. Samples: 20858916. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 17:22:13,803][19739] Avg episode reward: [(0, '726.370'), (1, '768.190')] +[2023-10-08 17:22:13,850][21195] Updated weights for policy 0, policy_version 40870 (0.0008) +[2023-10-08 17:22:14,218][21195] Updated weights for policy 0, policy_version 40880 (0.0010) +[2023-10-08 17:22:14,580][21195] Updated weights for policy 0, policy_version 40890 (0.0009) +[2023-10-08 17:22:16,337][21194] Updated weights for policy 1, policy_version 40580 (0.0009) +[2023-10-08 17:22:16,700][21194] Updated weights for policy 1, policy_version 40590 (0.0007) +[2023-10-08 17:22:17,068][21194] Updated weights for policy 1, policy_version 40600 (0.0007) +[2023-10-08 17:22:18,523][21195] Updated weights for policy 0, policy_version 40900 (0.0010) +[2023-10-08 17:22:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 83460096. Throughput: 0: 1741.2, 1: 1733.8. Samples: 20875260. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 17:22:18,803][19739] Avg episode reward: [(0, '726.590'), (1, '728.050')] +[2023-10-08 17:22:18,890][21195] Updated weights for policy 0, policy_version 40910 (0.0009) +[2023-10-08 17:22:19,263][21195] Updated weights for policy 0, policy_version 40920 (0.0010) +[2023-10-08 17:22:21,027][21194] Updated weights for policy 1, policy_version 40610 (0.0009) +[2023-10-08 17:22:21,397][21194] Updated weights for policy 1, policy_version 40620 (0.0009) +[2023-10-08 17:22:21,751][21194] Updated weights for policy 1, policy_version 40630 (0.0009) +[2023-10-08 17:22:22,117][21194] Updated weights for policy 1, policy_version 40640 (0.0008) +[2023-10-08 17:22:23,369][21195] Updated weights for policy 0, policy_version 40930 (0.0007) +[2023-10-08 17:22:23,781][21195] Updated weights for policy 0, policy_version 40940 (0.0009) +[2023-10-08 17:22:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 83525632. Throughput: 0: 1746.0, 1: 1709.0. Samples: 20889852. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 17:22:23,804][19739] Avg episode reward: [(0, '737.950'), (1, '728.050')] +[2023-10-08 17:22:24,140][21195] Updated weights for policy 0, policy_version 40950 (0.0011) +[2023-10-08 17:22:24,509][21195] Updated weights for policy 0, policy_version 40960 (0.0009) +[2023-10-08 17:22:26,145][21194] Updated weights for policy 1, policy_version 40650 (0.0009) +[2023-10-08 17:22:26,501][21194] Updated weights for policy 1, policy_version 40660 (0.0007) +[2023-10-08 17:22:26,866][21194] Updated weights for policy 1, policy_version 40670 (0.0009) +[2023-10-08 17:22:28,260][21195] Updated weights for policy 0, policy_version 40970 (0.0010) +[2023-10-08 17:22:28,641][21195] Updated weights for policy 0, policy_version 40980 (0.0010) +[2023-10-08 17:22:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 83591168. Throughput: 0: 1752.6, 1: 1708.4. Samples: 20911174. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 17:22:28,803][19739] Avg episode reward: [(0, '737.950'), (1, '728.050')] +[2023-10-08 17:22:29,008][21195] Updated weights for policy 0, policy_version 40990 (0.0008) +[2023-10-08 17:22:30,917][21194] Updated weights for policy 1, policy_version 40680 (0.0007) +[2023-10-08 17:22:31,292][21194] Updated weights for policy 1, policy_version 40690 (0.0007) +[2023-10-08 17:22:31,655][21194] Updated weights for policy 1, policy_version 40700 (0.0008) +[2023-10-08 17:22:32,815][21195] Updated weights for policy 0, policy_version 41000 (0.0008) +[2023-10-08 17:22:33,181][21195] Updated weights for policy 0, policy_version 41010 (0.0008) +[2023-10-08 17:22:33,546][21195] Updated weights for policy 0, policy_version 41020 (0.0008) +[2023-10-08 17:22:33,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 83689472. Throughput: 0: 1722.1, 1: 1727.8. Samples: 20926034. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:22:33,804][19739] Avg episode reward: [(0, '709.710'), (1, '727.950')] +[2023-10-08 17:22:35,669][21194] Updated weights for policy 1, policy_version 40710 (0.0009) +[2023-10-08 17:22:36,029][21194] Updated weights for policy 1, policy_version 40720 (0.0008) +[2023-10-08 17:22:36,390][21194] Updated weights for policy 1, policy_version 40730 (0.0007) +[2023-10-08 17:22:37,343][21195] Updated weights for policy 0, policy_version 41030 (0.0008) +[2023-10-08 17:22:37,729][21195] Updated weights for policy 0, policy_version 41040 (0.0009) +[2023-10-08 17:22:38,090][21195] Updated weights for policy 0, policy_version 41050 (0.0009) +[2023-10-08 17:22:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 83755008. Throughput: 0: 1758.8, 1: 1700.8. Samples: 20942002. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:22:38,803][19739] Avg episode reward: [(0, '709.130'), (1, '727.950')] +[2023-10-08 17:22:40,288][21194] Updated weights for policy 1, policy_version 40740 (0.0008) +[2023-10-08 17:22:40,651][21194] Updated weights for policy 1, policy_version 40750 (0.0008) +[2023-10-08 17:22:41,012][21194] Updated weights for policy 1, policy_version 40760 (0.0008) +[2023-10-08 17:22:41,980][21195] Updated weights for policy 0, policy_version 41060 (0.0009) +[2023-10-08 17:22:42,347][21195] Updated weights for policy 0, policy_version 41070 (0.0009) +[2023-10-08 17:22:42,719][21195] Updated weights for policy 0, policy_version 41080 (0.0009) +[2023-10-08 17:22:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 83820544. Throughput: 0: 1734.8, 1: 1722.7. Samples: 20962666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:22:43,803][19739] Avg episode reward: [(0, '730.220'), (1, '727.950')] +[2023-10-08 17:22:44,949][21194] Updated weights for policy 1, policy_version 40770 (0.0008) +[2023-10-08 17:22:45,314][21194] Updated weights for policy 1, policy_version 40780 (0.0009) +[2023-10-08 17:22:45,684][21194] Updated weights for policy 1, policy_version 40790 (0.0009) +[2023-10-08 17:22:46,042][21194] Updated weights for policy 1, policy_version 40800 (0.0009) +[2023-10-08 17:22:46,658][21195] Updated weights for policy 0, policy_version 41090 (0.0008) +[2023-10-08 17:22:47,032][21195] Updated weights for policy 0, policy_version 41100 (0.0008) +[2023-10-08 17:22:47,401][21195] Updated weights for policy 0, policy_version 41110 (0.0008) +[2023-10-08 17:22:47,765][21195] Updated weights for policy 0, policy_version 41120 (0.0007) +[2023-10-08 17:22:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 83886080. Throughput: 0: 1725.3, 1: 1704.5. Samples: 20977906. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:22:48,803][19739] Avg episode reward: [(0, '730.220'), (1, '725.170')] +[2023-10-08 17:22:50,001][21194] Updated weights for policy 1, policy_version 40810 (0.0007) +[2023-10-08 17:22:50,371][21194] Updated weights for policy 1, policy_version 40820 (0.0009) +[2023-10-08 17:22:50,743][21194] Updated weights for policy 1, policy_version 40830 (0.0010) +[2023-10-08 17:22:51,662][21195] Updated weights for policy 0, policy_version 41130 (0.0011) +[2023-10-08 17:22:52,020][21195] Updated weights for policy 0, policy_version 41140 (0.0009) +[2023-10-08 17:22:52,387][21195] Updated weights for policy 0, policy_version 41150 (0.0007) +[2023-10-08 17:22:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 83951616. Throughput: 0: 1740.4, 1: 1705.6. Samples: 20993778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:22:53,803][19739] Avg episode reward: [(0, '713.360'), (1, '725.170')] +[2023-10-08 17:22:54,707][21194] Updated weights for policy 1, policy_version 40840 (0.0010) +[2023-10-08 17:22:55,082][21194] Updated weights for policy 1, policy_version 40850 (0.0008) +[2023-10-08 17:22:55,443][21194] Updated weights for policy 1, policy_version 40860 (0.0011) +[2023-10-08 17:22:56,161][21195] Updated weights for policy 0, policy_version 41160 (0.0008) +[2023-10-08 17:22:56,526][21195] Updated weights for policy 0, policy_version 41170 (0.0009) +[2023-10-08 17:22:56,898][21195] Updated weights for policy 0, policy_version 41180 (0.0009) +[2023-10-08 17:22:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 84017152. Throughput: 0: 1727.9, 1: 1740.8. Samples: 21015008. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:22:58,803][19739] Avg episode reward: [(0, '713.360'), (1, '732.940')] +[2023-10-08 17:22:59,179][21194] Updated weights for policy 1, policy_version 40870 (0.0008) +[2023-10-08 17:22:59,555][21194] Updated weights for policy 1, policy_version 40880 (0.0007) +[2023-10-08 17:22:59,923][21194] Updated weights for policy 1, policy_version 40890 (0.0009) +[2023-10-08 17:23:01,026][21195] Updated weights for policy 0, policy_version 41190 (0.0009) +[2023-10-08 17:23:01,407][21195] Updated weights for policy 0, policy_version 41200 (0.0011) +[2023-10-08 17:23:01,771][21195] Updated weights for policy 0, policy_version 41210 (0.0009) +[2023-10-08 17:23:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 84082688. Throughput: 0: 1736.1, 1: 1709.7. Samples: 21030324. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 17:23:03,803][19739] Avg episode reward: [(0, '713.360'), (1, '732.940')] +[2023-10-08 17:23:03,879][21194] Updated weights for policy 1, policy_version 40900 (0.0008) +[2023-10-08 17:23:04,243][21194] Updated weights for policy 1, policy_version 40910 (0.0008) +[2023-10-08 17:23:04,603][21194] Updated weights for policy 1, policy_version 40920 (0.0008) +[2023-10-08 17:23:05,714][21195] Updated weights for policy 0, policy_version 41220 (0.0008) +[2023-10-08 17:23:06,081][21195] Updated weights for policy 0, policy_version 41230 (0.0008) +[2023-10-08 17:23:06,459][21195] Updated weights for policy 0, policy_version 41240 (0.0009) +[2023-10-08 17:23:08,649][21194] Updated weights for policy 1, policy_version 40930 (0.0008) +[2023-10-08 17:23:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 84148224. Throughput: 0: 1728.9, 1: 1738.6. Samples: 21045892. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 17:23:08,803][19739] Avg episode reward: [(0, '725.620'), (1, '698.300')] +[2023-10-08 17:23:09,026][21194] Updated weights for policy 1, policy_version 40940 (0.0008) +[2023-10-08 17:23:09,392][21194] Updated weights for policy 1, policy_version 40950 (0.0008) +[2023-10-08 17:23:09,748][21194] Updated weights for policy 1, policy_version 40960 (0.0008) +[2023-10-08 17:23:10,455][21195] Updated weights for policy 0, policy_version 41250 (0.0009) +[2023-10-08 17:23:10,854][21195] Updated weights for policy 0, policy_version 41260 (0.0009) +[2023-10-08 17:23:11,237][21195] Updated weights for policy 0, policy_version 41270 (0.0011) +[2023-10-08 17:23:11,604][21195] Updated weights for policy 0, policy_version 41280 (0.0011) +[2023-10-08 17:23:13,737][21194] Updated weights for policy 1, policy_version 40970 (0.0009) +[2023-10-08 17:23:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 84213760. Throughput: 0: 1723.9, 1: 1740.4. Samples: 21067068. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 17:23:13,804][19739] Avg episode reward: [(0, '725.620'), (1, '696.220')] +[2023-10-08 17:23:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000041280_42270720.pth... +[2023-10-08 17:23:13,847][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000039648_40599552.pth +[2023-10-08 17:23:14,106][21194] Updated weights for policy 1, policy_version 40980 (0.0009) +[2023-10-08 17:23:14,466][21194] Updated weights for policy 1, policy_version 40990 (0.0008) +[2023-10-08 17:23:14,536][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000040992_41975808.pth... +[2023-10-08 17:23:14,575][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000039360_40304640.pth +[2023-10-08 17:23:15,272][21195] Updated weights for policy 0, policy_version 41290 (0.0009) +[2023-10-08 17:23:15,639][21195] Updated weights for policy 0, policy_version 41300 (0.0007) +[2023-10-08 17:23:16,009][21195] Updated weights for policy 0, policy_version 41310 (0.0008) +[2023-10-08 17:23:18,506][21194] Updated weights for policy 1, policy_version 41000 (0.0010) +[2023-10-08 17:23:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 84279296. Throughput: 0: 1754.0, 1: 1721.7. Samples: 21082440. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 17:23:18,803][19739] Avg episode reward: [(0, '725.620'), (1, '696.250')] +[2023-10-08 17:23:18,877][21194] Updated weights for policy 1, policy_version 41010 (0.0007) +[2023-10-08 17:23:19,228][21194] Updated weights for policy 1, policy_version 41020 (0.0008) +[2023-10-08 17:23:19,851][21195] Updated weights for policy 0, policy_version 41320 (0.0008) +[2023-10-08 17:23:20,214][21195] Updated weights for policy 0, policy_version 41330 (0.0008) +[2023-10-08 17:23:20,583][21195] Updated weights for policy 0, policy_version 41340 (0.0008) +[2023-10-08 17:23:23,131][21194] Updated weights for policy 1, policy_version 41030 (0.0008) +[2023-10-08 17:23:23,502][21194] Updated weights for policy 1, policy_version 41040 (0.0009) +[2023-10-08 17:23:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 84344832. Throughput: 0: 1721.0, 1: 1740.6. Samples: 21097774. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 17:23:23,804][19739] Avg episode reward: [(0, '713.150'), (1, '696.250')] +[2023-10-08 17:23:23,869][21194] Updated weights for policy 1, policy_version 41050 (0.0009) +[2023-10-08 17:23:24,558][21195] Updated weights for policy 0, policy_version 41350 (0.0007) +[2023-10-08 17:23:24,922][21195] Updated weights for policy 0, policy_version 41360 (0.0009) +[2023-10-08 17:23:25,287][21195] Updated weights for policy 0, policy_version 41370 (0.0009) +[2023-10-08 17:23:27,825][21194] Updated weights for policy 1, policy_version 41060 (0.0008) +[2023-10-08 17:23:28,219][21194] Updated weights for policy 1, policy_version 41070 (0.0009) +[2023-10-08 17:23:28,588][21194] Updated weights for policy 1, policy_version 41080 (0.0009) +[2023-10-08 17:23:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 84410368. Throughput: 0: 1741.5, 1: 1728.9. Samples: 21118834. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 17:23:28,803][19739] Avg episode reward: [(0, '713.150'), (1, '696.250')] +[2023-10-08 17:23:29,200][21195] Updated weights for policy 0, policy_version 41380 (0.0008) +[2023-10-08 17:23:29,566][21195] Updated weights for policy 0, policy_version 41390 (0.0008) +[2023-10-08 17:23:29,937][21195] Updated weights for policy 0, policy_version 41400 (0.0007) +[2023-10-08 17:23:32,541][21194] Updated weights for policy 1, policy_version 41090 (0.0009) +[2023-10-08 17:23:32,914][21194] Updated weights for policy 1, policy_version 41100 (0.0009) +[2023-10-08 17:23:33,290][21194] Updated weights for policy 1, policy_version 41110 (0.0008) +[2023-10-08 17:23:33,663][21194] Updated weights for policy 1, policy_version 41120 (0.0007) +[2023-10-08 17:23:33,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 84508672. Throughput: 0: 1752.8, 1: 1733.7. Samples: 21134798. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 17:23:33,803][19739] Avg episode reward: [(0, '713.180'), (1, '696.250')] +[2023-10-08 17:23:33,895][21195] Updated weights for policy 0, policy_version 41410 (0.0008) +[2023-10-08 17:23:34,266][21195] Updated weights for policy 0, policy_version 41420 (0.0008) +[2023-10-08 17:23:34,639][21195] Updated weights for policy 0, policy_version 41430 (0.0007) +[2023-10-08 17:23:35,000][21195] Updated weights for policy 0, policy_version 41440 (0.0007) +[2023-10-08 17:23:37,500][21194] Updated weights for policy 1, policy_version 41130 (0.0007) +[2023-10-08 17:23:37,868][21194] Updated weights for policy 1, policy_version 41140 (0.0008) +[2023-10-08 17:23:38,225][21194] Updated weights for policy 1, policy_version 41150 (0.0010) +[2023-10-08 17:23:38,793][21195] Updated weights for policy 0, policy_version 41450 (0.0008) +[2023-10-08 17:23:38,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 84574208. Throughput: 0: 1739.3, 1: 1738.3. Samples: 21150270. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 17:23:38,804][19739] Avg episode reward: [(0, '713.180'), (1, '698.510')] +[2023-10-08 17:23:39,160][21195] Updated weights for policy 0, policy_version 41460 (0.0009) +[2023-10-08 17:23:39,537][21195] Updated weights for policy 0, policy_version 41470 (0.0009) +[2023-10-08 17:23:42,324][21194] Updated weights for policy 1, policy_version 41160 (0.0009) +[2023-10-08 17:23:42,698][21194] Updated weights for policy 1, policy_version 41170 (0.0008) +[2023-10-08 17:23:43,055][21194] Updated weights for policy 1, policy_version 41180 (0.0008) +[2023-10-08 17:23:43,439][21195] Updated weights for policy 0, policy_version 41480 (0.0009) +[2023-10-08 17:23:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 84639744. Throughput: 0: 1755.8, 1: 1702.7. Samples: 21170640. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 17:23:43,803][19739] Avg episode reward: [(0, '713.180'), (1, '713.130')] +[2023-10-08 17:23:43,819][21195] Updated weights for policy 0, policy_version 41490 (0.0009) +[2023-10-08 17:23:44,197][21195] Updated weights for policy 0, policy_version 41500 (0.0007) +[2023-10-08 17:23:47,016][21194] Updated weights for policy 1, policy_version 41190 (0.0009) +[2023-10-08 17:23:47,384][21194] Updated weights for policy 1, policy_version 41200 (0.0010) +[2023-10-08 17:23:47,747][21194] Updated weights for policy 1, policy_version 41210 (0.0011) +[2023-10-08 17:23:48,142][21195] Updated weights for policy 0, policy_version 41510 (0.0010) +[2023-10-08 17:23:48,508][21195] Updated weights for policy 0, policy_version 41520 (0.0011) +[2023-10-08 17:23:48,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 84705280. Throughput: 0: 1733.6, 1: 1730.6. Samples: 21186214. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 17:23:48,803][19739] Avg episode reward: [(0, '713.180'), (1, '713.130')] +[2023-10-08 17:23:48,879][21195] Updated weights for policy 0, policy_version 41530 (0.0011) +[2023-10-08 17:23:51,682][21194] Updated weights for policy 1, policy_version 41220 (0.0010) +[2023-10-08 17:23:52,048][21194] Updated weights for policy 1, policy_version 41230 (0.0011) +[2023-10-08 17:23:52,414][21194] Updated weights for policy 1, policy_version 41240 (0.0007) +[2023-10-08 17:23:52,862][21195] Updated weights for policy 0, policy_version 41540 (0.0010) +[2023-10-08 17:23:53,233][21195] Updated weights for policy 0, policy_version 41550 (0.0009) +[2023-10-08 17:23:53,596][21195] Updated weights for policy 0, policy_version 41560 (0.0011) +[2023-10-08 17:23:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 84770816. Throughput: 0: 1752.9, 1: 1714.2. Samples: 21201910. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 17:23:53,803][19739] Avg episode reward: [(0, '713.180'), (1, '713.130')] +[2023-10-08 17:23:56,352][21194] Updated weights for policy 1, policy_version 41250 (0.0007) +[2023-10-08 17:23:56,722][21194] Updated weights for policy 1, policy_version 41260 (0.0007) +[2023-10-08 17:23:57,085][21194] Updated weights for policy 1, policy_version 41270 (0.0007) +[2023-10-08 17:23:57,452][21194] Updated weights for policy 1, policy_version 41280 (0.0007) +[2023-10-08 17:23:57,570][21195] Updated weights for policy 0, policy_version 41570 (0.0009) +[2023-10-08 17:23:57,949][21195] Updated weights for policy 0, policy_version 41580 (0.0007) +[2023-10-08 17:23:58,313][21195] Updated weights for policy 0, policy_version 41590 (0.0009) +[2023-10-08 17:23:58,684][21195] Updated weights for policy 0, policy_version 41600 (0.0007) +[2023-10-08 17:23:58,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 84869120. Throughput: 0: 1748.0, 1: 1699.3. Samples: 21222198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:23:58,803][19739] Avg episode reward: [(0, '713.180'), (1, '713.130')] +[2023-10-08 17:24:01,628][21194] Updated weights for policy 1, policy_version 41290 (0.0009) +[2023-10-08 17:24:01,986][21194] Updated weights for policy 1, policy_version 41300 (0.0009) +[2023-10-08 17:24:02,347][21194] Updated weights for policy 1, policy_version 41310 (0.0007) +[2023-10-08 17:24:02,574][21195] Updated weights for policy 0, policy_version 41610 (0.0008) +[2023-10-08 17:24:02,938][21195] Updated weights for policy 0, policy_version 41620 (0.0010) +[2023-10-08 17:24:03,303][21195] Updated weights for policy 0, policy_version 41630 (0.0008) +[2023-10-08 17:24:03,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 84934656. Throughput: 0: 1725.5, 1: 1720.9. Samples: 21237528. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:24:03,803][19739] Avg episode reward: [(0, '721.960'), (1, '713.130')] +[2023-10-08 17:24:06,096][21194] Updated weights for policy 1, policy_version 41320 (0.0009) +[2023-10-08 17:24:06,467][21194] Updated weights for policy 1, policy_version 41330 (0.0010) +[2023-10-08 17:24:06,819][21194] Updated weights for policy 1, policy_version 41340 (0.0008) +[2023-10-08 17:24:07,233][21195] Updated weights for policy 0, policy_version 41640 (0.0007) +[2023-10-08 17:24:07,603][21195] Updated weights for policy 0, policy_version 41650 (0.0008) +[2023-10-08 17:24:07,965][21195] Updated weights for policy 0, policy_version 41660 (0.0007) +[2023-10-08 17:24:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 85000192. Throughput: 0: 1754.4, 1: 1696.2. Samples: 21253054. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:24:08,803][19739] Avg episode reward: [(0, '721.960'), (1, '728.170')] +[2023-10-08 17:24:10,723][21194] Updated weights for policy 1, policy_version 41350 (0.0011) +[2023-10-08 17:24:11,084][21194] Updated weights for policy 1, policy_version 41360 (0.0008) +[2023-10-08 17:24:11,447][21194] Updated weights for policy 1, policy_version 41370 (0.0007) +[2023-10-08 17:24:11,807][21195] Updated weights for policy 0, policy_version 41670 (0.0009) +[2023-10-08 17:24:12,180][21195] Updated weights for policy 0, policy_version 41680 (0.0007) +[2023-10-08 17:24:12,542][21195] Updated weights for policy 0, policy_version 41690 (0.0007) +[2023-10-08 17:24:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 85065728. Throughput: 0: 1723.2, 1: 1710.7. Samples: 21273358. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:24:13,803][19739] Avg episode reward: [(0, '722.320'), (1, '728.170')] +[2023-10-08 17:24:15,372][21194] Updated weights for policy 1, policy_version 41380 (0.0009) +[2023-10-08 17:24:15,763][21194] Updated weights for policy 1, policy_version 41390 (0.0010) +[2023-10-08 17:24:16,122][21194] Updated weights for policy 1, policy_version 41400 (0.0010) +[2023-10-08 17:24:16,437][21195] Updated weights for policy 0, policy_version 41700 (0.0007) +[2023-10-08 17:24:16,804][21195] Updated weights for policy 0, policy_version 41710 (0.0007) +[2023-10-08 17:24:17,180][21195] Updated weights for policy 0, policy_version 41720 (0.0008) +[2023-10-08 17:24:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 85131264. Throughput: 0: 1716.3, 1: 1715.1. Samples: 21289208. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:24:18,803][19739] Avg episode reward: [(0, '722.320'), (1, '735.740')] +[2023-10-08 17:24:20,118][21194] Updated weights for policy 1, policy_version 41410 (0.0009) +[2023-10-08 17:24:20,493][21194] Updated weights for policy 1, policy_version 41420 (0.0009) +[2023-10-08 17:24:20,860][21194] Updated weights for policy 1, policy_version 41430 (0.0007) +[2023-10-08 17:24:21,170][21195] Updated weights for policy 0, policy_version 41730 (0.0009) +[2023-10-08 17:24:21,218][21194] Updated weights for policy 1, policy_version 41440 (0.0009) +[2023-10-08 17:24:21,537][21195] Updated weights for policy 0, policy_version 41740 (0.0010) +[2023-10-08 17:24:21,909][21195] Updated weights for policy 0, policy_version 41750 (0.0008) +[2023-10-08 17:24:22,279][21195] Updated weights for policy 0, policy_version 41760 (0.0009) +[2023-10-08 17:24:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 85196800. Throughput: 0: 1724.0, 1: 1705.6. Samples: 21304604. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:24:23,804][19739] Avg episode reward: [(0, '722.320'), (1, '735.740')] +[2023-10-08 17:24:25,126][21194] Updated weights for policy 1, policy_version 41450 (0.0009) +[2023-10-08 17:24:25,501][21194] Updated weights for policy 1, policy_version 41460 (0.0008) +[2023-10-08 17:24:25,861][21194] Updated weights for policy 1, policy_version 41470 (0.0009) +[2023-10-08 17:24:26,334][21195] Updated weights for policy 0, policy_version 41770 (0.0008) +[2023-10-08 17:24:26,702][21195] Updated weights for policy 0, policy_version 41780 (0.0008) +[2023-10-08 17:24:27,072][21195] Updated weights for policy 0, policy_version 41790 (0.0010) +[2023-10-08 17:24:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 85262336. Throughput: 0: 1703.8, 1: 1731.3. Samples: 21325218. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 17:24:28,803][19739] Avg episode reward: [(0, '722.320'), (1, '735.740')] +[2023-10-08 17:24:29,811][21194] Updated weights for policy 1, policy_version 41480 (0.0008) +[2023-10-08 17:24:30,181][21194] Updated weights for policy 1, policy_version 41490 (0.0007) +[2023-10-08 17:24:30,539][21194] Updated weights for policy 1, policy_version 41500 (0.0008) +[2023-10-08 17:24:30,906][21195] Updated weights for policy 0, policy_version 41800 (0.0009) +[2023-10-08 17:24:31,278][21195] Updated weights for policy 0, policy_version 41810 (0.0007) +[2023-10-08 17:24:31,640][21195] Updated weights for policy 0, policy_version 41820 (0.0010) +[2023-10-08 17:24:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 85327872. Throughput: 0: 1724.4, 1: 1707.6. Samples: 21340650. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 17:24:33,803][19739] Avg episode reward: [(0, '731.510'), (1, '735.740')] +[2023-10-08 17:24:34,314][21194] Updated weights for policy 1, policy_version 41510 (0.0009) +[2023-10-08 17:24:34,674][21194] Updated weights for policy 1, policy_version 41520 (0.0010) +[2023-10-08 17:24:35,039][21194] Updated weights for policy 1, policy_version 41530 (0.0011) +[2023-10-08 17:24:35,636][21195] Updated weights for policy 0, policy_version 41830 (0.0008) +[2023-10-08 17:24:36,005][21195] Updated weights for policy 0, policy_version 41840 (0.0007) +[2023-10-08 17:24:36,368][21195] Updated weights for policy 0, policy_version 41850 (0.0009) +[2023-10-08 17:24:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 85393408. Throughput: 0: 1704.1, 1: 1725.1. Samples: 21356226. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 17:24:38,804][19739] Avg episode reward: [(0, '731.510'), (1, '750.900')] +[2023-10-08 17:24:38,992][21194] Updated weights for policy 1, policy_version 41540 (0.0011) +[2023-10-08 17:24:39,363][21194] Updated weights for policy 1, policy_version 41550 (0.0007) +[2023-10-08 17:24:39,728][21194] Updated weights for policy 1, policy_version 41560 (0.0009) +[2023-10-08 17:24:40,236][21195] Updated weights for policy 0, policy_version 41860 (0.0010) +[2023-10-08 17:24:40,608][21195] Updated weights for policy 0, policy_version 41870 (0.0010) +[2023-10-08 17:24:40,974][21195] Updated weights for policy 0, policy_version 41880 (0.0009) +[2023-10-08 17:24:43,748][21194] Updated weights for policy 1, policy_version 41570 (0.0009) +[2023-10-08 17:24:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 85458944. Throughput: 0: 1711.3, 1: 1744.5. Samples: 21377710. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 17:24:43,803][19739] Avg episode reward: [(0, '731.510'), (1, '750.900')] +[2023-10-08 17:24:44,117][21194] Updated weights for policy 1, policy_version 41580 (0.0007) +[2023-10-08 17:24:44,483][21194] Updated weights for policy 1, policy_version 41590 (0.0007) +[2023-10-08 17:24:44,858][21194] Updated weights for policy 1, policy_version 41600 (0.0008) +[2023-10-08 17:24:44,963][21195] Updated weights for policy 0, policy_version 41890 (0.0008) +[2023-10-08 17:24:45,358][21195] Updated weights for policy 0, policy_version 41900 (0.0008) +[2023-10-08 17:24:45,715][21195] Updated weights for policy 0, policy_version 41910 (0.0010) +[2023-10-08 17:24:46,086][21195] Updated weights for policy 0, policy_version 41920 (0.0010) +[2023-10-08 17:24:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 85524480. Throughput: 0: 1734.0, 1: 1719.5. Samples: 21392932. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 17:24:48,803][19739] Avg episode reward: [(0, '731.590'), (1, '766.070')] +[2023-10-08 17:24:48,886][21194] Updated weights for policy 1, policy_version 41610 (0.0009) +[2023-10-08 17:24:49,252][21194] Updated weights for policy 1, policy_version 41620 (0.0010) +[2023-10-08 17:24:49,613][21194] Updated weights for policy 1, policy_version 41630 (0.0009) +[2023-10-08 17:24:49,933][21195] Updated weights for policy 0, policy_version 41930 (0.0007) +[2023-10-08 17:24:50,298][21195] Updated weights for policy 0, policy_version 41940 (0.0010) +[2023-10-08 17:24:50,674][21195] Updated weights for policy 0, policy_version 41950 (0.0011) +[2023-10-08 17:24:53,575][21194] Updated weights for policy 1, policy_version 41640 (0.0009) +[2023-10-08 17:24:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 85590016. Throughput: 0: 1702.5, 1: 1745.2. Samples: 21408202. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 17:24:53,803][19739] Avg episode reward: [(0, '717.820'), (1, '766.070')] +[2023-10-08 17:24:53,947][21194] Updated weights for policy 1, policy_version 41650 (0.0008) +[2023-10-08 17:24:54,307][21194] Updated weights for policy 1, policy_version 41660 (0.0008) +[2023-10-08 17:24:54,669][21195] Updated weights for policy 0, policy_version 41960 (0.0008) +[2023-10-08 17:24:55,036][21195] Updated weights for policy 0, policy_version 41970 (0.0007) +[2023-10-08 17:24:55,404][21195] Updated weights for policy 0, policy_version 41980 (0.0009) +[2023-10-08 17:24:58,347][21194] Updated weights for policy 1, policy_version 41670 (0.0009) +[2023-10-08 17:24:58,716][21194] Updated weights for policy 1, policy_version 41680 (0.0008) +[2023-10-08 17:24:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 85655552. Throughput: 0: 1731.8, 1: 1739.5. Samples: 21429568. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:24:58,803][19739] Avg episode reward: [(0, '732.680'), (1, '766.070')] +[2023-10-08 17:24:59,076][21194] Updated weights for policy 1, policy_version 41690 (0.0007) +[2023-10-08 17:24:59,307][21195] Updated weights for policy 0, policy_version 41990 (0.0008) +[2023-10-08 17:24:59,673][21195] Updated weights for policy 0, policy_version 42000 (0.0009) +[2023-10-08 17:25:00,052][21195] Updated weights for policy 0, policy_version 42010 (0.0010) +[2023-10-08 17:25:03,143][21194] Updated weights for policy 1, policy_version 41700 (0.0010) +[2023-10-08 17:25:03,514][21194] Updated weights for policy 1, policy_version 41710 (0.0009) +[2023-10-08 17:25:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 85721088. Throughput: 0: 1734.5, 1: 1726.2. Samples: 21444942. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:25:03,804][19739] Avg episode reward: [(0, '744.010'), (1, '766.070')] +[2023-10-08 17:25:03,884][21194] Updated weights for policy 1, policy_version 41720 (0.0008) +[2023-10-08 17:25:03,936][21195] Updated weights for policy 0, policy_version 42020 (0.0008) +[2023-10-08 17:25:04,310][21195] Updated weights for policy 0, policy_version 42030 (0.0008) +[2023-10-08 17:25:04,675][21195] Updated weights for policy 0, policy_version 42040 (0.0009) +[2023-10-08 17:25:07,901][21194] Updated weights for policy 1, policy_version 41730 (0.0009) +[2023-10-08 17:25:08,272][21194] Updated weights for policy 1, policy_version 41740 (0.0008) +[2023-10-08 17:25:08,570][21195] Updated weights for policy 0, policy_version 42050 (0.0007) +[2023-10-08 17:25:08,643][21194] Updated weights for policy 1, policy_version 41750 (0.0010) +[2023-10-08 17:25:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 85786624. Throughput: 0: 1727.1, 1: 1728.8. Samples: 21460120. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:25:08,803][19739] Avg episode reward: [(0, '744.010'), (1, '766.070')] +[2023-10-08 17:25:08,939][21195] Updated weights for policy 0, policy_version 42060 (0.0007) +[2023-10-08 17:25:09,004][21194] Updated weights for policy 1, policy_version 41760 (0.0008) +[2023-10-08 17:25:09,304][21195] Updated weights for policy 0, policy_version 42070 (0.0011) +[2023-10-08 17:25:09,676][21195] Updated weights for policy 0, policy_version 42080 (0.0009) +[2023-10-08 17:25:12,905][21194] Updated weights for policy 1, policy_version 41770 (0.0008) +[2023-10-08 17:25:13,267][21194] Updated weights for policy 1, policy_version 41780 (0.0007) +[2023-10-08 17:25:13,636][21194] Updated weights for policy 1, policy_version 41790 (0.0008) +[2023-10-08 17:25:13,653][21195] Updated weights for policy 0, policy_version 42090 (0.0008) +[2023-10-08 17:25:13,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 85884928. Throughput: 0: 1745.2, 1: 1722.5. Samples: 21481266. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:25:13,803][19739] Avg episode reward: [(0, '757.470'), (1, '779.770')] +[2023-10-08 17:25:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000041792_42795008.pth... +[2023-10-08 17:25:13,840][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000040160_41123840.pth +[2023-10-08 17:25:14,021][21195] Updated weights for policy 0, policy_version 42100 (0.0009) +[2023-10-08 17:25:14,392][21195] Updated weights for policy 0, policy_version 42110 (0.0008) +[2023-10-08 17:25:14,462][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000042112_43122688.pth... +[2023-10-08 17:25:14,502][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000040480_41451520.pth +[2023-10-08 17:25:17,436][21194] Updated weights for policy 1, policy_version 41800 (0.0007) +[2023-10-08 17:25:17,800][21194] Updated weights for policy 1, policy_version 41810 (0.0007) +[2023-10-08 17:25:18,162][21194] Updated weights for policy 1, policy_version 41820 (0.0010) +[2023-10-08 17:25:18,498][21195] Updated weights for policy 0, policy_version 42120 (0.0010) +[2023-10-08 17:25:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 85950464. Throughput: 0: 1729.9, 1: 1733.9. Samples: 21496520. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:25:18,803][19739] Avg episode reward: [(0, '758.170'), (1, '789.700')] +[2023-10-08 17:25:18,871][21195] Updated weights for policy 0, policy_version 42130 (0.0007) +[2023-10-08 17:25:19,247][21195] Updated weights for policy 0, policy_version 42140 (0.0008) +[2023-10-08 17:25:22,351][21194] Updated weights for policy 1, policy_version 41830 (0.0009) +[2023-10-08 17:25:22,710][21194] Updated weights for policy 1, policy_version 41840 (0.0008) +[2023-10-08 17:25:23,009][21195] Updated weights for policy 0, policy_version 42150 (0.0008) +[2023-10-08 17:25:23,081][21194] Updated weights for policy 1, policy_version 41850 (0.0007) +[2023-10-08 17:25:23,372][21195] Updated weights for policy 0, policy_version 42160 (0.0008) +[2023-10-08 17:25:23,740][21195] Updated weights for policy 0, policy_version 42170 (0.0007) +[2023-10-08 17:25:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 86016000. Throughput: 0: 1739.1, 1: 1727.4. Samples: 21512216. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 17:25:23,803][19739] Avg episode reward: [(0, '758.170'), (1, '789.700')] +[2023-10-08 17:25:26,998][21194] Updated weights for policy 1, policy_version 41860 (0.0009) +[2023-10-08 17:25:27,371][21194] Updated weights for policy 1, policy_version 41870 (0.0009) +[2023-10-08 17:25:27,595][21195] Updated weights for policy 0, policy_version 42180 (0.0008) +[2023-10-08 17:25:27,738][21194] Updated weights for policy 1, policy_version 41880 (0.0009) +[2023-10-08 17:25:27,954][21195] Updated weights for policy 0, policy_version 42190 (0.0009) +[2023-10-08 17:25:28,332][21195] Updated weights for policy 0, policy_version 42200 (0.0008) +[2023-10-08 17:25:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 86114304. Throughput: 0: 1738.8, 1: 1696.6. Samples: 21532304. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:28,803][19739] Avg episode reward: [(0, '758.170'), (1, '789.700')] +[2023-10-08 17:25:31,602][21194] Updated weights for policy 1, policy_version 41890 (0.0009) +[2023-10-08 17:25:31,976][21194] Updated weights for policy 1, policy_version 41900 (0.0007) +[2023-10-08 17:25:32,284][21195] Updated weights for policy 0, policy_version 42210 (0.0007) +[2023-10-08 17:25:32,336][21194] Updated weights for policy 1, policy_version 41910 (0.0007) +[2023-10-08 17:25:32,680][21195] Updated weights for policy 0, policy_version 42220 (0.0007) +[2023-10-08 17:25:32,699][21194] Updated weights for policy 1, policy_version 41920 (0.0008) +[2023-10-08 17:25:33,055][21195] Updated weights for policy 0, policy_version 42230 (0.0008) +[2023-10-08 17:25:33,417][21195] Updated weights for policy 0, policy_version 42240 (0.0007) +[2023-10-08 17:25:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 86179840. Throughput: 0: 1714.2, 1: 1725.9. Samples: 21547738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:33,803][19739] Avg episode reward: [(0, '758.170'), (1, '789.700')] +[2023-10-08 17:25:36,588][21194] Updated weights for policy 1, policy_version 41930 (0.0008) +[2023-10-08 17:25:36,956][21194] Updated weights for policy 1, policy_version 41940 (0.0007) +[2023-10-08 17:25:37,308][21195] Updated weights for policy 0, policy_version 42250 (0.0007) +[2023-10-08 17:25:37,324][21194] Updated weights for policy 1, policy_version 41950 (0.0007) +[2023-10-08 17:25:37,684][21195] Updated weights for policy 0, policy_version 42260 (0.0010) +[2023-10-08 17:25:38,050][21195] Updated weights for policy 0, policy_version 42270 (0.0008) +[2023-10-08 17:25:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 86245376. Throughput: 0: 1743.9, 1: 1712.9. Samples: 21563760. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:38,804][19739] Avg episode reward: [(0, '766.590'), (1, '789.700')] +[2023-10-08 17:25:41,370][21194] Updated weights for policy 1, policy_version 41960 (0.0008) +[2023-10-08 17:25:41,741][21194] Updated weights for policy 1, policy_version 41970 (0.0008) +[2023-10-08 17:25:42,000][21195] Updated weights for policy 0, policy_version 42280 (0.0007) +[2023-10-08 17:25:42,100][21194] Updated weights for policy 1, policy_version 41980 (0.0007) +[2023-10-08 17:25:42,374][21195] Updated weights for policy 0, policy_version 42290 (0.0007) +[2023-10-08 17:25:42,746][21195] Updated weights for policy 0, policy_version 42300 (0.0010) +[2023-10-08 17:25:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 86310912. Throughput: 0: 1714.7, 1: 1702.9. Samples: 21583362. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:43,803][19739] Avg episode reward: [(0, '746.880'), (1, '789.700')] +[2023-10-08 17:25:45,942][21194] Updated weights for policy 1, policy_version 41990 (0.0008) +[2023-10-08 17:25:46,306][21194] Updated weights for policy 1, policy_version 42000 (0.0009) +[2023-10-08 17:25:46,672][21194] Updated weights for policy 1, policy_version 42010 (0.0010) +[2023-10-08 17:25:46,905][21195] Updated weights for policy 0, policy_version 42310 (0.0009) +[2023-10-08 17:25:47,275][21195] Updated weights for policy 0, policy_version 42320 (0.0009) +[2023-10-08 17:25:47,636][21195] Updated weights for policy 0, policy_version 42330 (0.0009) +[2023-10-08 17:25:48,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 86376448. Throughput: 0: 1710.5, 1: 1726.4. Samples: 21599598. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:48,803][19739] Avg episode reward: [(0, '746.880'), (1, '804.780')] +[2023-10-08 17:25:50,628][21194] Updated weights for policy 1, policy_version 42020 (0.0008) +[2023-10-08 17:25:50,990][21194] Updated weights for policy 1, policy_version 42030 (0.0008) +[2023-10-08 17:25:51,351][21194] Updated weights for policy 1, policy_version 42040 (0.0007) +[2023-10-08 17:25:51,440][21195] Updated weights for policy 0, policy_version 42340 (0.0008) +[2023-10-08 17:25:51,805][21195] Updated weights for policy 0, policy_version 42350 (0.0008) +[2023-10-08 17:25:52,183][21195] Updated weights for policy 0, policy_version 42360 (0.0008) +[2023-10-08 17:25:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 86441984. Throughput: 0: 1726.1, 1: 1706.1. Samples: 21614570. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:53,804][19739] Avg episode reward: [(0, '746.880'), (1, '804.780')] +[2023-10-08 17:25:55,390][21194] Updated weights for policy 1, policy_version 42050 (0.0008) +[2023-10-08 17:25:55,763][21194] Updated weights for policy 1, policy_version 42060 (0.0010) +[2023-10-08 17:25:56,020][21195] Updated weights for policy 0, policy_version 42370 (0.0008) +[2023-10-08 17:25:56,137][21194] Updated weights for policy 1, policy_version 42070 (0.0007) +[2023-10-08 17:25:56,395][21195] Updated weights for policy 0, policy_version 42380 (0.0007) +[2023-10-08 17:25:56,502][21194] Updated weights for policy 1, policy_version 42080 (0.0008) +[2023-10-08 17:25:56,766][21195] Updated weights for policy 0, policy_version 42390 (0.0007) +[2023-10-08 17:25:57,135][21195] Updated weights for policy 0, policy_version 42400 (0.0008) +[2023-10-08 17:25:58,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 86507520. Throughput: 0: 1707.3, 1: 1708.6. Samples: 21634984. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:25:58,804][19739] Avg episode reward: [(0, '746.880'), (1, '808.170')] +[2023-10-08 17:26:00,645][21194] Updated weights for policy 1, policy_version 42090 (0.0010) +[2023-10-08 17:26:01,009][21194] Updated weights for policy 1, policy_version 42100 (0.0008) +[2023-10-08 17:26:01,182][21195] Updated weights for policy 0, policy_version 42410 (0.0008) +[2023-10-08 17:26:01,379][21194] Updated weights for policy 1, policy_version 42110 (0.0007) +[2023-10-08 17:26:01,550][21195] Updated weights for policy 0, policy_version 42420 (0.0009) +[2023-10-08 17:26:01,917][21195] Updated weights for policy 0, policy_version 42430 (0.0010) +[2023-10-08 17:26:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 86573056. Throughput: 0: 1723.6, 1: 1704.8. Samples: 21650798. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:26:03,803][19739] Avg episode reward: [(0, '746.880'), (1, '808.940')] +[2023-10-08 17:26:05,207][21194] Updated weights for policy 1, policy_version 42120 (0.0008) +[2023-10-08 17:26:05,575][21194] Updated weights for policy 1, policy_version 42130 (0.0008) +[2023-10-08 17:26:05,842][21195] Updated weights for policy 0, policy_version 42440 (0.0010) +[2023-10-08 17:26:05,948][21194] Updated weights for policy 1, policy_version 42140 (0.0010) +[2023-10-08 17:26:06,217][21195] Updated weights for policy 0, policy_version 42450 (0.0010) +[2023-10-08 17:26:06,586][21195] Updated weights for policy 0, policy_version 42460 (0.0010) +[2023-10-08 17:26:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 86638592. Throughput: 0: 1712.0, 1: 1692.3. Samples: 21665406. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:26:08,803][19739] Avg episode reward: [(0, '737.820'), (1, '779.500')] +[2023-10-08 17:26:10,086][21194] Updated weights for policy 1, policy_version 42150 (0.0008) +[2023-10-08 17:26:10,455][21194] Updated weights for policy 1, policy_version 42160 (0.0007) +[2023-10-08 17:26:10,593][21195] Updated weights for policy 0, policy_version 42470 (0.0007) +[2023-10-08 17:26:10,824][21194] Updated weights for policy 1, policy_version 42170 (0.0008) +[2023-10-08 17:26:10,955][21195] Updated weights for policy 0, policy_version 42480 (0.0007) +[2023-10-08 17:26:11,319][21195] Updated weights for policy 0, policy_version 42490 (0.0007) +[2023-10-08 17:26:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 86704128. Throughput: 0: 1716.4, 1: 1716.1. Samples: 21686768. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:26:13,804][19739] Avg episode reward: [(0, '736.960'), (1, '795.040')] +[2023-10-08 17:26:14,660][21194] Updated weights for policy 1, policy_version 42180 (0.0008) +[2023-10-08 17:26:15,022][21194] Updated weights for policy 1, policy_version 42190 (0.0007) +[2023-10-08 17:26:15,114][21195] Updated weights for policy 0, policy_version 42500 (0.0007) +[2023-10-08 17:26:15,378][21194] Updated weights for policy 1, policy_version 42200 (0.0009) +[2023-10-08 17:26:15,473][21195] Updated weights for policy 0, policy_version 42510 (0.0007) +[2023-10-08 17:26:15,854][21195] Updated weights for policy 0, policy_version 42520 (0.0009) +[2023-10-08 17:26:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 86769664. Throughput: 0: 1742.5, 1: 1692.9. Samples: 21702334. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:26:18,803][19739] Avg episode reward: [(0, '726.650'), (1, '795.040')] +[2023-10-08 17:26:19,450][21194] Updated weights for policy 1, policy_version 42210 (0.0008) +[2023-10-08 17:26:19,828][21194] Updated weights for policy 1, policy_version 42220 (0.0009) +[2023-10-08 17:26:19,860][21195] Updated weights for policy 0, policy_version 42530 (0.0007) +[2023-10-08 17:26:20,189][21194] Updated weights for policy 1, policy_version 42230 (0.0009) +[2023-10-08 17:26:20,229][21195] Updated weights for policy 0, policy_version 42540 (0.0008) +[2023-10-08 17:26:20,554][21194] Updated weights for policy 1, policy_version 42240 (0.0009) +[2023-10-08 17:26:20,599][21195] Updated weights for policy 0, policy_version 42550 (0.0008) +[2023-10-08 17:26:20,966][21195] Updated weights for policy 0, policy_version 42560 (0.0008) +[2023-10-08 17:26:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 86835200. Throughput: 0: 1713.2, 1: 1706.3. Samples: 21717640. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:26:23,804][19739] Avg episode reward: [(0, '727.340'), (1, '795.040')] +[2023-10-08 17:26:24,627][21194] Updated weights for policy 1, policy_version 42250 (0.0008) +[2023-10-08 17:26:24,897][21195] Updated weights for policy 0, policy_version 42570 (0.0010) +[2023-10-08 17:26:25,002][21194] Updated weights for policy 1, policy_version 42260 (0.0008) +[2023-10-08 17:26:25,272][21195] Updated weights for policy 0, policy_version 42580 (0.0009) +[2023-10-08 17:26:25,368][21194] Updated weights for policy 1, policy_version 42270 (0.0010) +[2023-10-08 17:26:25,631][21195] Updated weights for policy 0, policy_version 42590 (0.0009) +[2023-10-08 17:26:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 86900736. Throughput: 0: 1738.1, 1: 1716.2. Samples: 21738806. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:26:28,803][19739] Avg episode reward: [(0, '727.340'), (1, '795.040')] +[2023-10-08 17:26:29,523][21195] Updated weights for policy 0, policy_version 42600 (0.0008) +[2023-10-08 17:26:29,537][21194] Updated weights for policy 1, policy_version 42280 (0.0007) +[2023-10-08 17:26:29,889][21195] Updated weights for policy 0, policy_version 42610 (0.0008) +[2023-10-08 17:26:29,912][21194] Updated weights for policy 1, policy_version 42290 (0.0007) +[2023-10-08 17:26:30,265][21195] Updated weights for policy 0, policy_version 42620 (0.0009) +[2023-10-08 17:26:30,282][21194] Updated weights for policy 1, policy_version 42300 (0.0008) +[2023-10-08 17:26:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 86966272. Throughput: 0: 1743.2, 1: 1692.6. Samples: 21754212. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:26:33,803][19739] Avg episode reward: [(0, '730.260'), (1, '795.040')] +[2023-10-08 17:26:34,033][21195] Updated weights for policy 0, policy_version 42630 (0.0008) +[2023-10-08 17:26:34,246][21194] Updated weights for policy 1, policy_version 42310 (0.0008) +[2023-10-08 17:26:34,392][21195] Updated weights for policy 0, policy_version 42640 (0.0009) +[2023-10-08 17:26:34,620][21194] Updated weights for policy 1, policy_version 42320 (0.0009) +[2023-10-08 17:26:34,762][21195] Updated weights for policy 0, policy_version 42650 (0.0010) +[2023-10-08 17:26:34,982][21194] Updated weights for policy 1, policy_version 42330 (0.0008) +[2023-10-08 17:26:38,625][21195] Updated weights for policy 0, policy_version 42660 (0.0010) +[2023-10-08 17:26:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 87031808. Throughput: 0: 1726.5, 1: 1716.6. Samples: 21769508. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:26:38,803][19739] Avg episode reward: [(0, '730.260'), (1, '780.370')] +[2023-10-08 17:26:38,915][21194] Updated weights for policy 1, policy_version 42340 (0.0008) +[2023-10-08 17:26:39,002][21195] Updated weights for policy 0, policy_version 42670 (0.0008) +[2023-10-08 17:26:39,276][21194] Updated weights for policy 1, policy_version 42350 (0.0007) +[2023-10-08 17:26:39,358][21195] Updated weights for policy 0, policy_version 42680 (0.0009) +[2023-10-08 17:26:39,646][21194] Updated weights for policy 1, policy_version 42360 (0.0008) +[2023-10-08 17:26:43,295][21195] Updated weights for policy 0, policy_version 42690 (0.0008) +[2023-10-08 17:26:43,498][21194] Updated weights for policy 1, policy_version 42370 (0.0010) +[2023-10-08 17:26:43,668][21195] Updated weights for policy 0, policy_version 42700 (0.0007) +[2023-10-08 17:26:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 87097344. Throughput: 0: 1743.9, 1: 1722.9. Samples: 21790990. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:26:43,803][19739] Avg episode reward: [(0, '730.290'), (1, '780.370')] +[2023-10-08 17:26:43,879][21194] Updated weights for policy 1, policy_version 42380 (0.0007) +[2023-10-08 17:26:44,035][21195] Updated weights for policy 0, policy_version 42710 (0.0008) +[2023-10-08 17:26:44,253][21194] Updated weights for policy 1, policy_version 42390 (0.0007) +[2023-10-08 17:26:44,404][21195] Updated weights for policy 0, policy_version 42720 (0.0008) +[2023-10-08 17:26:44,615][21194] Updated weights for policy 1, policy_version 42400 (0.0009) +[2023-10-08 17:26:48,318][21195] Updated weights for policy 0, policy_version 42730 (0.0007) +[2023-10-08 17:26:48,422][21194] Updated weights for policy 1, policy_version 42410 (0.0008) +[2023-10-08 17:26:48,692][21195] Updated weights for policy 0, policy_version 42740 (0.0009) +[2023-10-08 17:26:48,788][21194] Updated weights for policy 1, policy_version 42420 (0.0008) +[2023-10-08 17:26:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 87162880. Throughput: 0: 1726.4, 1: 1711.9. Samples: 21805522. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:26:48,803][19739] Avg episode reward: [(0, '749.690'), (1, '780.370')] +[2023-10-08 17:26:49,052][21195] Updated weights for policy 0, policy_version 42750 (0.0009) +[2023-10-08 17:26:49,155][21194] Updated weights for policy 1, policy_version 42430 (0.0007) +[2023-10-08 17:26:53,110][21195] Updated weights for policy 0, policy_version 42760 (0.0007) +[2023-10-08 17:26:53,212][21194] Updated weights for policy 1, policy_version 42440 (0.0009) +[2023-10-08 17:26:53,478][21195] Updated weights for policy 0, policy_version 42770 (0.0008) +[2023-10-08 17:26:53,578][21194] Updated weights for policy 1, policy_version 42450 (0.0008) +[2023-10-08 17:26:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.3, 300 sec: 13662.6). Total num frames: 87228416. Throughput: 0: 1743.4, 1: 1722.9. Samples: 21821392. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:26:53,803][19739] Avg episode reward: [(0, '749.690'), (1, '780.370')] +[2023-10-08 17:26:53,845][21195] Updated weights for policy 0, policy_version 42780 (0.0009) +[2023-10-08 17:26:53,948][21194] Updated weights for policy 1, policy_version 42460 (0.0010) +[2023-10-08 17:26:57,873][21195] Updated weights for policy 0, policy_version 42790 (0.0009) +[2023-10-08 17:26:57,928][21194] Updated weights for policy 1, policy_version 42470 (0.0008) +[2023-10-08 17:26:58,234][21195] Updated weights for policy 0, policy_version 42800 (0.0009) +[2023-10-08 17:26:58,296][21194] Updated weights for policy 1, policy_version 42480 (0.0007) +[2023-10-08 17:26:58,600][21195] Updated weights for policy 0, policy_version 42810 (0.0008) +[2023-10-08 17:26:58,657][21194] Updated weights for policy 1, policy_version 42490 (0.0007) +[2023-10-08 17:26:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.3, 300 sec: 13662.6). Total num frames: 87293952. Throughput: 0: 1736.6, 1: 1721.9. Samples: 21842400. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:26:58,803][19739] Avg episode reward: [(0, '749.100'), (1, '779.610')] +[2023-10-08 17:27:02,542][21195] Updated weights for policy 0, policy_version 42820 (0.0008) +[2023-10-08 17:27:02,614][21194] Updated weights for policy 1, policy_version 42500 (0.0008) +[2023-10-08 17:27:02,909][21195] Updated weights for policy 0, policy_version 42830 (0.0008) +[2023-10-08 17:27:02,984][21194] Updated weights for policy 1, policy_version 42510 (0.0009) +[2023-10-08 17:27:03,284][21195] Updated weights for policy 0, policy_version 42840 (0.0008) +[2023-10-08 17:27:03,342][21194] Updated weights for policy 1, policy_version 42520 (0.0008) +[2023-10-08 17:27:03,802][19739] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 87425024. Throughput: 0: 1710.6, 1: 1723.2. Samples: 21856858. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:27:03,803][19739] Avg episode reward: [(0, '749.100'), (1, '779.610')] +[2023-10-08 17:27:07,125][21195] Updated weights for policy 0, policy_version 42850 (0.0008) +[2023-10-08 17:27:07,208][21194] Updated weights for policy 1, policy_version 42530 (0.0008) +[2023-10-08 17:27:07,496][21195] Updated weights for policy 0, policy_version 42860 (0.0008) +[2023-10-08 17:27:07,569][21194] Updated weights for policy 1, policy_version 42540 (0.0007) +[2023-10-08 17:27:07,857][21195] Updated weights for policy 0, policy_version 42870 (0.0008) +[2023-10-08 17:27:07,934][21194] Updated weights for policy 1, policy_version 42550 (0.0010) +[2023-10-08 17:27:08,230][21195] Updated weights for policy 0, policy_version 42880 (0.0009) +[2023-10-08 17:27:08,290][21194] Updated weights for policy 1, policy_version 42560 (0.0008) +[2023-10-08 17:27:08,803][19739] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 87490560. Throughput: 0: 1745.8, 1: 1723.7. Samples: 21873766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:27:08,803][19739] Avg episode reward: [(0, '749.100'), (1, '793.880')] +[2023-10-08 17:27:12,250][21194] Updated weights for policy 1, policy_version 42570 (0.0008) +[2023-10-08 17:27:12,352][21195] Updated weights for policy 0, policy_version 42890 (0.0008) +[2023-10-08 17:27:12,614][21194] Updated weights for policy 1, policy_version 42580 (0.0009) +[2023-10-08 17:27:12,723][21195] Updated weights for policy 0, policy_version 42900 (0.0010) +[2023-10-08 17:27:12,991][21194] Updated weights for policy 1, policy_version 42590 (0.0009) +[2023-10-08 17:27:13,093][21195] Updated weights for policy 0, policy_version 42910 (0.0007) +[2023-10-08 17:27:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 87556096. Throughput: 0: 1729.1, 1: 1701.2. Samples: 21893172. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:27:13,804][19739] Avg episode reward: [(0, '749.100'), (1, '793.880')] +[2023-10-08 17:27:13,816][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000042592_43614208.pth... +[2023-10-08 17:27:13,816][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000042912_43941888.pth... +[2023-10-08 17:27:13,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000040992_41975808.pth +[2023-10-08 17:27:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000041280_42270720.pth +[2023-10-08 17:27:16,903][21194] Updated weights for policy 1, policy_version 42600 (0.0007) +[2023-10-08 17:27:16,920][21195] Updated weights for policy 0, policy_version 42920 (0.0008) +[2023-10-08 17:27:17,275][21194] Updated weights for policy 1, policy_version 42610 (0.0008) +[2023-10-08 17:27:17,291][21195] Updated weights for policy 0, policy_version 42930 (0.0008) +[2023-10-08 17:27:17,634][21194] Updated weights for policy 1, policy_version 42620 (0.0008) +[2023-10-08 17:27:17,650][21195] Updated weights for policy 0, policy_version 42940 (0.0009) +[2023-10-08 17:27:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 87621632. Throughput: 0: 1717.1, 1: 1728.2. Samples: 21909252. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:27:18,804][19739] Avg episode reward: [(0, '749.100'), (1, '793.880')] +[2023-10-08 17:27:21,494][21195] Updated weights for policy 0, policy_version 42950 (0.0008) +[2023-10-08 17:27:21,650][21194] Updated weights for policy 1, policy_version 42630 (0.0007) +[2023-10-08 17:27:21,860][21195] Updated weights for policy 0, policy_version 42960 (0.0008) +[2023-10-08 17:27:22,007][21194] Updated weights for policy 1, policy_version 42640 (0.0007) +[2023-10-08 17:27:22,232][21195] Updated weights for policy 0, policy_version 42970 (0.0009) +[2023-10-08 17:27:22,384][21194] Updated weights for policy 1, policy_version 42650 (0.0008) +[2023-10-08 17:27:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 87687168. Throughput: 0: 1734.1, 1: 1714.4. Samples: 21924690. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:27:23,803][19739] Avg episode reward: [(0, '755.120'), (1, '793.880')] +[2023-10-08 17:27:26,192][21195] Updated weights for policy 0, policy_version 42980 (0.0007) +[2023-10-08 17:27:26,234][21194] Updated weights for policy 1, policy_version 42660 (0.0009) +[2023-10-08 17:27:26,551][21195] Updated weights for policy 0, policy_version 42990 (0.0007) +[2023-10-08 17:27:26,590][21194] Updated weights for policy 1, policy_version 42670 (0.0008) +[2023-10-08 17:27:26,917][21195] Updated weights for policy 0, policy_version 43000 (0.0009) +[2023-10-08 17:27:26,957][21194] Updated weights for policy 1, policy_version 42680 (0.0008) +[2023-10-08 17:27:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 87752704. Throughput: 0: 1718.2, 1: 1699.0. Samples: 21944764. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:27:28,803][19739] Avg episode reward: [(0, '755.120'), (1, '799.270')] +[2023-10-08 17:27:30,869][21195] Updated weights for policy 0, policy_version 43010 (0.0008) +[2023-10-08 17:27:31,139][21194] Updated weights for policy 1, policy_version 42690 (0.0007) +[2023-10-08 17:27:31,238][21195] Updated weights for policy 0, policy_version 43020 (0.0008) +[2023-10-08 17:27:31,542][21194] Updated weights for policy 1, policy_version 42700 (0.0007) +[2023-10-08 17:27:31,594][21195] Updated weights for policy 0, policy_version 43030 (0.0007) +[2023-10-08 17:27:31,911][21194] Updated weights for policy 1, policy_version 42710 (0.0009) +[2023-10-08 17:27:31,964][21195] Updated weights for policy 0, policy_version 43040 (0.0008) +[2023-10-08 17:27:32,273][21194] Updated weights for policy 1, policy_version 42720 (0.0008) +[2023-10-08 17:27:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 87818240. Throughput: 0: 1735.2, 1: 1727.2. Samples: 21961330. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:27:33,803][19739] Avg episode reward: [(0, '755.370'), (1, '799.270')] +[2023-10-08 17:27:35,806][21195] Updated weights for policy 0, policy_version 43050 (0.0008) +[2023-10-08 17:27:36,066][21194] Updated weights for policy 1, policy_version 42730 (0.0008) +[2023-10-08 17:27:36,179][21195] Updated weights for policy 0, policy_version 43060 (0.0008) +[2023-10-08 17:27:36,428][21194] Updated weights for policy 1, policy_version 42740 (0.0007) +[2023-10-08 17:27:36,542][21195] Updated weights for policy 0, policy_version 43070 (0.0008) +[2023-10-08 17:27:36,787][21194] Updated weights for policy 1, policy_version 42750 (0.0010) +[2023-10-08 17:27:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 87883776. Throughput: 0: 1721.2, 1: 1705.8. Samples: 21975604. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:27:38,803][19739] Avg episode reward: [(0, '740.910'), (1, '799.270')] +[2023-10-08 17:27:40,630][21195] Updated weights for policy 0, policy_version 43080 (0.0009) +[2023-10-08 17:27:40,792][21194] Updated weights for policy 1, policy_version 42760 (0.0007) +[2023-10-08 17:27:41,009][21195] Updated weights for policy 0, policy_version 43090 (0.0008) +[2023-10-08 17:27:41,153][21194] Updated weights for policy 1, policy_version 42770 (0.0008) +[2023-10-08 17:27:41,367][21195] Updated weights for policy 0, policy_version 43100 (0.0008) +[2023-10-08 17:27:41,514][21194] Updated weights for policy 1, policy_version 42780 (0.0008) +[2023-10-08 17:27:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 87949312. Throughput: 0: 1723.2, 1: 1713.0. Samples: 21997030. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 17:27:43,804][19739] Avg episode reward: [(0, '740.920'), (1, '799.270')] +[2023-10-08 17:27:45,204][21195] Updated weights for policy 0, policy_version 43110 (0.0009) +[2023-10-08 17:27:45,380][21194] Updated weights for policy 1, policy_version 42790 (0.0009) +[2023-10-08 17:27:45,559][21195] Updated weights for policy 0, policy_version 43120 (0.0007) +[2023-10-08 17:27:45,736][21194] Updated weights for policy 1, policy_version 42800 (0.0008) +[2023-10-08 17:27:45,925][21195] Updated weights for policy 0, policy_version 43130 (0.0009) +[2023-10-08 17:27:46,099][21194] Updated weights for policy 1, policy_version 42810 (0.0008) +[2023-10-08 17:27:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 88014848. Throughput: 0: 1751.9, 1: 1716.1. Samples: 22012918. Policy #0 lag: (min: 16.0, avg: 42.7, max: 48.0) +[2023-10-08 17:27:48,803][19739] Avg episode reward: [(0, '740.920'), (1, '814.370')] +[2023-10-08 17:27:49,988][21195] Updated weights for policy 0, policy_version 43140 (0.0008) +[2023-10-08 17:27:50,110][21194] Updated weights for policy 1, policy_version 42820 (0.0009) +[2023-10-08 17:27:50,357][21195] Updated weights for policy 0, policy_version 43150 (0.0007) +[2023-10-08 17:27:50,472][21194] Updated weights for policy 1, policy_version 42830 (0.0010) +[2023-10-08 17:27:50,722][21195] Updated weights for policy 0, policy_version 43160 (0.0008) +[2023-10-08 17:27:50,831][21194] Updated weights for policy 1, policy_version 42840 (0.0007) +[2023-10-08 17:27:53,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 88080384. Throughput: 0: 1716.7, 1: 1706.7. Samples: 22027816. Policy #0 lag: (min: 16.0, avg: 42.7, max: 48.0) +[2023-10-08 17:27:53,803][19739] Avg episode reward: [(0, '740.920'), (1, '804.290')] +[2023-10-08 17:27:54,562][21195] Updated weights for policy 0, policy_version 43170 (0.0008) +[2023-10-08 17:27:54,929][21194] Updated weights for policy 1, policy_version 42850 (0.0009) +[2023-10-08 17:27:54,932][21195] Updated weights for policy 0, policy_version 43180 (0.0007) +[2023-10-08 17:27:55,300][21195] Updated weights for policy 0, policy_version 43190 (0.0009) +[2023-10-08 17:27:55,300][21194] Updated weights for policy 1, policy_version 42860 (0.0008) +[2023-10-08 17:27:55,662][21195] Updated weights for policy 0, policy_version 43200 (0.0010) +[2023-10-08 17:27:55,666][21194] Updated weights for policy 1, policy_version 42870 (0.0007) +[2023-10-08 17:27:56,029][21194] Updated weights for policy 1, policy_version 42880 (0.0007) +[2023-10-08 17:27:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 88145920. Throughput: 0: 1738.5, 1: 1726.5. Samples: 22049096. Policy #0 lag: (min: 16.0, avg: 42.7, max: 48.0) +[2023-10-08 17:27:58,803][19739] Avg episode reward: [(0, '740.920'), (1, '818.290')] +[2023-10-08 17:27:59,651][21195] Updated weights for policy 0, policy_version 43210 (0.0008) +[2023-10-08 17:28:00,029][21195] Updated weights for policy 0, policy_version 43220 (0.0007) +[2023-10-08 17:28:00,174][21194] Updated weights for policy 1, policy_version 42890 (0.0007) +[2023-10-08 17:28:00,393][21195] Updated weights for policy 0, policy_version 43230 (0.0008) +[2023-10-08 17:28:00,549][21194] Updated weights for policy 1, policy_version 42900 (0.0007) +[2023-10-08 17:28:00,914][21194] Updated weights for policy 1, policy_version 42910 (0.0007) +[2023-10-08 17:28:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 88211456. Throughput: 0: 1745.7, 1: 1700.6. Samples: 22064336. Policy #0 lag: (min: 16.0, avg: 42.7, max: 48.0) +[2023-10-08 17:28:03,803][19739] Avg episode reward: [(0, '740.920'), (1, '803.270')] +[2023-10-08 17:28:04,270][21195] Updated weights for policy 0, policy_version 43240 (0.0010) +[2023-10-08 17:28:04,640][21195] Updated weights for policy 0, policy_version 43250 (0.0007) +[2023-10-08 17:28:04,866][21194] Updated weights for policy 1, policy_version 42920 (0.0007) +[2023-10-08 17:28:05,015][21195] Updated weights for policy 0, policy_version 43260 (0.0007) +[2023-10-08 17:28:05,225][21194] Updated weights for policy 1, policy_version 42930 (0.0007) +[2023-10-08 17:28:05,588][21194] Updated weights for policy 1, policy_version 42940 (0.0007) +[2023-10-08 17:28:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 88276992. Throughput: 0: 1726.6, 1: 1721.3. Samples: 22079848. Policy #0 lag: (min: 16.0, avg: 42.7, max: 48.0) +[2023-10-08 17:28:08,803][19739] Avg episode reward: [(0, '740.920'), (1, '800.170')] +[2023-10-08 17:28:08,948][21195] Updated weights for policy 0, policy_version 43270 (0.0009) +[2023-10-08 17:28:09,311][21195] Updated weights for policy 0, policy_version 43280 (0.0008) +[2023-10-08 17:28:09,371][21194] Updated weights for policy 1, policy_version 42950 (0.0009) +[2023-10-08 17:28:09,681][21195] Updated weights for policy 0, policy_version 43290 (0.0007) +[2023-10-08 17:28:09,733][21194] Updated weights for policy 1, policy_version 42960 (0.0009) +[2023-10-08 17:28:10,099][21194] Updated weights for policy 1, policy_version 42970 (0.0009) +[2023-10-08 17:28:13,513][21195] Updated weights for policy 0, policy_version 43300 (0.0008) +[2023-10-08 17:28:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 88342528. Throughput: 0: 1742.4, 1: 1733.6. Samples: 22101184. Policy #0 lag: (min: 16.0, avg: 42.7, max: 48.0) +[2023-10-08 17:28:13,803][19739] Avg episode reward: [(0, '752.070'), (1, '800.170')] +[2023-10-08 17:28:13,891][21195] Updated weights for policy 0, policy_version 43310 (0.0009) +[2023-10-08 17:28:13,936][21194] Updated weights for policy 1, policy_version 42980 (0.0009) +[2023-10-08 17:28:14,257][21195] Updated weights for policy 0, policy_version 43320 (0.0009) +[2023-10-08 17:28:14,295][21194] Updated weights for policy 1, policy_version 42990 (0.0009) +[2023-10-08 17:28:14,654][21194] Updated weights for policy 1, policy_version 43000 (0.0009) +[2023-10-08 17:28:18,428][21195] Updated weights for policy 0, policy_version 43330 (0.0008) +[2023-10-08 17:28:18,743][21194] Updated weights for policy 1, policy_version 43010 (0.0007) +[2023-10-08 17:28:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 88408064. Throughput: 0: 1725.0, 1: 1707.7. Samples: 22115802. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 17:28:18,803][21195] Updated weights for policy 0, policy_version 43340 (0.0008) +[2023-10-08 17:28:18,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.650')] +[2023-10-08 17:28:19,115][21194] Updated weights for policy 1, policy_version 43020 (0.0007) +[2023-10-08 17:28:19,171][21195] Updated weights for policy 0, policy_version 43350 (0.0007) +[2023-10-08 17:28:19,475][21194] Updated weights for policy 1, policy_version 43030 (0.0008) +[2023-10-08 17:28:19,536][21195] Updated weights for policy 0, policy_version 43360 (0.0008) +[2023-10-08 17:28:19,846][21194] Updated weights for policy 1, policy_version 43040 (0.0008) +[2023-10-08 17:28:23,603][21195] Updated weights for policy 0, policy_version 43370 (0.0008) +[2023-10-08 17:28:23,791][21194] Updated weights for policy 1, policy_version 43050 (0.0010) +[2023-10-08 17:28:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 88473600. Throughput: 0: 1731.0, 1: 1728.9. Samples: 22131300. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 17:28:23,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.870')] +[2023-10-08 17:28:23,967][21195] Updated weights for policy 0, policy_version 43380 (0.0008) +[2023-10-08 17:28:24,166][21194] Updated weights for policy 1, policy_version 43060 (0.0007) +[2023-10-08 17:28:24,328][21195] Updated weights for policy 0, policy_version 43390 (0.0008) +[2023-10-08 17:28:24,541][21194] Updated weights for policy 1, policy_version 43070 (0.0007) +[2023-10-08 17:28:28,348][21195] Updated weights for policy 0, policy_version 43400 (0.0008) +[2023-10-08 17:28:28,475][21194] Updated weights for policy 1, policy_version 43080 (0.0007) +[2023-10-08 17:28:28,718][21195] Updated weights for policy 0, policy_version 43410 (0.0008) +[2023-10-08 17:28:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 88539136. Throughput: 0: 1727.4, 1: 1728.0. Samples: 22152526. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 17:28:28,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.870')] +[2023-10-08 17:28:28,843][21194] Updated weights for policy 1, policy_version 43090 (0.0007) +[2023-10-08 17:28:29,088][21195] Updated weights for policy 0, policy_version 43420 (0.0007) +[2023-10-08 17:28:29,212][21194] Updated weights for policy 1, policy_version 43100 (0.0007) +[2023-10-08 17:28:32,814][21195] Updated weights for policy 0, policy_version 43430 (0.0009) +[2023-10-08 17:28:33,183][21195] Updated weights for policy 0, policy_version 43440 (0.0008) +[2023-10-08 17:28:33,231][21194] Updated weights for policy 1, policy_version 43110 (0.0008) +[2023-10-08 17:28:33,556][21195] Updated weights for policy 0, policy_version 43450 (0.0009) +[2023-10-08 17:28:33,598][21194] Updated weights for policy 1, policy_version 43120 (0.0009) +[2023-10-08 17:28:33,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 88637440. Throughput: 0: 1698.5, 1: 1718.8. Samples: 22166696. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 17:28:33,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.890')] +[2023-10-08 17:28:33,961][21194] Updated weights for policy 1, policy_version 43130 (0.0009) +[2023-10-08 17:28:37,346][21195] Updated weights for policy 0, policy_version 43460 (0.0009) +[2023-10-08 17:28:37,718][21195] Updated weights for policy 0, policy_version 43470 (0.0007) +[2023-10-08 17:28:37,984][21194] Updated weights for policy 1, policy_version 43140 (0.0007) +[2023-10-08 17:28:38,091][21195] Updated weights for policy 0, policy_version 43480 (0.0007) +[2023-10-08 17:28:38,350][21194] Updated weights for policy 1, policy_version 43150 (0.0008) +[2023-10-08 17:28:38,726][21194] Updated weights for policy 1, policy_version 43160 (0.0007) +[2023-10-08 17:28:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 88702976. Throughput: 0: 1730.8, 1: 1723.2. Samples: 22183250. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 17:28:38,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.890')] +[2023-10-08 17:28:42,089][21195] Updated weights for policy 0, policy_version 43490 (0.0007) +[2023-10-08 17:28:42,457][21195] Updated weights for policy 0, policy_version 43500 (0.0008) +[2023-10-08 17:28:42,684][21194] Updated weights for policy 1, policy_version 43170 (0.0009) +[2023-10-08 17:28:42,822][21195] Updated weights for policy 0, policy_version 43510 (0.0009) +[2023-10-08 17:28:43,037][21194] Updated weights for policy 1, policy_version 43180 (0.0007) +[2023-10-08 17:28:43,181][21195] Updated weights for policy 0, policy_version 43520 (0.0007) +[2023-10-08 17:28:43,406][21194] Updated weights for policy 1, policy_version 43190 (0.0007) +[2023-10-08 17:28:43,768][21194] Updated weights for policy 1, policy_version 43200 (0.0007) +[2023-10-08 17:28:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 88801280. Throughput: 0: 1708.1, 1: 1719.7. Samples: 22203350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:28:43,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.890')] +[2023-10-08 17:28:47,346][21195] Updated weights for policy 0, policy_version 43530 (0.0008) +[2023-10-08 17:28:47,700][21194] Updated weights for policy 1, policy_version 43210 (0.0009) +[2023-10-08 17:28:47,706][21195] Updated weights for policy 0, policy_version 43540 (0.0009) +[2023-10-08 17:28:48,057][21194] Updated weights for policy 1, policy_version 43220 (0.0008) +[2023-10-08 17:28:48,075][21195] Updated weights for policy 0, policy_version 43550 (0.0007) +[2023-10-08 17:28:48,417][21194] Updated weights for policy 1, policy_version 43230 (0.0009) +[2023-10-08 17:28:48,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 88866816. Throughput: 0: 1695.2, 1: 1730.8. Samples: 22218506. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:28:48,803][19739] Avg episode reward: [(0, '752.210'), (1, '776.890')] +[2023-10-08 17:28:51,867][21195] Updated weights for policy 0, policy_version 43560 (0.0010) +[2023-10-08 17:28:52,231][21195] Updated weights for policy 0, policy_version 43570 (0.0010) +[2023-10-08 17:28:52,539][21194] Updated weights for policy 1, policy_version 43240 (0.0007) +[2023-10-08 17:28:52,597][21195] Updated weights for policy 0, policy_version 43580 (0.0008) +[2023-10-08 17:28:52,900][21194] Updated weights for policy 1, policy_version 43250 (0.0007) +[2023-10-08 17:28:53,274][21194] Updated weights for policy 1, policy_version 43260 (0.0007) +[2023-10-08 17:28:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 88932352. Throughput: 0: 1723.5, 1: 1719.7. Samples: 22234790. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:28:53,803][19739] Avg episode reward: [(0, '752.210'), (1, '791.840')] +[2023-10-08 17:28:56,585][21195] Updated weights for policy 0, policy_version 43590 (0.0008) +[2023-10-08 17:28:56,957][21195] Updated weights for policy 0, policy_version 43600 (0.0007) +[2023-10-08 17:28:57,158][21194] Updated weights for policy 1, policy_version 43270 (0.0009) +[2023-10-08 17:28:57,323][21195] Updated weights for policy 0, policy_version 43610 (0.0008) +[2023-10-08 17:28:57,527][21194] Updated weights for policy 1, policy_version 43280 (0.0008) +[2023-10-08 17:28:57,888][21194] Updated weights for policy 1, policy_version 43290 (0.0008) +[2023-10-08 17:28:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 88997888. Throughput: 0: 1697.4, 1: 1694.7. Samples: 22253828. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:28:58,803][19739] Avg episode reward: [(0, '752.210'), (1, '791.840')] +[2023-10-08 17:29:01,280][21195] Updated weights for policy 0, policy_version 43620 (0.0008) +[2023-10-08 17:29:01,643][21195] Updated weights for policy 0, policy_version 43630 (0.0008) +[2023-10-08 17:29:01,787][21194] Updated weights for policy 1, policy_version 43300 (0.0008) +[2023-10-08 17:29:02,013][21195] Updated weights for policy 0, policy_version 43640 (0.0008) +[2023-10-08 17:29:02,142][21194] Updated weights for policy 1, policy_version 43310 (0.0009) +[2023-10-08 17:29:02,505][21194] Updated weights for policy 1, policy_version 43320 (0.0009) +[2023-10-08 17:29:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 89063424. Throughput: 0: 1713.2, 1: 1719.9. Samples: 22270288. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:29:03,803][19739] Avg episode reward: [(0, '752.450'), (1, '796.510')] +[2023-10-08 17:29:06,073][21195] Updated weights for policy 0, policy_version 43650 (0.0007) +[2023-10-08 17:29:06,446][21195] Updated weights for policy 0, policy_version 43660 (0.0009) +[2023-10-08 17:29:06,710][21194] Updated weights for policy 1, policy_version 43330 (0.0008) +[2023-10-08 17:29:06,822][21195] Updated weights for policy 0, policy_version 43670 (0.0008) +[2023-10-08 17:29:07,120][21194] Updated weights for policy 1, policy_version 43340 (0.0009) +[2023-10-08 17:29:07,188][21195] Updated weights for policy 0, policy_version 43680 (0.0008) +[2023-10-08 17:29:07,485][21194] Updated weights for policy 1, policy_version 43350 (0.0008) +[2023-10-08 17:29:07,852][21194] Updated weights for policy 1, policy_version 43360 (0.0008) +[2023-10-08 17:29:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 89128960. Throughput: 0: 1714.8, 1: 1709.9. Samples: 22285412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:29:08,803][19739] Avg episode reward: [(0, '754.060'), (1, '796.510')] +[2023-10-08 17:29:11,219][21195] Updated weights for policy 0, policy_version 43690 (0.0008) +[2023-10-08 17:29:11,583][21195] Updated weights for policy 0, policy_version 43700 (0.0009) +[2023-10-08 17:29:11,713][21194] Updated weights for policy 1, policy_version 43370 (0.0007) +[2023-10-08 17:29:11,943][21195] Updated weights for policy 0, policy_version 43710 (0.0009) +[2023-10-08 17:29:12,078][21194] Updated weights for policy 1, policy_version 43380 (0.0008) +[2023-10-08 17:29:12,449][21194] Updated weights for policy 1, policy_version 43390 (0.0009) +[2023-10-08 17:29:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 89194496. Throughput: 0: 1707.7, 1: 1683.6. Samples: 22305134. Policy #0 lag: (min: 18.0, avg: 20.2, max: 49.0) +[2023-10-08 17:29:13,803][19739] Avg episode reward: [(0, '754.060'), (1, '796.510')] +[2023-10-08 17:29:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000043712_44761088.pth... +[2023-10-08 17:29:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000043392_44433408.pth... +[2023-10-08 17:29:13,847][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000041792_42795008.pth +[2023-10-08 17:29:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000042112_43122688.pth +[2023-10-08 17:29:15,838][21195] Updated weights for policy 0, policy_version 43720 (0.0008) +[2023-10-08 17:29:16,201][21195] Updated weights for policy 0, policy_version 43730 (0.0009) +[2023-10-08 17:29:16,494][21194] Updated weights for policy 1, policy_version 43400 (0.0008) +[2023-10-08 17:29:16,573][21195] Updated weights for policy 0, policy_version 43740 (0.0008) +[2023-10-08 17:29:16,865][21194] Updated weights for policy 1, policy_version 43410 (0.0007) +[2023-10-08 17:29:17,234][21194] Updated weights for policy 1, policy_version 43420 (0.0009) +[2023-10-08 17:29:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 89260032. Throughput: 0: 1733.1, 1: 1714.0. Samples: 22321814. Policy #0 lag: (min: 18.0, avg: 20.2, max: 49.0) +[2023-10-08 17:29:18,803][19739] Avg episode reward: [(0, '754.060'), (1, '796.510')] +[2023-10-08 17:29:20,503][21195] Updated weights for policy 0, policy_version 43750 (0.0008) +[2023-10-08 17:29:20,871][21195] Updated weights for policy 0, policy_version 43760 (0.0009) +[2023-10-08 17:29:21,207][21194] Updated weights for policy 1, policy_version 43430 (0.0007) +[2023-10-08 17:29:21,231][21195] Updated weights for policy 0, policy_version 43770 (0.0007) +[2023-10-08 17:29:21,574][21194] Updated weights for policy 1, policy_version 43440 (0.0011) +[2023-10-08 17:29:21,946][21194] Updated weights for policy 1, policy_version 43450 (0.0010) +[2023-10-08 17:29:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 89325568. Throughput: 0: 1699.7, 1: 1691.3. Samples: 22335846. Policy #0 lag: (min: 18.0, avg: 20.2, max: 49.0) +[2023-10-08 17:29:23,804][19739] Avg episode reward: [(0, '754.400'), (1, '811.620')] +[2023-10-08 17:29:25,376][21195] Updated weights for policy 0, policy_version 43780 (0.0008) +[2023-10-08 17:29:25,743][21195] Updated weights for policy 0, policy_version 43790 (0.0008) +[2023-10-08 17:29:26,073][21194] Updated weights for policy 1, policy_version 43460 (0.0009) +[2023-10-08 17:29:26,115][21195] Updated weights for policy 0, policy_version 43800 (0.0007) +[2023-10-08 17:29:26,445][21194] Updated weights for policy 1, policy_version 43470 (0.0008) +[2023-10-08 17:29:26,802][21194] Updated weights for policy 1, policy_version 43480 (0.0007) +[2023-10-08 17:29:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 89391104. Throughput: 0: 1721.2, 1: 1693.5. Samples: 22357012. Policy #0 lag: (min: 18.0, avg: 20.2, max: 49.0) +[2023-10-08 17:29:28,803][19739] Avg episode reward: [(0, '741.240'), (1, '811.620')] +[2023-10-08 17:29:29,997][21195] Updated weights for policy 0, policy_version 43810 (0.0007) +[2023-10-08 17:29:30,357][21195] Updated weights for policy 0, policy_version 43820 (0.0008) +[2023-10-08 17:29:30,733][21195] Updated weights for policy 0, policy_version 43830 (0.0007) +[2023-10-08 17:29:30,766][21194] Updated weights for policy 1, policy_version 43490 (0.0008) +[2023-10-08 17:29:31,101][21195] Updated weights for policy 0, policy_version 43840 (0.0008) +[2023-10-08 17:29:31,122][21194] Updated weights for policy 1, policy_version 43500 (0.0008) +[2023-10-08 17:29:31,501][21194] Updated weights for policy 1, policy_version 43510 (0.0008) +[2023-10-08 17:29:31,860][21194] Updated weights for policy 1, policy_version 43520 (0.0007) +[2023-10-08 17:29:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 89456640. Throughput: 0: 1735.3, 1: 1705.0. Samples: 22373320. Policy #0 lag: (min: 18.0, avg: 20.2, max: 49.0) +[2023-10-08 17:29:33,803][19739] Avg episode reward: [(0, '712.720'), (1, '811.620')] +[2023-10-08 17:29:35,090][21195] Updated weights for policy 0, policy_version 43850 (0.0007) +[2023-10-08 17:29:35,465][21195] Updated weights for policy 0, policy_version 43860 (0.0008) +[2023-10-08 17:29:35,831][21195] Updated weights for policy 0, policy_version 43870 (0.0007) +[2023-10-08 17:29:35,927][21194] Updated weights for policy 1, policy_version 43530 (0.0007) +[2023-10-08 17:29:36,305][21194] Updated weights for policy 1, policy_version 43540 (0.0011) +[2023-10-08 17:29:36,676][21194] Updated weights for policy 1, policy_version 43550 (0.0010) +[2023-10-08 17:29:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 89522176. Throughput: 0: 1704.0, 1: 1689.6. Samples: 22387502. Policy #0 lag: (min: 18.0, avg: 20.2, max: 49.0) +[2023-10-08 17:29:38,803][19739] Avg episode reward: [(0, '712.720'), (1, '811.620')] +[2023-10-08 17:29:39,862][21195] Updated weights for policy 0, policy_version 43880 (0.0009) +[2023-10-08 17:29:40,236][21195] Updated weights for policy 0, policy_version 43890 (0.0008) +[2023-10-08 17:29:40,534][21194] Updated weights for policy 1, policy_version 43560 (0.0008) +[2023-10-08 17:29:40,598][21195] Updated weights for policy 0, policy_version 43900 (0.0009) +[2023-10-08 17:29:40,903][21194] Updated weights for policy 1, policy_version 43570 (0.0008) +[2023-10-08 17:29:41,269][21194] Updated weights for policy 1, policy_version 43580 (0.0011) +[2023-10-08 17:29:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 89587712. Throughput: 0: 1725.2, 1: 1719.1. Samples: 22408820. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:29:43,803][19739] Avg episode reward: [(0, '703.880'), (1, '811.620')] +[2023-10-08 17:29:44,433][21195] Updated weights for policy 0, policy_version 43910 (0.0009) +[2023-10-08 17:29:44,803][21195] Updated weights for policy 0, policy_version 43920 (0.0007) +[2023-10-08 17:29:45,179][21195] Updated weights for policy 0, policy_version 43930 (0.0008) +[2023-10-08 17:29:45,182][21194] Updated weights for policy 1, policy_version 43590 (0.0008) +[2023-10-08 17:29:45,543][21194] Updated weights for policy 1, policy_version 43600 (0.0010) +[2023-10-08 17:29:45,921][21194] Updated weights for policy 1, policy_version 43610 (0.0009) +[2023-10-08 17:29:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 89653248. Throughput: 0: 1728.5, 1: 1699.0. Samples: 22424526. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:29:48,803][19739] Avg episode reward: [(0, '703.880'), (1, '811.620')] +[2023-10-08 17:29:49,082][21195] Updated weights for policy 0, policy_version 43940 (0.0008) +[2023-10-08 17:29:49,458][21195] Updated weights for policy 0, policy_version 43950 (0.0008) +[2023-10-08 17:29:49,817][21195] Updated weights for policy 0, policy_version 43960 (0.0009) +[2023-10-08 17:29:49,840][21194] Updated weights for policy 1, policy_version 43620 (0.0008) +[2023-10-08 17:29:50,204][21194] Updated weights for policy 1, policy_version 43630 (0.0008) +[2023-10-08 17:29:50,567][21194] Updated weights for policy 1, policy_version 43640 (0.0011) +[2023-10-08 17:29:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 89718784. Throughput: 0: 1715.9, 1: 1707.6. Samples: 22439470. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:29:53,804][19739] Avg episode reward: [(0, '703.880'), (1, '825.800')] +[2023-10-08 17:29:53,881][21195] Updated weights for policy 0, policy_version 43970 (0.0009) +[2023-10-08 17:29:54,246][21195] Updated weights for policy 0, policy_version 43980 (0.0008) +[2023-10-08 17:29:54,480][21194] Updated weights for policy 1, policy_version 43650 (0.0008) +[2023-10-08 17:29:54,622][21195] Updated weights for policy 0, policy_version 43990 (0.0007) +[2023-10-08 17:29:54,873][21194] Updated weights for policy 1, policy_version 43660 (0.0008) +[2023-10-08 17:29:54,989][21195] Updated weights for policy 0, policy_version 44000 (0.0008) +[2023-10-08 17:29:55,239][21194] Updated weights for policy 1, policy_version 43670 (0.0010) +[2023-10-08 17:29:55,603][21194] Updated weights for policy 1, policy_version 43680 (0.0009) +[2023-10-08 17:29:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 89784320. Throughput: 0: 1729.3, 1: 1730.2. Samples: 22460812. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:29:58,803][19739] Avg episode reward: [(0, '703.880'), (1, '825.800')] +[2023-10-08 17:29:58,915][21195] Updated weights for policy 0, policy_version 44010 (0.0007) +[2023-10-08 17:29:59,279][21195] Updated weights for policy 0, policy_version 44020 (0.0008) +[2023-10-08 17:29:59,499][21194] Updated weights for policy 1, policy_version 43690 (0.0009) +[2023-10-08 17:29:59,649][21195] Updated weights for policy 0, policy_version 44030 (0.0008) +[2023-10-08 17:29:59,869][21194] Updated weights for policy 1, policy_version 43700 (0.0008) +[2023-10-08 17:30:00,230][21194] Updated weights for policy 1, policy_version 43710 (0.0009) +[2023-10-08 17:30:03,558][21195] Updated weights for policy 0, policy_version 44040 (0.0008) +[2023-10-08 17:30:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 89849856. Throughput: 0: 1715.8, 1: 1699.3. Samples: 22475494. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:03,803][19739] Avg episode reward: [(0, '703.880'), (1, '817.640')] +[2023-10-08 17:30:03,929][21195] Updated weights for policy 0, policy_version 44050 (0.0009) +[2023-10-08 17:30:04,295][21195] Updated weights for policy 0, policy_version 44060 (0.0008) +[2023-10-08 17:30:04,409][21194] Updated weights for policy 1, policy_version 43720 (0.0008) +[2023-10-08 17:30:04,768][21194] Updated weights for policy 1, policy_version 43730 (0.0007) +[2023-10-08 17:30:05,136][21194] Updated weights for policy 1, policy_version 43740 (0.0007) +[2023-10-08 17:30:08,098][21195] Updated weights for policy 0, policy_version 44070 (0.0008) +[2023-10-08 17:30:08,466][21195] Updated weights for policy 0, policy_version 44080 (0.0007) +[2023-10-08 17:30:08,779][21194] Updated weights for policy 1, policy_version 43750 (0.0008) +[2023-10-08 17:30:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 89915392. Throughput: 0: 1733.3, 1: 1730.4. Samples: 22491710. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:08,803][19739] Avg episode reward: [(0, '703.880'), (1, '837.630')] +[2023-10-08 17:30:08,832][21195] Updated weights for policy 0, policy_version 44090 (0.0008) +[2023-10-08 17:30:09,146][21194] Updated weights for policy 1, policy_version 43760 (0.0008) +[2023-10-08 17:30:09,509][21194] Updated weights for policy 1, policy_version 43770 (0.0007) +[2023-10-08 17:30:12,780][21195] Updated weights for policy 0, policy_version 44100 (0.0008) +[2023-10-08 17:30:13,148][21195] Updated weights for policy 0, policy_version 44110 (0.0008) +[2023-10-08 17:30:13,506][21195] Updated weights for policy 0, policy_version 44120 (0.0007) +[2023-10-08 17:30:13,521][21194] Updated weights for policy 1, policy_version 43780 (0.0007) +[2023-10-08 17:30:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 89980928. Throughput: 0: 1727.3, 1: 1735.6. Samples: 22512842. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:13,803][19739] Avg episode reward: [(0, '703.880'), (1, '822.880')] +[2023-10-08 17:30:13,889][21194] Updated weights for policy 1, policy_version 43790 (0.0009) +[2023-10-08 17:30:14,254][21194] Updated weights for policy 1, policy_version 43800 (0.0009) +[2023-10-08 17:30:17,512][21195] Updated weights for policy 0, policy_version 44130 (0.0008) +[2023-10-08 17:30:17,873][21195] Updated weights for policy 0, policy_version 44140 (0.0010) +[2023-10-08 17:30:18,246][21195] Updated weights for policy 0, policy_version 44150 (0.0008) +[2023-10-08 17:30:18,256][21194] Updated weights for policy 1, policy_version 43810 (0.0008) +[2023-10-08 17:30:18,622][21195] Updated weights for policy 0, policy_version 44160 (0.0008) +[2023-10-08 17:30:18,626][21194] Updated weights for policy 1, policy_version 43820 (0.0008) +[2023-10-08 17:30:18,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 90079232. Throughput: 0: 1700.0, 1: 1713.7. Samples: 22526936. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:18,803][19739] Avg episode reward: [(0, '703.880'), (1, '817.150')] +[2023-10-08 17:30:18,997][21194] Updated weights for policy 1, policy_version 43830 (0.0009) +[2023-10-08 17:30:19,361][21194] Updated weights for policy 1, policy_version 43840 (0.0010) +[2023-10-08 17:30:22,593][21195] Updated weights for policy 0, policy_version 44170 (0.0011) +[2023-10-08 17:30:22,967][21195] Updated weights for policy 0, policy_version 44180 (0.0009) +[2023-10-08 17:30:23,214][21194] Updated weights for policy 1, policy_version 43850 (0.0009) +[2023-10-08 17:30:23,333][21195] Updated weights for policy 0, policy_version 44190 (0.0009) +[2023-10-08 17:30:23,583][21194] Updated weights for policy 1, policy_version 43860 (0.0007) +[2023-10-08 17:30:23,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 90144768. Throughput: 0: 1737.3, 1: 1736.6. Samples: 22543830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:23,803][19739] Avg episode reward: [(0, '703.880'), (1, '817.150')] +[2023-10-08 17:30:23,947][21194] Updated weights for policy 1, policy_version 43870 (0.0007) +[2023-10-08 17:30:27,290][21195] Updated weights for policy 0, policy_version 44200 (0.0009) +[2023-10-08 17:30:27,670][21195] Updated weights for policy 0, policy_version 44210 (0.0009) +[2023-10-08 17:30:28,032][21194] Updated weights for policy 1, policy_version 43880 (0.0008) +[2023-10-08 17:30:28,050][21195] Updated weights for policy 0, policy_version 44220 (0.0008) +[2023-10-08 17:30:28,392][21194] Updated weights for policy 1, policy_version 43890 (0.0008) +[2023-10-08 17:30:28,768][21194] Updated weights for policy 1, policy_version 43900 (0.0010) +[2023-10-08 17:30:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 90210304. Throughput: 0: 1714.5, 1: 1728.1. Samples: 22563738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:28,803][19739] Avg episode reward: [(0, '703.880'), (1, '831.160')] +[2023-10-08 17:30:32,072][21195] Updated weights for policy 0, policy_version 44230 (0.0007) +[2023-10-08 17:30:32,444][21195] Updated weights for policy 0, policy_version 44240 (0.0007) +[2023-10-08 17:30:32,814][21195] Updated weights for policy 0, policy_version 44250 (0.0008) +[2023-10-08 17:30:32,881][21194] Updated weights for policy 1, policy_version 43910 (0.0010) +[2023-10-08 17:30:33,252][21194] Updated weights for policy 1, policy_version 43920 (0.0009) +[2023-10-08 17:30:33,625][21194] Updated weights for policy 1, policy_version 43930 (0.0007) +[2023-10-08 17:30:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 90275840. Throughput: 0: 1699.3, 1: 1724.8. Samples: 22578612. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:33,804][19739] Avg episode reward: [(0, '718.880'), (1, '831.160')] +[2023-10-08 17:30:36,612][21195] Updated weights for policy 0, policy_version 44260 (0.0008) +[2023-10-08 17:30:36,987][21195] Updated weights for policy 0, policy_version 44270 (0.0008) +[2023-10-08 17:30:37,355][21195] Updated weights for policy 0, policy_version 44280 (0.0009) +[2023-10-08 17:30:37,545][21194] Updated weights for policy 1, policy_version 43940 (0.0008) +[2023-10-08 17:30:37,904][21194] Updated weights for policy 1, policy_version 43950 (0.0009) +[2023-10-08 17:30:38,274][21194] Updated weights for policy 1, policy_version 43960 (0.0007) +[2023-10-08 17:30:38,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 90374144. Throughput: 0: 1726.3, 1: 1732.2. Samples: 22595102. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:38,803][19739] Avg episode reward: [(0, '733.390'), (1, '831.160')] +[2023-10-08 17:30:41,341][21195] Updated weights for policy 0, policy_version 44290 (0.0009) +[2023-10-08 17:30:41,704][21195] Updated weights for policy 0, policy_version 44300 (0.0010) +[2023-10-08 17:30:42,077][21195] Updated weights for policy 0, policy_version 44310 (0.0007) +[2023-10-08 17:30:42,257][21194] Updated weights for policy 1, policy_version 43970 (0.0009) +[2023-10-08 17:30:42,435][21195] Updated weights for policy 0, policy_version 44320 (0.0008) +[2023-10-08 17:30:42,660][21194] Updated weights for policy 1, policy_version 43980 (0.0009) +[2023-10-08 17:30:43,025][21194] Updated weights for policy 1, policy_version 43990 (0.0008) +[2023-10-08 17:30:43,396][21194] Updated weights for policy 1, policy_version 44000 (0.0009) +[2023-10-08 17:30:43,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13773.6). Total num frames: 90439680. Throughput: 0: 1701.8, 1: 1717.3. Samples: 22614672. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:30:43,804][19739] Avg episode reward: [(0, '733.390'), (1, '832.000')] +[2023-10-08 17:30:46,351][21195] Updated weights for policy 0, policy_version 44330 (0.0007) +[2023-10-08 17:30:46,726][21195] Updated weights for policy 0, policy_version 44340 (0.0007) +[2023-10-08 17:30:47,095][21195] Updated weights for policy 0, policy_version 44350 (0.0007) +[2023-10-08 17:30:47,343][21194] Updated weights for policy 1, policy_version 44010 (0.0007) +[2023-10-08 17:30:47,706][21194] Updated weights for policy 1, policy_version 44020 (0.0009) +[2023-10-08 17:30:48,077][21194] Updated weights for policy 1, policy_version 44030 (0.0010) +[2023-10-08 17:30:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 90505216. Throughput: 0: 1721.5, 1: 1735.6. Samples: 22631062. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:30:48,803][19739] Avg episode reward: [(0, '748.620'), (1, '847.030')] +[2023-10-08 17:30:51,053][21195] Updated weights for policy 0, policy_version 44360 (0.0010) +[2023-10-08 17:30:51,429][21195] Updated weights for policy 0, policy_version 44370 (0.0010) +[2023-10-08 17:30:51,804][21195] Updated weights for policy 0, policy_version 44380 (0.0008) +[2023-10-08 17:30:51,880][21194] Updated weights for policy 1, policy_version 44040 (0.0008) +[2023-10-08 17:30:52,249][21194] Updated weights for policy 1, policy_version 44050 (0.0007) +[2023-10-08 17:30:52,609][21194] Updated weights for policy 1, policy_version 44060 (0.0007) +[2023-10-08 17:30:53,803][19739] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 90570752. Throughput: 0: 1707.6, 1: 1724.3. Samples: 22646146. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:30:53,803][19739] Avg episode reward: [(0, '748.620'), (1, '847.030')] +[2023-10-08 17:30:55,766][21195] Updated weights for policy 0, policy_version 44390 (0.0007) +[2023-10-08 17:30:56,141][21195] Updated weights for policy 0, policy_version 44400 (0.0008) +[2023-10-08 17:30:56,492][21194] Updated weights for policy 1, policy_version 44070 (0.0009) +[2023-10-08 17:30:56,518][21195] Updated weights for policy 0, policy_version 44410 (0.0008) +[2023-10-08 17:30:56,862][21194] Updated weights for policy 1, policy_version 44080 (0.0008) +[2023-10-08 17:30:57,222][21194] Updated weights for policy 1, policy_version 44090 (0.0007) +[2023-10-08 17:30:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 90636288. Throughput: 0: 1709.9, 1: 1708.8. Samples: 22666686. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:30:58,803][19739] Avg episode reward: [(0, '778.200'), (1, '847.030')] +[2023-10-08 17:31:00,436][21195] Updated weights for policy 0, policy_version 44420 (0.0010) +[2023-10-08 17:31:00,812][21195] Updated weights for policy 0, policy_version 44430 (0.0008) +[2023-10-08 17:31:01,182][21195] Updated weights for policy 0, policy_version 44440 (0.0007) +[2023-10-08 17:31:01,216][21194] Updated weights for policy 1, policy_version 44100 (0.0007) +[2023-10-08 17:31:01,578][21194] Updated weights for policy 1, policy_version 44110 (0.0007) +[2023-10-08 17:31:01,938][21194] Updated weights for policy 1, policy_version 44120 (0.0009) +[2023-10-08 17:31:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 90701824. Throughput: 0: 1742.4, 1: 1735.9. Samples: 22683460. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:31:03,803][19739] Avg episode reward: [(0, '778.200'), (1, '847.030')] +[2023-10-08 17:31:04,976][21195] Updated weights for policy 0, policy_version 44450 (0.0008) +[2023-10-08 17:31:05,342][21195] Updated weights for policy 0, policy_version 44460 (0.0009) +[2023-10-08 17:31:05,715][21195] Updated weights for policy 0, policy_version 44470 (0.0007) +[2023-10-08 17:31:05,971][21194] Updated weights for policy 1, policy_version 44130 (0.0008) +[2023-10-08 17:31:06,081][21195] Updated weights for policy 0, policy_version 44480 (0.0009) +[2023-10-08 17:31:06,342][21194] Updated weights for policy 1, policy_version 44140 (0.0009) +[2023-10-08 17:31:06,713][21194] Updated weights for policy 1, policy_version 44150 (0.0008) +[2023-10-08 17:31:07,086][21194] Updated weights for policy 1, policy_version 44160 (0.0007) +[2023-10-08 17:31:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 90767360. Throughput: 0: 1709.8, 1: 1708.4. Samples: 22697648. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:31:08,803][19739] Avg episode reward: [(0, '767.420'), (1, '847.030')] +[2023-10-08 17:31:09,941][21195] Updated weights for policy 0, policy_version 44490 (0.0008) +[2023-10-08 17:31:10,319][21195] Updated weights for policy 0, policy_version 44500 (0.0007) +[2023-10-08 17:31:10,694][21195] Updated weights for policy 0, policy_version 44510 (0.0009) +[2023-10-08 17:31:10,928][21194] Updated weights for policy 1, policy_version 44170 (0.0009) +[2023-10-08 17:31:11,294][21194] Updated weights for policy 1, policy_version 44180 (0.0009) +[2023-10-08 17:31:11,657][21194] Updated weights for policy 1, policy_version 44190 (0.0007) +[2023-10-08 17:31:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 90832896. Throughput: 0: 1744.1, 1: 1714.5. Samples: 22719378. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:31:13,803][19739] Avg episode reward: [(0, '767.420'), (1, '847.030')] +[2023-10-08 17:31:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000044192_45252608.pth... +[2023-10-08 17:31:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000044512_45580288.pth... +[2023-10-08 17:31:13,841][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000042592_43614208.pth +[2023-10-08 17:31:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000042912_43941888.pth +[2023-10-08 17:31:14,424][21195] Updated weights for policy 0, policy_version 44520 (0.0007) +[2023-10-08 17:31:14,789][21195] Updated weights for policy 0, policy_version 44530 (0.0009) +[2023-10-08 17:31:15,154][21195] Updated weights for policy 0, policy_version 44540 (0.0008) +[2023-10-08 17:31:15,640][21194] Updated weights for policy 1, policy_version 44200 (0.0008) +[2023-10-08 17:31:16,004][21194] Updated weights for policy 1, policy_version 44210 (0.0008) +[2023-10-08 17:31:16,368][21194] Updated weights for policy 1, policy_version 44220 (0.0007) +[2023-10-08 17:31:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 90898432. Throughput: 0: 1759.1, 1: 1724.8. Samples: 22735386. Policy #0 lag: (min: 31.0, avg: 31.0, max: 33.0) +[2023-10-08 17:31:18,803][19739] Avg episode reward: [(0, '767.420'), (1, '862.040')] +[2023-10-08 17:31:19,121][21195] Updated weights for policy 0, policy_version 44550 (0.0008) +[2023-10-08 17:31:19,496][21195] Updated weights for policy 0, policy_version 44560 (0.0009) +[2023-10-08 17:31:19,877][21195] Updated weights for policy 0, policy_version 44570 (0.0007) +[2023-10-08 17:31:20,291][21194] Updated weights for policy 1, policy_version 44230 (0.0009) +[2023-10-08 17:31:20,658][21194] Updated weights for policy 1, policy_version 44240 (0.0010) +[2023-10-08 17:31:21,024][21194] Updated weights for policy 1, policy_version 44250 (0.0008) +[2023-10-08 17:31:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 90963968. Throughput: 0: 1733.4, 1: 1710.0. Samples: 22750054. Policy #0 lag: (min: 16.0, avg: 42.0, max: 48.0) +[2023-10-08 17:31:23,803][19739] Avg episode reward: [(0, '767.420'), (1, '862.040')] +[2023-10-08 17:31:23,853][21195] Updated weights for policy 0, policy_version 44580 (0.0007) +[2023-10-08 17:31:24,211][21195] Updated weights for policy 0, policy_version 44590 (0.0008) +[2023-10-08 17:31:24,581][21195] Updated weights for policy 0, policy_version 44600 (0.0007) +[2023-10-08 17:31:24,910][21194] Updated weights for policy 1, policy_version 44260 (0.0009) +[2023-10-08 17:31:25,272][21194] Updated weights for policy 1, policy_version 44270 (0.0008) +[2023-10-08 17:31:25,641][21194] Updated weights for policy 1, policy_version 44280 (0.0010) +[2023-10-08 17:31:28,789][21195] Updated weights for policy 0, policy_version 44610 (0.0009) +[2023-10-08 17:31:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 91029504. Throughput: 0: 1757.7, 1: 1731.0. Samples: 22771662. Policy #0 lag: (min: 16.0, avg: 42.0, max: 48.0) +[2023-10-08 17:31:28,803][19739] Avg episode reward: [(0, '767.420'), (1, '862.040')] +[2023-10-08 17:31:29,167][21195] Updated weights for policy 0, policy_version 44620 (0.0011) +[2023-10-08 17:31:29,423][21194] Updated weights for policy 1, policy_version 44290 (0.0008) +[2023-10-08 17:31:29,524][21195] Updated weights for policy 0, policy_version 44630 (0.0009) +[2023-10-08 17:31:29,821][21194] Updated weights for policy 1, policy_version 44300 (0.0008) +[2023-10-08 17:31:29,893][21195] Updated weights for policy 0, policy_version 44640 (0.0008) +[2023-10-08 17:31:30,193][21194] Updated weights for policy 1, policy_version 44310 (0.0008) +[2023-10-08 17:31:30,560][21194] Updated weights for policy 1, policy_version 44320 (0.0009) +[2023-10-08 17:31:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 91095040. Throughput: 0: 1739.0, 1: 1711.0. Samples: 22786314. Policy #0 lag: (min: 16.0, avg: 42.0, max: 48.0) +[2023-10-08 17:31:33,804][19739] Avg episode reward: [(0, '767.490'), (1, '862.040')] +[2023-10-08 17:31:33,829][21195] Updated weights for policy 0, policy_version 44650 (0.0008) +[2023-10-08 17:31:34,196][21195] Updated weights for policy 0, policy_version 44660 (0.0008) +[2023-10-08 17:31:34,560][21195] Updated weights for policy 0, policy_version 44670 (0.0008) +[2023-10-08 17:31:34,597][21194] Updated weights for policy 1, policy_version 44330 (0.0009) +[2023-10-08 17:31:34,969][21194] Updated weights for policy 1, policy_version 44340 (0.0010) +[2023-10-08 17:31:35,328][21194] Updated weights for policy 1, policy_version 44350 (0.0010) +[2023-10-08 17:31:38,555][21195] Updated weights for policy 0, policy_version 44680 (0.0008) +[2023-10-08 17:31:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 91160576. Throughput: 0: 1744.9, 1: 1716.0. Samples: 22801884. Policy #0 lag: (min: 16.0, avg: 42.0, max: 48.0) +[2023-10-08 17:31:38,803][19739] Avg episode reward: [(0, '767.490'), (1, '877.200')] +[2023-10-08 17:31:38,935][21195] Updated weights for policy 0, policy_version 44690 (0.0007) +[2023-10-08 17:31:39,234][21194] Updated weights for policy 1, policy_version 44360 (0.0007) +[2023-10-08 17:31:39,309][21195] Updated weights for policy 0, policy_version 44700 (0.0008) +[2023-10-08 17:31:39,597][21194] Updated weights for policy 1, policy_version 44370 (0.0007) +[2023-10-08 17:31:39,963][21194] Updated weights for policy 1, policy_version 44380 (0.0007) +[2023-10-08 17:31:43,114][21195] Updated weights for policy 0, policy_version 44710 (0.0008) +[2023-10-08 17:31:43,485][21195] Updated weights for policy 0, policy_version 44720 (0.0007) +[2023-10-08 17:31:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 91226112. Throughput: 0: 1751.8, 1: 1730.3. Samples: 22823382. Policy #0 lag: (min: 16.0, avg: 42.0, max: 48.0) +[2023-10-08 17:31:43,803][19739] Avg episode reward: [(0, '744.420'), (1, '877.200')] +[2023-10-08 17:31:43,857][21195] Updated weights for policy 0, policy_version 44730 (0.0007) +[2023-10-08 17:31:43,919][21194] Updated weights for policy 1, policy_version 44390 (0.0008) +[2023-10-08 17:31:44,285][21194] Updated weights for policy 1, policy_version 44400 (0.0008) +[2023-10-08 17:31:44,651][21194] Updated weights for policy 1, policy_version 44410 (0.0007) +[2023-10-08 17:31:47,645][21195] Updated weights for policy 0, policy_version 44740 (0.0009) +[2023-10-08 17:31:48,007][21195] Updated weights for policy 0, policy_version 44750 (0.0008) +[2023-10-08 17:31:48,379][21195] Updated weights for policy 0, policy_version 44760 (0.0007) +[2023-10-08 17:31:48,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 91324416. Throughput: 0: 1720.1, 1: 1700.5. Samples: 22837388. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:31:48,804][19739] Avg episode reward: [(0, '748.620'), (1, '877.200')] +[2023-10-08 17:31:48,824][21194] Updated weights for policy 1, policy_version 44420 (0.0009) +[2023-10-08 17:31:49,196][21194] Updated weights for policy 1, policy_version 44430 (0.0008) +[2023-10-08 17:31:49,556][21194] Updated weights for policy 1, policy_version 44440 (0.0008) +[2023-10-08 17:31:52,311][21195] Updated weights for policy 0, policy_version 44770 (0.0007) +[2023-10-08 17:31:52,684][21195] Updated weights for policy 0, policy_version 44780 (0.0007) +[2023-10-08 17:31:53,049][21195] Updated weights for policy 0, policy_version 44790 (0.0007) +[2023-10-08 17:31:53,416][21195] Updated weights for policy 0, policy_version 44800 (0.0007) +[2023-10-08 17:31:53,647][21194] Updated weights for policy 1, policy_version 44450 (0.0010) +[2023-10-08 17:31:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 91389952. Throughput: 0: 1748.3, 1: 1722.7. Samples: 22853842. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:31:53,803][19739] Avg episode reward: [(0, '748.980'), (1, '863.890')] +[2023-10-08 17:31:54,005][21194] Updated weights for policy 1, policy_version 44460 (0.0009) +[2023-10-08 17:31:54,365][21194] Updated weights for policy 1, policy_version 44470 (0.0007) +[2023-10-08 17:31:54,740][21194] Updated weights for policy 1, policy_version 44480 (0.0007) +[2023-10-08 17:31:57,302][21195] Updated weights for policy 0, policy_version 44810 (0.0009) +[2023-10-08 17:31:57,669][21195] Updated weights for policy 0, policy_version 44820 (0.0008) +[2023-10-08 17:31:58,046][21195] Updated weights for policy 0, policy_version 44830 (0.0009) +[2023-10-08 17:31:58,795][21194] Updated weights for policy 1, policy_version 44490 (0.0010) +[2023-10-08 17:31:58,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 91455488. Throughput: 0: 1718.6, 1: 1719.8. Samples: 22874106. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:31:58,803][19739] Avg episode reward: [(0, '748.980'), (1, '863.890')] +[2023-10-08 17:31:59,151][21194] Updated weights for policy 1, policy_version 44500 (0.0009) +[2023-10-08 17:31:59,524][21194] Updated weights for policy 1, policy_version 44510 (0.0008) +[2023-10-08 17:32:01,961][21195] Updated weights for policy 0, policy_version 44840 (0.0008) +[2023-10-08 17:32:02,323][21195] Updated weights for policy 0, policy_version 44850 (0.0010) +[2023-10-08 17:32:02,693][21195] Updated weights for policy 0, policy_version 44860 (0.0010) +[2023-10-08 17:32:03,587][21194] Updated weights for policy 1, policy_version 44520 (0.0009) +[2023-10-08 17:32:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 91521024. Throughput: 0: 1703.8, 1: 1702.9. Samples: 22888688. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:32:03,803][19739] Avg episode reward: [(0, '748.980'), (1, '872.840')] +[2023-10-08 17:32:03,953][21194] Updated weights for policy 1, policy_version 44530 (0.0009) +[2023-10-08 17:32:04,312][21194] Updated weights for policy 1, policy_version 44540 (0.0010) +[2023-10-08 17:32:06,697][21195] Updated weights for policy 0, policy_version 44870 (0.0010) +[2023-10-08 17:32:07,062][21195] Updated weights for policy 0, policy_version 44880 (0.0010) +[2023-10-08 17:32:07,432][21195] Updated weights for policy 0, policy_version 44890 (0.0008) +[2023-10-08 17:32:08,205][21194] Updated weights for policy 1, policy_version 44550 (0.0009) +[2023-10-08 17:32:08,569][21194] Updated weights for policy 1, policy_version 44560 (0.0008) +[2023-10-08 17:32:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 91586560. Throughput: 0: 1726.6, 1: 1716.3. Samples: 22904984. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:32:08,804][19739] Avg episode reward: [(0, '748.980'), (1, '872.840')] +[2023-10-08 17:32:08,940][21194] Updated weights for policy 1, policy_version 44570 (0.0008) +[2023-10-08 17:32:11,363][21195] Updated weights for policy 0, policy_version 44900 (0.0009) +[2023-10-08 17:32:11,720][21195] Updated weights for policy 0, policy_version 44910 (0.0009) +[2023-10-08 17:32:12,095][21195] Updated weights for policy 0, policy_version 44920 (0.0008) +[2023-10-08 17:32:12,939][21194] Updated weights for policy 1, policy_version 44580 (0.0009) +[2023-10-08 17:32:13,297][21194] Updated weights for policy 1, policy_version 44590 (0.0010) +[2023-10-08 17:32:13,659][21194] Updated weights for policy 1, policy_version 44600 (0.0010) +[2023-10-08 17:32:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 91652096. Throughput: 0: 1711.5, 1: 1708.0. Samples: 22925536. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:32:13,803][19739] Avg episode reward: [(0, '745.050'), (1, '881.040')] +[2023-10-08 17:32:15,797][21195] Updated weights for policy 0, policy_version 44930 (0.0008) +[2023-10-08 17:32:16,172][21195] Updated weights for policy 0, policy_version 44940 (0.0008) +[2023-10-08 17:32:16,543][21195] Updated weights for policy 0, policy_version 44950 (0.0007) +[2023-10-08 17:32:16,908][21195] Updated weights for policy 0, policy_version 44960 (0.0007) +[2023-10-08 17:32:17,782][21194] Updated weights for policy 1, policy_version 44610 (0.0009) +[2023-10-08 17:32:18,191][21194] Updated weights for policy 1, policy_version 44620 (0.0009) +[2023-10-08 17:32:18,568][21194] Updated weights for policy 1, policy_version 44630 (0.0009) +[2023-10-08 17:32:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 91717632. Throughput: 0: 1731.4, 1: 1713.3. Samples: 22941328. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 17:32:18,803][19739] Avg episode reward: [(0, '730.590'), (1, '896.120')] +[2023-10-08 17:32:18,928][21194] Updated weights for policy 1, policy_version 44640 (0.0009) +[2023-10-08 17:32:20,620][21195] Updated weights for policy 0, policy_version 44970 (0.0009) +[2023-10-08 17:32:20,988][21195] Updated weights for policy 0, policy_version 44980 (0.0008) +[2023-10-08 17:32:21,356][21195] Updated weights for policy 0, policy_version 44990 (0.0008) +[2023-10-08 17:32:22,938][21194] Updated weights for policy 1, policy_version 44650 (0.0007) +[2023-10-08 17:32:23,303][21194] Updated weights for policy 1, policy_version 44660 (0.0008) +[2023-10-08 17:32:23,673][21194] Updated weights for policy 1, policy_version 44670 (0.0007) +[2023-10-08 17:32:23,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 91815936. Throughput: 0: 1724.9, 1: 1710.4. Samples: 22956476. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:23,803][19739] Avg episode reward: [(0, '745.480'), (1, '881.320')] +[2023-10-08 17:32:25,434][21195] Updated weights for policy 0, policy_version 45000 (0.0009) +[2023-10-08 17:32:25,798][21195] Updated weights for policy 0, policy_version 45010 (0.0008) +[2023-10-08 17:32:26,173][21195] Updated weights for policy 0, policy_version 45020 (0.0008) +[2023-10-08 17:32:27,410][21194] Updated weights for policy 1, policy_version 44680 (0.0008) +[2023-10-08 17:32:27,778][21194] Updated weights for policy 1, policy_version 44690 (0.0009) +[2023-10-08 17:32:28,146][21194] Updated weights for policy 1, policy_version 44700 (0.0011) +[2023-10-08 17:32:28,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 91881472. Throughput: 0: 1722.8, 1: 1691.6. Samples: 22977032. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:28,803][19739] Avg episode reward: [(0, '760.270'), (1, '881.320')] +[2023-10-08 17:32:30,264][21195] Updated weights for policy 0, policy_version 45030 (0.0008) +[2023-10-08 17:32:30,642][21195] Updated weights for policy 0, policy_version 45040 (0.0007) +[2023-10-08 17:32:31,006][21195] Updated weights for policy 0, policy_version 45050 (0.0009) +[2023-10-08 17:32:32,311][21194] Updated weights for policy 1, policy_version 44710 (0.0009) +[2023-10-08 17:32:32,685][21194] Updated weights for policy 1, policy_version 44720 (0.0009) +[2023-10-08 17:32:33,053][21194] Updated weights for policy 1, policy_version 44730 (0.0009) +[2023-10-08 17:32:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 91947008. Throughput: 0: 1757.1, 1: 1716.3. Samples: 22993690. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:33,804][19739] Avg episode reward: [(0, '766.370'), (1, '881.320')] +[2023-10-08 17:32:34,811][21195] Updated weights for policy 0, policy_version 45060 (0.0010) +[2023-10-08 17:32:35,186][21195] Updated weights for policy 0, policy_version 45070 (0.0009) +[2023-10-08 17:32:35,559][21195] Updated weights for policy 0, policy_version 45080 (0.0009) +[2023-10-08 17:32:37,009][21194] Updated weights for policy 1, policy_version 44740 (0.0008) +[2023-10-08 17:32:37,381][21194] Updated weights for policy 1, policy_version 44750 (0.0008) +[2023-10-08 17:32:37,746][21194] Updated weights for policy 1, policy_version 44760 (0.0007) +[2023-10-08 17:32:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 92012544. Throughput: 0: 1726.5, 1: 1718.3. Samples: 23008856. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:38,803][19739] Avg episode reward: [(0, '766.370'), (1, '890.510')] +[2023-10-08 17:32:39,432][21195] Updated weights for policy 0, policy_version 45090 (0.0008) +[2023-10-08 17:32:39,793][21195] Updated weights for policy 0, policy_version 45100 (0.0007) +[2023-10-08 17:32:40,166][21195] Updated weights for policy 0, policy_version 45110 (0.0009) +[2023-10-08 17:32:40,539][21195] Updated weights for policy 0, policy_version 45120 (0.0008) +[2023-10-08 17:32:41,721][21194] Updated weights for policy 1, policy_version 44770 (0.0008) +[2023-10-08 17:32:42,080][21194] Updated weights for policy 1, policy_version 44780 (0.0009) +[2023-10-08 17:32:42,442][21194] Updated weights for policy 1, policy_version 44790 (0.0009) +[2023-10-08 17:32:42,803][21194] Updated weights for policy 1, policy_version 44800 (0.0011) +[2023-10-08 17:32:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 92078080. Throughput: 0: 1746.9, 1: 1694.0. Samples: 23028948. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:43,803][19739] Avg episode reward: [(0, '767.190'), (1, '903.840')] +[2023-10-08 17:32:44,472][21195] Updated weights for policy 0, policy_version 45130 (0.0008) +[2023-10-08 17:32:44,832][21195] Updated weights for policy 0, policy_version 45140 (0.0007) +[2023-10-08 17:32:45,196][21195] Updated weights for policy 0, policy_version 45150 (0.0010) +[2023-10-08 17:32:46,803][21194] Updated weights for policy 1, policy_version 44810 (0.0007) +[2023-10-08 17:32:47,170][21194] Updated weights for policy 1, policy_version 44820 (0.0007) +[2023-10-08 17:32:47,537][21194] Updated weights for policy 1, policy_version 44830 (0.0008) +[2023-10-08 17:32:48,803][19739] Fps is (10 sec: 13106.2, 60 sec: 13653.2, 300 sec: 13773.6). Total num frames: 92143616. Throughput: 0: 1759.7, 1: 1728.4. Samples: 23045656. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:48,804][19739] Avg episode reward: [(0, '767.190'), (1, '894.740')] +[2023-10-08 17:32:49,088][21195] Updated weights for policy 0, policy_version 45160 (0.0009) +[2023-10-08 17:32:49,448][21195] Updated weights for policy 0, policy_version 45170 (0.0008) +[2023-10-08 17:32:49,822][21195] Updated weights for policy 0, policy_version 45180 (0.0009) +[2023-10-08 17:32:51,634][21194] Updated weights for policy 1, policy_version 44840 (0.0010) +[2023-10-08 17:32:51,992][21194] Updated weights for policy 1, policy_version 44850 (0.0008) +[2023-10-08 17:32:52,360][21194] Updated weights for policy 1, policy_version 44860 (0.0008) +[2023-10-08 17:32:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 92209152. Throughput: 0: 1738.5, 1: 1707.9. Samples: 23060072. Policy #0 lag: (min: 31.0, avg: 32.1, max: 54.0) +[2023-10-08 17:32:53,804][19739] Avg episode reward: [(0, '767.190'), (1, '894.740')] +[2023-10-08 17:32:53,828][21195] Updated weights for policy 0, policy_version 45190 (0.0008) +[2023-10-08 17:32:54,197][21195] Updated weights for policy 0, policy_version 45200 (0.0009) +[2023-10-08 17:32:54,562][21195] Updated weights for policy 0, policy_version 45210 (0.0007) +[2023-10-08 17:32:56,175][21194] Updated weights for policy 1, policy_version 44870 (0.0008) +[2023-10-08 17:32:56,547][21194] Updated weights for policy 1, policy_version 44880 (0.0010) +[2023-10-08 17:32:56,916][21194] Updated weights for policy 1, policy_version 44890 (0.0009) +[2023-10-08 17:32:58,507][21195] Updated weights for policy 0, policy_version 45220 (0.0009) +[2023-10-08 17:32:58,803][19739] Fps is (10 sec: 13108.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 92274688. Throughput: 0: 1752.2, 1: 1697.0. Samples: 23080752. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:32:58,803][19739] Avg episode reward: [(0, '767.190'), (1, '894.740')] +[2023-10-08 17:32:58,871][21195] Updated weights for policy 0, policy_version 45230 (0.0007) +[2023-10-08 17:32:59,236][21195] Updated weights for policy 0, policy_version 45240 (0.0008) +[2023-10-08 17:33:00,800][21194] Updated weights for policy 1, policy_version 44900 (0.0009) +[2023-10-08 17:33:01,158][21194] Updated weights for policy 1, policy_version 44910 (0.0009) +[2023-10-08 17:33:01,527][21194] Updated weights for policy 1, policy_version 44920 (0.0008) +[2023-10-08 17:33:03,179][21195] Updated weights for policy 0, policy_version 45250 (0.0008) +[2023-10-08 17:33:03,543][21195] Updated weights for policy 0, policy_version 45260 (0.0009) +[2023-10-08 17:33:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 92340224. Throughput: 0: 1728.8, 1: 1715.7. Samples: 23096328. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:33:03,803][19739] Avg episode reward: [(0, '767.190'), (1, '894.740')] +[2023-10-08 17:33:03,917][21195] Updated weights for policy 0, policy_version 45270 (0.0008) +[2023-10-08 17:33:04,287][21195] Updated weights for policy 0, policy_version 45280 (0.0008) +[2023-10-08 17:33:05,553][21194] Updated weights for policy 1, policy_version 44930 (0.0009) +[2023-10-08 17:33:05,945][21194] Updated weights for policy 1, policy_version 44940 (0.0010) +[2023-10-08 17:33:06,308][21194] Updated weights for policy 1, policy_version 44950 (0.0007) +[2023-10-08 17:33:06,668][21194] Updated weights for policy 1, policy_version 44960 (0.0009) +[2023-10-08 17:33:08,150][21195] Updated weights for policy 0, policy_version 45290 (0.0007) +[2023-10-08 17:33:08,526][21195] Updated weights for policy 0, policy_version 45300 (0.0009) +[2023-10-08 17:33:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 92405760. Throughput: 0: 1746.0, 1: 1700.4. Samples: 23111560. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:33:08,804][19739] Avg episode reward: [(0, '767.130'), (1, '909.600')] +[2023-10-08 17:33:08,905][21195] Updated weights for policy 0, policy_version 45310 (0.0008) +[2023-10-08 17:33:10,573][21194] Updated weights for policy 1, policy_version 44970 (0.0009) +[2023-10-08 17:33:10,947][21194] Updated weights for policy 1, policy_version 44980 (0.0010) +[2023-10-08 17:33:11,307][21194] Updated weights for policy 1, policy_version 44990 (0.0010) +[2023-10-08 17:33:12,707][21195] Updated weights for policy 0, policy_version 45320 (0.0011) +[2023-10-08 17:33:13,087][21195] Updated weights for policy 0, policy_version 45330 (0.0009) +[2023-10-08 17:33:13,455][21195] Updated weights for policy 0, policy_version 45340 (0.0010) +[2023-10-08 17:33:13,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 92504064. Throughput: 0: 1736.5, 1: 1717.8. Samples: 23132476. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:33:13,803][19739] Avg episode reward: [(0, '759.150'), (1, '909.600')] +[2023-10-08 17:33:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000045344_46432256.pth... +[2023-10-08 17:33:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000044992_46071808.pth... +[2023-10-08 17:33:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000043712_44761088.pth +[2023-10-08 17:33:13,857][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000043392_44433408.pth +[2023-10-08 17:33:15,220][21194] Updated weights for policy 1, policy_version 45000 (0.0009) +[2023-10-08 17:33:15,586][21194] Updated weights for policy 1, policy_version 45010 (0.0008) +[2023-10-08 17:33:15,961][21194] Updated weights for policy 1, policy_version 45020 (0.0007) +[2023-10-08 17:33:17,408][21195] Updated weights for policy 0, policy_version 45350 (0.0008) +[2023-10-08 17:33:17,770][21195] Updated weights for policy 0, policy_version 45360 (0.0008) +[2023-10-08 17:33:18,147][21195] Updated weights for policy 0, policy_version 45370 (0.0009) +[2023-10-08 17:33:18,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 92569600. Throughput: 0: 1711.6, 1: 1700.7. Samples: 23147244. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:33:18,803][19739] Avg episode reward: [(0, '745.760'), (1, '910.580')] +[2023-10-08 17:33:19,814][21194] Updated weights for policy 1, policy_version 45030 (0.0009) +[2023-10-08 17:33:20,179][21194] Updated weights for policy 1, policy_version 45040 (0.0009) +[2023-10-08 17:33:20,555][21194] Updated weights for policy 1, policy_version 45050 (0.0008) +[2023-10-08 17:33:21,857][21195] Updated weights for policy 0, policy_version 45380 (0.0010) +[2023-10-08 17:33:22,239][21195] Updated weights for policy 0, policy_version 45390 (0.0009) +[2023-10-08 17:33:22,606][21195] Updated weights for policy 0, policy_version 45400 (0.0007) +[2023-10-08 17:33:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 92635136. Throughput: 0: 1748.0, 1: 1700.0. Samples: 23164020. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:33:23,803][19739] Avg episode reward: [(0, '701.830'), (1, '910.580')] +[2023-10-08 17:33:24,663][21194] Updated weights for policy 1, policy_version 45060 (0.0009) +[2023-10-08 17:33:25,025][21194] Updated weights for policy 1, policy_version 45070 (0.0008) +[2023-10-08 17:33:25,396][21194] Updated weights for policy 1, policy_version 45080 (0.0007) +[2023-10-08 17:33:26,351][21195] Updated weights for policy 0, policy_version 45410 (0.0008) +[2023-10-08 17:33:26,725][21195] Updated weights for policy 0, policy_version 45420 (0.0008) +[2023-10-08 17:33:27,090][21195] Updated weights for policy 0, policy_version 45430 (0.0009) +[2023-10-08 17:33:27,456][21195] Updated weights for policy 0, policy_version 45440 (0.0007) +[2023-10-08 17:33:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 92700672. Throughput: 0: 1732.2, 1: 1726.1. Samples: 23184574. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:28,803][19739] Avg episode reward: [(0, '683.680'), (1, '900.380')] +[2023-10-08 17:33:29,345][21194] Updated weights for policy 1, policy_version 45090 (0.0010) +[2023-10-08 17:33:29,718][21194] Updated weights for policy 1, policy_version 45100 (0.0012) +[2023-10-08 17:33:30,076][21194] Updated weights for policy 1, policy_version 45110 (0.0009) +[2023-10-08 17:33:30,440][21194] Updated weights for policy 1, policy_version 45120 (0.0009) +[2023-10-08 17:33:31,438][21195] Updated weights for policy 0, policy_version 45450 (0.0009) +[2023-10-08 17:33:31,802][21195] Updated weights for policy 0, policy_version 45460 (0.0007) +[2023-10-08 17:33:32,179][21195] Updated weights for policy 0, policy_version 45470 (0.0009) +[2023-10-08 17:33:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 92766208. Throughput: 0: 1733.4, 1: 1691.5. Samples: 23199778. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:33,804][19739] Avg episode reward: [(0, '649.570'), (1, '900.380')] +[2023-10-08 17:33:34,373][21194] Updated weights for policy 1, policy_version 45130 (0.0009) +[2023-10-08 17:33:34,741][21194] Updated weights for policy 1, policy_version 45140 (0.0009) +[2023-10-08 17:33:35,100][21194] Updated weights for policy 1, policy_version 45150 (0.0008) +[2023-10-08 17:33:35,955][21195] Updated weights for policy 0, policy_version 45480 (0.0010) +[2023-10-08 17:33:36,327][21195] Updated weights for policy 0, policy_version 45490 (0.0009) +[2023-10-08 17:33:36,703][21195] Updated weights for policy 0, policy_version 45500 (0.0009) +[2023-10-08 17:33:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 92831744. Throughput: 0: 1739.3, 1: 1718.1. Samples: 23215650. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:38,803][19739] Avg episode reward: [(0, '649.570'), (1, '900.380')] +[2023-10-08 17:33:39,271][21194] Updated weights for policy 1, policy_version 45160 (0.0008) +[2023-10-08 17:33:39,637][21194] Updated weights for policy 1, policy_version 45170 (0.0008) +[2023-10-08 17:33:40,012][21194] Updated weights for policy 1, policy_version 45180 (0.0007) +[2023-10-08 17:33:40,472][21195] Updated weights for policy 0, policy_version 45510 (0.0009) +[2023-10-08 17:33:40,837][21195] Updated weights for policy 0, policy_version 45520 (0.0009) +[2023-10-08 17:33:41,207][21195] Updated weights for policy 0, policy_version 45530 (0.0010) +[2023-10-08 17:33:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 92897280. Throughput: 0: 1742.6, 1: 1733.7. Samples: 23237186. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:43,804][19739] Avg episode reward: [(0, '649.570'), (1, '900.380')] +[2023-10-08 17:33:43,924][21194] Updated weights for policy 1, policy_version 45190 (0.0007) +[2023-10-08 17:33:44,294][21194] Updated weights for policy 1, policy_version 45200 (0.0007) +[2023-10-08 17:33:44,672][21194] Updated weights for policy 1, policy_version 45210 (0.0007) +[2023-10-08 17:33:45,131][21195] Updated weights for policy 0, policy_version 45540 (0.0008) +[2023-10-08 17:33:45,502][21195] Updated weights for policy 0, policy_version 45550 (0.0007) +[2023-10-08 17:33:45,867][21195] Updated weights for policy 0, policy_version 45560 (0.0008) +[2023-10-08 17:33:48,514][21194] Updated weights for policy 1, policy_version 45220 (0.0010) +[2023-10-08 17:33:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.5, 300 sec: 13662.6). Total num frames: 92962816. Throughput: 0: 1754.4, 1: 1709.5. Samples: 23252202. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:48,803][19739] Avg episode reward: [(0, '649.570'), (1, '862.020')] +[2023-10-08 17:33:48,882][21194] Updated weights for policy 1, policy_version 45230 (0.0011) +[2023-10-08 17:33:49,234][21194] Updated weights for policy 1, policy_version 45240 (0.0008) +[2023-10-08 17:33:49,844][21195] Updated weights for policy 0, policy_version 45570 (0.0007) +[2023-10-08 17:33:50,207][21195] Updated weights for policy 0, policy_version 45580 (0.0009) +[2023-10-08 17:33:50,580][21195] Updated weights for policy 0, policy_version 45590 (0.0008) +[2023-10-08 17:33:50,949][21195] Updated weights for policy 0, policy_version 45600 (0.0007) +[2023-10-08 17:33:53,312][21194] Updated weights for policy 1, policy_version 45250 (0.0010) +[2023-10-08 17:33:53,733][21194] Updated weights for policy 1, policy_version 45260 (0.0010) +[2023-10-08 17:33:53,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 93028352. Throughput: 0: 1740.1, 1: 1729.7. Samples: 23267702. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:53,803][19739] Avg episode reward: [(0, '649.570'), (1, '862.020')] +[2023-10-08 17:33:54,098][21194] Updated weights for policy 1, policy_version 45270 (0.0011) +[2023-10-08 17:33:54,462][21194] Updated weights for policy 1, policy_version 45280 (0.0010) +[2023-10-08 17:33:54,858][21195] Updated weights for policy 0, policy_version 45610 (0.0009) +[2023-10-08 17:33:55,219][21195] Updated weights for policy 0, policy_version 45620 (0.0008) +[2023-10-08 17:33:55,593][21195] Updated weights for policy 0, policy_version 45630 (0.0008) +[2023-10-08 17:33:58,192][21194] Updated weights for policy 1, policy_version 45290 (0.0009) +[2023-10-08 17:33:58,574][21194] Updated weights for policy 1, policy_version 45300 (0.0008) +[2023-10-08 17:33:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 93093888. Throughput: 0: 1750.3, 1: 1728.0. Samples: 23289000. Policy #0 lag: (min: 9.0, avg: 18.8, max: 41.0) +[2023-10-08 17:33:58,803][19739] Avg episode reward: [(0, '649.570'), (1, '862.020')] +[2023-10-08 17:33:58,933][21194] Updated weights for policy 1, policy_version 45310 (0.0010) +[2023-10-08 17:33:59,341][21195] Updated weights for policy 0, policy_version 45640 (0.0008) +[2023-10-08 17:33:59,706][21195] Updated weights for policy 0, policy_version 45650 (0.0009) +[2023-10-08 17:34:00,072][21195] Updated weights for policy 0, policy_version 45660 (0.0008) +[2023-10-08 17:34:02,845][21194] Updated weights for policy 1, policy_version 45320 (0.0007) +[2023-10-08 17:34:03,221][21194] Updated weights for policy 1, policy_version 45330 (0.0007) +[2023-10-08 17:34:03,590][21194] Updated weights for policy 1, policy_version 45340 (0.0008) +[2023-10-08 17:34:03,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 93192192. Throughput: 0: 1770.9, 1: 1727.3. Samples: 23304666. Policy #0 lag: (min: 23.0, avg: 30.9, max: 55.0) +[2023-10-08 17:34:03,804][19739] Avg episode reward: [(0, '649.570'), (1, '876.710')] +[2023-10-08 17:34:04,079][21195] Updated weights for policy 0, policy_version 45670 (0.0008) +[2023-10-08 17:34:04,450][21195] Updated weights for policy 0, policy_version 45680 (0.0007) +[2023-10-08 17:34:04,823][21195] Updated weights for policy 0, policy_version 45690 (0.0008) +[2023-10-08 17:34:07,468][21194] Updated weights for policy 1, policy_version 45350 (0.0009) +[2023-10-08 17:34:07,828][21194] Updated weights for policy 1, policy_version 45360 (0.0009) +[2023-10-08 17:34:08,196][21194] Updated weights for policy 1, policy_version 45370 (0.0008) +[2023-10-08 17:34:08,559][21195] Updated weights for policy 0, policy_version 45700 (0.0010) +[2023-10-08 17:34:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 93257728. Throughput: 0: 1736.0, 1: 1733.2. Samples: 23320136. Policy #0 lag: (min: 23.0, avg: 30.9, max: 55.0) +[2023-10-08 17:34:08,803][19739] Avg episode reward: [(0, '649.570'), (1, '875.800')] +[2023-10-08 17:34:08,923][21195] Updated weights for policy 0, policy_version 45710 (0.0011) +[2023-10-08 17:34:09,297][21195] Updated weights for policy 0, policy_version 45720 (0.0010) +[2023-10-08 17:34:12,425][21194] Updated weights for policy 1, policy_version 45380 (0.0008) +[2023-10-08 17:34:12,798][21194] Updated weights for policy 1, policy_version 45390 (0.0008) +[2023-10-08 17:34:13,159][21194] Updated weights for policy 1, policy_version 45400 (0.0010) +[2023-10-08 17:34:13,332][21195] Updated weights for policy 0, policy_version 45730 (0.0007) +[2023-10-08 17:34:13,704][21195] Updated weights for policy 0, policy_version 45740 (0.0008) +[2023-10-08 17:34:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 93323264. Throughput: 0: 1757.5, 1: 1712.9. Samples: 23340740. Policy #0 lag: (min: 23.0, avg: 30.9, max: 55.0) +[2023-10-08 17:34:13,804][19739] Avg episode reward: [(0, '649.570'), (1, '851.740')] +[2023-10-08 17:34:14,073][21195] Updated weights for policy 0, policy_version 45750 (0.0007) +[2023-10-08 17:34:14,451][21195] Updated weights for policy 0, policy_version 45760 (0.0007) +[2023-10-08 17:34:17,019][21194] Updated weights for policy 1, policy_version 45410 (0.0008) +[2023-10-08 17:34:17,393][21194] Updated weights for policy 1, policy_version 45420 (0.0009) +[2023-10-08 17:34:17,768][21194] Updated weights for policy 1, policy_version 45430 (0.0009) +[2023-10-08 17:34:18,132][21194] Updated weights for policy 1, policy_version 45440 (0.0010) +[2023-10-08 17:34:18,408][21195] Updated weights for policy 0, policy_version 45770 (0.0008) +[2023-10-08 17:34:18,780][21195] Updated weights for policy 0, policy_version 45780 (0.0010) +[2023-10-08 17:34:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 93388800. Throughput: 0: 1737.3, 1: 1736.0. Samples: 23356076. Policy #0 lag: (min: 23.0, avg: 30.9, max: 55.0) +[2023-10-08 17:34:18,803][19739] Avg episode reward: [(0, '649.570'), (1, '834.520')] +[2023-10-08 17:34:19,163][21195] Updated weights for policy 0, policy_version 45790 (0.0007) +[2023-10-08 17:34:22,195][21194] Updated weights for policy 1, policy_version 45450 (0.0010) +[2023-10-08 17:34:22,556][21194] Updated weights for policy 1, policy_version 45460 (0.0007) +[2023-10-08 17:34:22,922][21194] Updated weights for policy 1, policy_version 45470 (0.0007) +[2023-10-08 17:34:22,985][21195] Updated weights for policy 0, policy_version 45800 (0.0007) +[2023-10-08 17:34:23,344][21195] Updated weights for policy 0, policy_version 45810 (0.0011) +[2023-10-08 17:34:23,711][21195] Updated weights for policy 0, policy_version 45820 (0.0010) +[2023-10-08 17:34:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 93454336. Throughput: 0: 1749.4, 1: 1722.7. Samples: 23371894. Policy #0 lag: (min: 23.0, avg: 30.9, max: 55.0) +[2023-10-08 17:34:23,804][19739] Avg episode reward: [(0, '649.570'), (1, '820.110')] +[2023-10-08 17:34:27,038][21194] Updated weights for policy 1, policy_version 45480 (0.0007) +[2023-10-08 17:34:27,411][21194] Updated weights for policy 1, policy_version 45490 (0.0009) +[2023-10-08 17:34:27,741][21195] Updated weights for policy 0, policy_version 45830 (0.0009) +[2023-10-08 17:34:27,780][21194] Updated weights for policy 1, policy_version 45500 (0.0010) +[2023-10-08 17:34:28,112][21195] Updated weights for policy 0, policy_version 45840 (0.0007) +[2023-10-08 17:34:28,489][21195] Updated weights for policy 0, policy_version 45850 (0.0010) +[2023-10-08 17:34:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 93552640. Throughput: 0: 1739.4, 1: 1689.5. Samples: 23391484. Policy #0 lag: (min: 23.0, avg: 30.9, max: 55.0) +[2023-10-08 17:34:28,803][19739] Avg episode reward: [(0, '649.570'), (1, '805.580')] +[2023-10-08 17:34:31,616][21194] Updated weights for policy 1, policy_version 45510 (0.0007) +[2023-10-08 17:34:31,984][21194] Updated weights for policy 1, policy_version 45520 (0.0010) +[2023-10-08 17:34:32,348][21194] Updated weights for policy 1, policy_version 45530 (0.0007) +[2023-10-08 17:34:32,523][21195] Updated weights for policy 0, policy_version 45860 (0.0009) +[2023-10-08 17:34:32,883][21195] Updated weights for policy 0, policy_version 45870 (0.0007) +[2023-10-08 17:34:33,251][21195] Updated weights for policy 0, policy_version 45880 (0.0007) +[2023-10-08 17:34:33,802][19739] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 93618176. Throughput: 0: 1717.8, 1: 1725.3. Samples: 23407144. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:34:33,803][19739] Avg episode reward: [(0, '649.570'), (1, '805.580')] +[2023-10-08 17:34:36,159][21194] Updated weights for policy 1, policy_version 45540 (0.0007) +[2023-10-08 17:34:36,530][21194] Updated weights for policy 1, policy_version 45550 (0.0007) +[2023-10-08 17:34:36,896][21194] Updated weights for policy 1, policy_version 45560 (0.0008) +[2023-10-08 17:34:37,274][21195] Updated weights for policy 0, policy_version 45890 (0.0007) +[2023-10-08 17:34:37,648][21195] Updated weights for policy 0, policy_version 45900 (0.0010) +[2023-10-08 17:34:38,013][21195] Updated weights for policy 0, policy_version 45910 (0.0007) +[2023-10-08 17:34:38,373][21195] Updated weights for policy 0, policy_version 45920 (0.0010) +[2023-10-08 17:34:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 93683712. Throughput: 0: 1741.8, 1: 1706.4. Samples: 23422874. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:34:38,803][19739] Avg episode reward: [(0, '659.060'), (1, '805.420')] +[2023-10-08 17:34:40,864][21194] Updated weights for policy 1, policy_version 45570 (0.0009) +[2023-10-08 17:34:41,285][21194] Updated weights for policy 1, policy_version 45580 (0.0008) +[2023-10-08 17:34:41,643][21194] Updated weights for policy 1, policy_version 45590 (0.0008) +[2023-10-08 17:34:42,009][21194] Updated weights for policy 1, policy_version 45600 (0.0009) +[2023-10-08 17:34:42,214][21195] Updated weights for policy 0, policy_version 45930 (0.0009) +[2023-10-08 17:34:42,593][21195] Updated weights for policy 0, policy_version 45940 (0.0008) +[2023-10-08 17:34:42,972][21195] Updated weights for policy 0, policy_version 45950 (0.0009) +[2023-10-08 17:34:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 93749248. Throughput: 0: 1725.3, 1: 1700.7. Samples: 23443170. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:34:43,803][19739] Avg episode reward: [(0, '688.960'), (1, '805.420')] +[2023-10-08 17:34:45,941][21194] Updated weights for policy 1, policy_version 45610 (0.0009) +[2023-10-08 17:34:46,309][21194] Updated weights for policy 1, policy_version 45620 (0.0009) +[2023-10-08 17:34:46,681][21194] Updated weights for policy 1, policy_version 45630 (0.0007) +[2023-10-08 17:34:46,909][21195] Updated weights for policy 0, policy_version 45960 (0.0009) +[2023-10-08 17:34:47,274][21195] Updated weights for policy 0, policy_version 45970 (0.0008) +[2023-10-08 17:34:47,633][21195] Updated weights for policy 0, policy_version 45980 (0.0008) +[2023-10-08 17:34:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 93814784. Throughput: 0: 1713.9, 1: 1717.1. Samples: 23459060. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:34:48,803][19739] Avg episode reward: [(0, '688.960'), (1, '805.420')] +[2023-10-08 17:34:50,501][21194] Updated weights for policy 1, policy_version 45640 (0.0008) +[2023-10-08 17:34:50,859][21194] Updated weights for policy 1, policy_version 45650 (0.0008) +[2023-10-08 17:34:51,222][21194] Updated weights for policy 1, policy_version 45660 (0.0008) +[2023-10-08 17:34:51,617][21195] Updated weights for policy 0, policy_version 45990 (0.0009) +[2023-10-08 17:34:51,984][21195] Updated weights for policy 0, policy_version 46000 (0.0009) +[2023-10-08 17:34:52,366][21195] Updated weights for policy 0, policy_version 46010 (0.0007) +[2023-10-08 17:34:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 93880320. Throughput: 0: 1735.6, 1: 1696.4. Samples: 23474578. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:34:53,803][19739] Avg episode reward: [(0, '688.960'), (1, '805.420')] +[2023-10-08 17:34:55,251][21194] Updated weights for policy 1, policy_version 45670 (0.0008) +[2023-10-08 17:34:55,627][21194] Updated weights for policy 1, policy_version 45680 (0.0010) +[2023-10-08 17:34:55,978][21194] Updated weights for policy 1, policy_version 45690 (0.0010) +[2023-10-08 17:34:56,136][21195] Updated weights for policy 0, policy_version 46020 (0.0008) +[2023-10-08 17:34:56,500][21195] Updated weights for policy 0, policy_version 46030 (0.0011) +[2023-10-08 17:34:56,870][21195] Updated weights for policy 0, policy_version 46040 (0.0010) +[2023-10-08 17:34:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 93945856. Throughput: 0: 1716.1, 1: 1720.1. Samples: 23495368. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:34:58,803][19739] Avg episode reward: [(0, '684.880'), (1, '820.620')] +[2023-10-08 17:35:00,156][21194] Updated weights for policy 1, policy_version 45700 (0.0008) +[2023-10-08 17:35:00,523][21194] Updated weights for policy 1, policy_version 45710 (0.0011) +[2023-10-08 17:35:00,715][21195] Updated weights for policy 0, policy_version 46050 (0.0010) +[2023-10-08 17:35:00,882][21194] Updated weights for policy 1, policy_version 45720 (0.0008) +[2023-10-08 17:35:01,078][21195] Updated weights for policy 0, policy_version 46060 (0.0008) +[2023-10-08 17:35:01,443][21195] Updated weights for policy 0, policy_version 46070 (0.0009) +[2023-10-08 17:35:01,810][21195] Updated weights for policy 0, policy_version 46080 (0.0011) +[2023-10-08 17:35:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 94011392. Throughput: 0: 1737.1, 1: 1703.6. Samples: 23510908. Policy #0 lag: (min: 2.0, avg: 8.3, max: 34.0) +[2023-10-08 17:35:03,803][19739] Avg episode reward: [(0, '685.450'), (1, '820.620')] +[2023-10-08 17:35:04,792][21194] Updated weights for policy 1, policy_version 45730 (0.0008) +[2023-10-08 17:35:05,155][21194] Updated weights for policy 1, policy_version 45740 (0.0008) +[2023-10-08 17:35:05,517][21194] Updated weights for policy 1, policy_version 45750 (0.0009) +[2023-10-08 17:35:05,875][21195] Updated weights for policy 0, policy_version 46090 (0.0008) +[2023-10-08 17:35:05,890][21194] Updated weights for policy 1, policy_version 45760 (0.0009) +[2023-10-08 17:35:06,247][21195] Updated weights for policy 0, policy_version 46100 (0.0008) +[2023-10-08 17:35:06,612][21195] Updated weights for policy 0, policy_version 46110 (0.0008) +[2023-10-08 17:35:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 94076928. Throughput: 0: 1718.8, 1: 1710.8. Samples: 23526224. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:08,803][19739] Avg episode reward: [(0, '702.300'), (1, '820.620')] +[2023-10-08 17:35:09,797][21194] Updated weights for policy 1, policy_version 45770 (0.0010) +[2023-10-08 17:35:10,172][21194] Updated weights for policy 1, policy_version 45780 (0.0009) +[2023-10-08 17:35:10,492][21195] Updated weights for policy 0, policy_version 46120 (0.0009) +[2023-10-08 17:35:10,529][21194] Updated weights for policy 1, policy_version 45790 (0.0008) +[2023-10-08 17:35:10,860][21195] Updated weights for policy 0, policy_version 46130 (0.0007) +[2023-10-08 17:35:11,236][21195] Updated weights for policy 0, policy_version 46140 (0.0007) +[2023-10-08 17:35:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 94142464. Throughput: 0: 1725.4, 1: 1740.0. Samples: 23547428. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:13,803][19739] Avg episode reward: [(0, '687.650'), (1, '820.620')] +[2023-10-08 17:35:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000046144_47251456.pth... +[2023-10-08 17:35:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000045792_46891008.pth... +[2023-10-08 17:35:13,846][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000044192_45252608.pth +[2023-10-08 17:35:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000044512_45580288.pth +[2023-10-08 17:35:14,441][21194] Updated weights for policy 1, policy_version 45800 (0.0008) +[2023-10-08 17:35:14,805][21194] Updated weights for policy 1, policy_version 45810 (0.0009) +[2023-10-08 17:35:15,161][21194] Updated weights for policy 1, policy_version 45820 (0.0009) +[2023-10-08 17:35:15,162][21195] Updated weights for policy 0, policy_version 46150 (0.0007) +[2023-10-08 17:35:15,523][21195] Updated weights for policy 0, policy_version 46160 (0.0009) +[2023-10-08 17:35:15,897][21195] Updated weights for policy 0, policy_version 46170 (0.0010) +[2023-10-08 17:35:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 94208000. Throughput: 0: 1750.8, 1: 1707.9. Samples: 23562784. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:18,803][19739] Avg episode reward: [(0, '656.380'), (1, '820.620')] +[2023-10-08 17:35:19,191][21194] Updated weights for policy 1, policy_version 45830 (0.0010) +[2023-10-08 17:35:19,561][21194] Updated weights for policy 1, policy_version 45840 (0.0008) +[2023-10-08 17:35:19,858][21195] Updated weights for policy 0, policy_version 46180 (0.0009) +[2023-10-08 17:35:19,923][21194] Updated weights for policy 1, policy_version 45850 (0.0007) +[2023-10-08 17:35:20,231][21195] Updated weights for policy 0, policy_version 46190 (0.0008) +[2023-10-08 17:35:20,595][21195] Updated weights for policy 0, policy_version 46200 (0.0008) +[2023-10-08 17:35:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 94273536. Throughput: 0: 1720.5, 1: 1725.5. Samples: 23577942. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:23,803][19739] Avg episode reward: [(0, '656.380'), (1, '823.730')] +[2023-10-08 17:35:23,807][21194] Updated weights for policy 1, policy_version 45860 (0.0007) +[2023-10-08 17:35:24,180][21194] Updated weights for policy 1, policy_version 45870 (0.0008) +[2023-10-08 17:35:24,538][21195] Updated weights for policy 0, policy_version 46210 (0.0007) +[2023-10-08 17:35:24,543][21194] Updated weights for policy 1, policy_version 45880 (0.0008) +[2023-10-08 17:35:24,896][21195] Updated weights for policy 0, policy_version 46220 (0.0008) +[2023-10-08 17:35:25,268][21195] Updated weights for policy 0, policy_version 46230 (0.0010) +[2023-10-08 17:35:25,637][21195] Updated weights for policy 0, policy_version 46240 (0.0011) +[2023-10-08 17:35:28,457][21194] Updated weights for policy 1, policy_version 45890 (0.0010) +[2023-10-08 17:35:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 94339072. Throughput: 0: 1739.5, 1: 1736.9. Samples: 23599610. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:28,803][19739] Avg episode reward: [(0, '632.860'), (1, '823.730')] +[2023-10-08 17:35:28,857][21194] Updated weights for policy 1, policy_version 45900 (0.0009) +[2023-10-08 17:35:29,222][21194] Updated weights for policy 1, policy_version 45910 (0.0007) +[2023-10-08 17:35:29,584][21194] Updated weights for policy 1, policy_version 45920 (0.0007) +[2023-10-08 17:35:29,629][21195] Updated weights for policy 0, policy_version 46250 (0.0008) +[2023-10-08 17:35:30,001][21195] Updated weights for policy 0, policy_version 46260 (0.0010) +[2023-10-08 17:35:30,372][21195] Updated weights for policy 0, policy_version 46270 (0.0010) +[2023-10-08 17:35:33,544][21194] Updated weights for policy 1, policy_version 45930 (0.0012) +[2023-10-08 17:35:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 94404608. Throughput: 0: 1744.3, 1: 1714.1. Samples: 23614688. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:33,804][19739] Avg episode reward: [(0, '632.860'), (1, '838.710')] +[2023-10-08 17:35:33,899][21194] Updated weights for policy 1, policy_version 45940 (0.0009) +[2023-10-08 17:35:34,260][21194] Updated weights for policy 1, policy_version 45950 (0.0007) +[2023-10-08 17:35:34,404][21195] Updated weights for policy 0, policy_version 46280 (0.0008) +[2023-10-08 17:35:34,782][21195] Updated weights for policy 0, policy_version 46290 (0.0007) +[2023-10-08 17:35:35,149][21195] Updated weights for policy 0, policy_version 46300 (0.0009) +[2023-10-08 17:35:38,321][21194] Updated weights for policy 1, policy_version 45960 (0.0010) +[2023-10-08 17:35:38,682][21194] Updated weights for policy 1, policy_version 45970 (0.0007) +[2023-10-08 17:35:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 94470144. Throughput: 0: 1722.2, 1: 1729.3. Samples: 23629894. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:35:38,803][19739] Avg episode reward: [(0, '632.860'), (1, '838.710')] +[2023-10-08 17:35:39,049][21194] Updated weights for policy 1, policy_version 45980 (0.0008) +[2023-10-08 17:35:39,069][21195] Updated weights for policy 0, policy_version 46310 (0.0009) +[2023-10-08 17:35:39,449][21195] Updated weights for policy 0, policy_version 46320 (0.0009) +[2023-10-08 17:35:39,820][21195] Updated weights for policy 0, policy_version 46330 (0.0009) +[2023-10-08 17:35:43,062][21194] Updated weights for policy 1, policy_version 45990 (0.0007) +[2023-10-08 17:35:43,432][21194] Updated weights for policy 1, policy_version 46000 (0.0008) +[2023-10-08 17:35:43,719][21195] Updated weights for policy 0, policy_version 46340 (0.0008) +[2023-10-08 17:35:43,791][21194] Updated weights for policy 1, policy_version 46010 (0.0009) +[2023-10-08 17:35:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 94535680. Throughput: 0: 1742.2, 1: 1723.5. Samples: 23651322. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:35:43,804][19739] Avg episode reward: [(0, '633.090'), (1, '838.710')] +[2023-10-08 17:35:44,086][21195] Updated weights for policy 0, policy_version 46350 (0.0009) +[2023-10-08 17:35:44,453][21195] Updated weights for policy 0, policy_version 46360 (0.0008) +[2023-10-08 17:35:47,717][21194] Updated weights for policy 1, policy_version 46020 (0.0009) +[2023-10-08 17:35:48,082][21194] Updated weights for policy 1, policy_version 46030 (0.0008) +[2023-10-08 17:35:48,151][21195] Updated weights for policy 0, policy_version 46370 (0.0010) +[2023-10-08 17:35:48,446][21194] Updated weights for policy 1, policy_version 46040 (0.0007) +[2023-10-08 17:35:48,519][21195] Updated weights for policy 0, policy_version 46380 (0.0007) +[2023-10-08 17:35:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 94633984. Throughput: 0: 1725.5, 1: 1724.5. Samples: 23666156. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:35:48,803][19739] Avg episode reward: [(0, '648.160'), (1, '836.020')] +[2023-10-08 17:35:48,898][21195] Updated weights for policy 0, policy_version 46390 (0.0008) +[2023-10-08 17:35:49,263][21195] Updated weights for policy 0, policy_version 46400 (0.0010) +[2023-10-08 17:35:52,475][21194] Updated weights for policy 1, policy_version 46050 (0.0007) +[2023-10-08 17:35:52,844][21194] Updated weights for policy 1, policy_version 46060 (0.0009) +[2023-10-08 17:35:53,210][21194] Updated weights for policy 1, policy_version 46070 (0.0009) +[2023-10-08 17:35:53,319][21195] Updated weights for policy 0, policy_version 46410 (0.0007) +[2023-10-08 17:35:53,575][21194] Updated weights for policy 1, policy_version 46080 (0.0008) +[2023-10-08 17:35:53,687][21195] Updated weights for policy 0, policy_version 46420 (0.0007) +[2023-10-08 17:35:53,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 94699520. Throughput: 0: 1742.0, 1: 1722.9. Samples: 23682144. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:35:53,803][19739] Avg episode reward: [(0, '648.160'), (1, '835.550')] +[2023-10-08 17:35:54,055][21195] Updated weights for policy 0, policy_version 46430 (0.0007) +[2023-10-08 17:35:57,589][21194] Updated weights for policy 1, policy_version 46090 (0.0010) +[2023-10-08 17:35:57,812][21195] Updated weights for policy 0, policy_version 46440 (0.0007) +[2023-10-08 17:35:57,962][21194] Updated weights for policy 1, policy_version 46100 (0.0008) +[2023-10-08 17:35:58,178][21195] Updated weights for policy 0, policy_version 46450 (0.0010) +[2023-10-08 17:35:58,327][21194] Updated weights for policy 1, policy_version 46110 (0.0009) +[2023-10-08 17:35:58,554][21195] Updated weights for policy 0, policy_version 46460 (0.0009) +[2023-10-08 17:35:58,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 94797824. Throughput: 0: 1739.8, 1: 1702.3. Samples: 23702322. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:35:58,804][19739] Avg episode reward: [(0, '661.470'), (1, '835.550')] +[2023-10-08 17:36:02,393][21194] Updated weights for policy 1, policy_version 46120 (0.0008) +[2023-10-08 17:36:02,471][21195] Updated weights for policy 0, policy_version 46470 (0.0008) +[2023-10-08 17:36:02,758][21194] Updated weights for policy 1, policy_version 46130 (0.0008) +[2023-10-08 17:36:02,831][21195] Updated weights for policy 0, policy_version 46480 (0.0008) +[2023-10-08 17:36:03,119][21194] Updated weights for policy 1, policy_version 46140 (0.0008) +[2023-10-08 17:36:03,194][21195] Updated weights for policy 0, policy_version 46490 (0.0009) +[2023-10-08 17:36:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 94863360. Throughput: 0: 1717.5, 1: 1718.9. Samples: 23717424. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:36:03,803][19739] Avg episode reward: [(0, '661.470'), (1, '835.550')] +[2023-10-08 17:36:07,075][21195] Updated weights for policy 0, policy_version 46500 (0.0007) +[2023-10-08 17:36:07,092][21194] Updated weights for policy 1, policy_version 46150 (0.0007) +[2023-10-08 17:36:07,444][21195] Updated weights for policy 0, policy_version 46510 (0.0007) +[2023-10-08 17:36:07,462][21194] Updated weights for policy 1, policy_version 46160 (0.0008) +[2023-10-08 17:36:07,815][21195] Updated weights for policy 0, policy_version 46520 (0.0008) +[2023-10-08 17:36:07,820][21194] Updated weights for policy 1, policy_version 46170 (0.0008) +[2023-10-08 17:36:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 94928896. Throughput: 0: 1749.2, 1: 1722.0. Samples: 23734146. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 17:36:08,803][19739] Avg episode reward: [(0, '661.470'), (1, '835.550')] +[2023-10-08 17:36:11,838][21194] Updated weights for policy 1, policy_version 46180 (0.0009) +[2023-10-08 17:36:11,897][21195] Updated weights for policy 0, policy_version 46530 (0.0007) +[2023-10-08 17:36:12,198][21194] Updated weights for policy 1, policy_version 46190 (0.0009) +[2023-10-08 17:36:12,270][21195] Updated weights for policy 0, policy_version 46540 (0.0007) +[2023-10-08 17:36:12,560][21194] Updated weights for policy 1, policy_version 46200 (0.0008) +[2023-10-08 17:36:12,646][21195] Updated weights for policy 0, policy_version 46550 (0.0008) +[2023-10-08 17:36:13,016][21195] Updated weights for policy 0, policy_version 46560 (0.0008) +[2023-10-08 17:36:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 94994432. Throughput: 0: 1720.0, 1: 1689.2. Samples: 23753026. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:13,803][19739] Avg episode reward: [(0, '661.470'), (1, '835.550')] +[2023-10-08 17:36:16,548][21194] Updated weights for policy 1, policy_version 46210 (0.0007) +[2023-10-08 17:36:16,796][21195] Updated weights for policy 0, policy_version 46570 (0.0009) +[2023-10-08 17:36:16,950][21194] Updated weights for policy 1, policy_version 46220 (0.0007) +[2023-10-08 17:36:17,164][21195] Updated weights for policy 0, policy_version 46580 (0.0008) +[2023-10-08 17:36:17,319][21194] Updated weights for policy 1, policy_version 46230 (0.0008) +[2023-10-08 17:36:17,532][21195] Updated weights for policy 0, policy_version 46590 (0.0009) +[2023-10-08 17:36:17,687][21194] Updated weights for policy 1, policy_version 46240 (0.0008) +[2023-10-08 17:36:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 95059968. Throughput: 0: 1724.0, 1: 1721.1. Samples: 23769720. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:18,803][19739] Avg episode reward: [(0, '647.520'), (1, '831.300')] +[2023-10-08 17:36:21,625][21195] Updated weights for policy 0, policy_version 46600 (0.0009) +[2023-10-08 17:36:21,760][21194] Updated weights for policy 1, policy_version 46250 (0.0009) +[2023-10-08 17:36:21,993][21195] Updated weights for policy 0, policy_version 46610 (0.0008) +[2023-10-08 17:36:22,131][21194] Updated weights for policy 1, policy_version 46260 (0.0008) +[2023-10-08 17:36:22,367][21195] Updated weights for policy 0, policy_version 46620 (0.0008) +[2023-10-08 17:36:22,496][21194] Updated weights for policy 1, policy_version 46270 (0.0008) +[2023-10-08 17:36:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 95125504. Throughput: 0: 1740.0, 1: 1701.5. Samples: 23784764. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:23,804][19739] Avg episode reward: [(0, '647.520'), (1, '831.300')] +[2023-10-08 17:36:26,103][21195] Updated weights for policy 0, policy_version 46630 (0.0009) +[2023-10-08 17:36:26,370][21194] Updated weights for policy 1, policy_version 46280 (0.0009) +[2023-10-08 17:36:26,471][21195] Updated weights for policy 0, policy_version 46640 (0.0007) +[2023-10-08 17:36:26,738][21194] Updated weights for policy 1, policy_version 46290 (0.0007) +[2023-10-08 17:36:26,843][21195] Updated weights for policy 0, policy_version 46650 (0.0010) +[2023-10-08 17:36:27,098][21194] Updated weights for policy 1, policy_version 46300 (0.0009) +[2023-10-08 17:36:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 95191040. Throughput: 0: 1722.6, 1: 1689.3. Samples: 23804856. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:28,803][19739] Avg episode reward: [(0, '651.190'), (1, '818.610')] +[2023-10-08 17:36:30,793][21195] Updated weights for policy 0, policy_version 46660 (0.0009) +[2023-10-08 17:36:31,125][21194] Updated weights for policy 1, policy_version 46310 (0.0008) +[2023-10-08 17:36:31,162][21195] Updated weights for policy 0, policy_version 46670 (0.0009) +[2023-10-08 17:36:31,488][21194] Updated weights for policy 1, policy_version 46320 (0.0007) +[2023-10-08 17:36:31,531][21195] Updated weights for policy 0, policy_version 46680 (0.0007) +[2023-10-08 17:36:31,854][21194] Updated weights for policy 1, policy_version 46330 (0.0009) +[2023-10-08 17:36:33,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 95256576. Throughput: 0: 1743.4, 1: 1712.7. Samples: 23821682. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:33,803][19739] Avg episode reward: [(0, '651.640'), (1, '833.720')] +[2023-10-08 17:36:35,278][21195] Updated weights for policy 0, policy_version 46690 (0.0009) +[2023-10-08 17:36:35,648][21195] Updated weights for policy 0, policy_version 46700 (0.0009) +[2023-10-08 17:36:35,786][21194] Updated weights for policy 1, policy_version 46340 (0.0009) +[2023-10-08 17:36:36,017][21195] Updated weights for policy 0, policy_version 46710 (0.0007) +[2023-10-08 17:36:36,161][21194] Updated weights for policy 1, policy_version 46350 (0.0008) +[2023-10-08 17:36:36,376][21195] Updated weights for policy 0, policy_version 46720 (0.0007) +[2023-10-08 17:36:36,532][21194] Updated weights for policy 1, policy_version 46360 (0.0009) +[2023-10-08 17:36:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 95322112. Throughput: 0: 1728.8, 1: 1689.4. Samples: 23835962. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:38,803][19739] Avg episode reward: [(0, '651.640'), (1, '833.720')] +[2023-10-08 17:36:40,118][21195] Updated weights for policy 0, policy_version 46730 (0.0007) +[2023-10-08 17:36:40,483][21195] Updated weights for policy 0, policy_version 46740 (0.0010) +[2023-10-08 17:36:40,620][21194] Updated weights for policy 1, policy_version 46370 (0.0011) +[2023-10-08 17:36:40,855][21195] Updated weights for policy 0, policy_version 46750 (0.0008) +[2023-10-08 17:36:40,988][21194] Updated weights for policy 1, policy_version 46380 (0.0008) +[2023-10-08 17:36:41,353][21194] Updated weights for policy 1, policy_version 46390 (0.0010) +[2023-10-08 17:36:41,718][21194] Updated weights for policy 1, policy_version 46400 (0.0011) +[2023-10-08 17:36:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 95387648. Throughput: 0: 1735.8, 1: 1708.1. Samples: 23857294. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 17:36:43,803][19739] Avg episode reward: [(0, '651.640'), (1, '833.720')] +[2023-10-08 17:36:44,746][21195] Updated weights for policy 0, policy_version 46760 (0.0008) +[2023-10-08 17:36:45,124][21195] Updated weights for policy 0, policy_version 46770 (0.0010) +[2023-10-08 17:36:45,493][21195] Updated weights for policy 0, policy_version 46780 (0.0009) +[2023-10-08 17:36:45,747][21194] Updated weights for policy 1, policy_version 46410 (0.0008) +[2023-10-08 17:36:46,127][21194] Updated weights for policy 1, policy_version 46420 (0.0009) +[2023-10-08 17:36:46,499][21194] Updated weights for policy 1, policy_version 46430 (0.0010) +[2023-10-08 17:36:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 95453184. Throughput: 0: 1760.8, 1: 1702.2. Samples: 23873262. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:36:48,803][19739] Avg episode reward: [(0, '662.880'), (1, '833.720')] +[2023-10-08 17:36:49,524][21195] Updated weights for policy 0, policy_version 46790 (0.0009) +[2023-10-08 17:36:49,894][21195] Updated weights for policy 0, policy_version 46800 (0.0008) +[2023-10-08 17:36:50,263][21195] Updated weights for policy 0, policy_version 46810 (0.0009) +[2023-10-08 17:36:50,651][21194] Updated weights for policy 1, policy_version 46440 (0.0008) +[2023-10-08 17:36:51,010][21194] Updated weights for policy 1, policy_version 46450 (0.0007) +[2023-10-08 17:36:51,377][21194] Updated weights for policy 1, policy_version 46460 (0.0007) +[2023-10-08 17:36:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 95518720. Throughput: 0: 1732.2, 1: 1684.6. Samples: 23887902. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:36:53,804][19739] Avg episode reward: [(0, '662.880'), (1, '848.680')] +[2023-10-08 17:36:54,135][21195] Updated weights for policy 0, policy_version 46820 (0.0008) +[2023-10-08 17:36:54,504][21195] Updated weights for policy 0, policy_version 46830 (0.0007) +[2023-10-08 17:36:54,882][21195] Updated weights for policy 0, policy_version 46840 (0.0007) +[2023-10-08 17:36:55,236][21194] Updated weights for policy 1, policy_version 46470 (0.0008) +[2023-10-08 17:36:55,597][21194] Updated weights for policy 1, policy_version 46480 (0.0010) +[2023-10-08 17:36:55,960][21194] Updated weights for policy 1, policy_version 46490 (0.0009) +[2023-10-08 17:36:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 95584256. Throughput: 0: 1759.6, 1: 1718.6. Samples: 23909546. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:36:58,803][19739] Avg episode reward: [(0, '662.880'), (1, '848.680')] +[2023-10-08 17:36:58,817][21195] Updated weights for policy 0, policy_version 46850 (0.0009) +[2023-10-08 17:36:59,186][21195] Updated weights for policy 0, policy_version 46860 (0.0007) +[2023-10-08 17:36:59,558][21195] Updated weights for policy 0, policy_version 46870 (0.0007) +[2023-10-08 17:36:59,921][21194] Updated weights for policy 1, policy_version 46500 (0.0010) +[2023-10-08 17:36:59,923][21195] Updated weights for policy 0, policy_version 46880 (0.0008) +[2023-10-08 17:37:00,287][21194] Updated weights for policy 1, policy_version 46510 (0.0009) +[2023-10-08 17:37:00,650][21194] Updated weights for policy 1, policy_version 46520 (0.0009) +[2023-10-08 17:37:03,729][21195] Updated weights for policy 0, policy_version 46890 (0.0009) +[2023-10-08 17:37:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 95649792. Throughput: 0: 1748.8, 1: 1689.6. Samples: 23924450. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:37:03,803][19739] Avg episode reward: [(0, '662.880'), (1, '848.880')] +[2023-10-08 17:37:04,099][21195] Updated weights for policy 0, policy_version 46900 (0.0010) +[2023-10-08 17:37:04,479][21195] Updated weights for policy 0, policy_version 46910 (0.0007) +[2023-10-08 17:37:04,593][21194] Updated weights for policy 1, policy_version 46530 (0.0008) +[2023-10-08 17:37:04,999][21194] Updated weights for policy 1, policy_version 46540 (0.0008) +[2023-10-08 17:37:05,353][21194] Updated weights for policy 1, policy_version 46550 (0.0010) +[2023-10-08 17:37:05,722][21194] Updated weights for policy 1, policy_version 46560 (0.0009) +[2023-10-08 17:37:08,306][21195] Updated weights for policy 0, policy_version 46920 (0.0007) +[2023-10-08 17:37:08,678][21195] Updated weights for policy 0, policy_version 46930 (0.0008) +[2023-10-08 17:37:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 95715328. Throughput: 0: 1743.5, 1: 1711.8. Samples: 23940252. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:37:08,803][19739] Avg episode reward: [(0, '662.880'), (1, '848.880')] +[2023-10-08 17:37:09,045][21195] Updated weights for policy 0, policy_version 46940 (0.0008) +[2023-10-08 17:37:09,622][21194] Updated weights for policy 1, policy_version 46570 (0.0009) +[2023-10-08 17:37:09,983][21194] Updated weights for policy 1, policy_version 46580 (0.0009) +[2023-10-08 17:37:10,354][21194] Updated weights for policy 1, policy_version 46590 (0.0009) +[2023-10-08 17:37:12,957][21195] Updated weights for policy 0, policy_version 46950 (0.0007) +[2023-10-08 17:37:13,332][21195] Updated weights for policy 0, policy_version 46960 (0.0009) +[2023-10-08 17:37:13,701][21195] Updated weights for policy 0, policy_version 46970 (0.0009) +[2023-10-08 17:37:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 95780864. Throughput: 0: 1759.6, 1: 1724.9. Samples: 23961660. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:37:13,803][19739] Avg episode reward: [(0, '662.880'), (1, '848.880')] +[2023-10-08 17:37:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000046592_47710208.pth... +[2023-10-08 17:37:13,844][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000044992_46071808.pth +[2023-10-08 17:37:13,920][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000046976_48103424.pth... +[2023-10-08 17:37:13,958][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000045344_46432256.pth +[2023-10-08 17:37:14,326][21194] Updated weights for policy 1, policy_version 46600 (0.0009) +[2023-10-08 17:37:14,688][21194] Updated weights for policy 1, policy_version 46610 (0.0010) +[2023-10-08 17:37:15,054][21194] Updated weights for policy 1, policy_version 46620 (0.0007) +[2023-10-08 17:37:17,656][21195] Updated weights for policy 0, policy_version 46980 (0.0008) +[2023-10-08 17:37:18,030][21195] Updated weights for policy 0, policy_version 46990 (0.0010) +[2023-10-08 17:37:18,403][21195] Updated weights for policy 0, policy_version 47000 (0.0008) +[2023-10-08 17:37:18,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 95879168. Throughput: 0: 1730.7, 1: 1697.2. Samples: 23975936. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:18,803][19739] Avg episode reward: [(0, '666.680'), (1, '854.300')] +[2023-10-08 17:37:19,049][21194] Updated weights for policy 1, policy_version 46630 (0.0007) +[2023-10-08 17:37:19,413][21194] Updated weights for policy 1, policy_version 46640 (0.0008) +[2023-10-08 17:37:19,774][21194] Updated weights for policy 1, policy_version 46650 (0.0011) +[2023-10-08 17:37:22,254][21195] Updated weights for policy 0, policy_version 47010 (0.0010) +[2023-10-08 17:37:22,625][21195] Updated weights for policy 0, policy_version 47020 (0.0011) +[2023-10-08 17:37:23,001][21195] Updated weights for policy 0, policy_version 47030 (0.0009) +[2023-10-08 17:37:23,380][21195] Updated weights for policy 0, policy_version 47040 (0.0008) +[2023-10-08 17:37:23,722][21194] Updated weights for policy 1, policy_version 46660 (0.0010) +[2023-10-08 17:37:23,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 95944704. Throughput: 0: 1764.8, 1: 1721.5. Samples: 23992842. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:23,803][19739] Avg episode reward: [(0, '681.890'), (1, '869.480')] +[2023-10-08 17:37:24,088][21194] Updated weights for policy 1, policy_version 46670 (0.0011) +[2023-10-08 17:37:24,464][21194] Updated weights for policy 1, policy_version 46680 (0.0009) +[2023-10-08 17:37:27,467][21195] Updated weights for policy 0, policy_version 47050 (0.0007) +[2023-10-08 17:37:27,845][21195] Updated weights for policy 0, policy_version 47060 (0.0010) +[2023-10-08 17:37:28,218][21195] Updated weights for policy 0, policy_version 47070 (0.0008) +[2023-10-08 17:37:28,293][21194] Updated weights for policy 1, policy_version 46690 (0.0008) +[2023-10-08 17:37:28,658][21194] Updated weights for policy 1, policy_version 46700 (0.0008) +[2023-10-08 17:37:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96010240. Throughput: 0: 1739.1, 1: 1727.5. Samples: 24013292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:28,803][19739] Avg episode reward: [(0, '675.240'), (1, '869.480')] +[2023-10-08 17:37:29,019][21194] Updated weights for policy 1, policy_version 46710 (0.0008) +[2023-10-08 17:37:29,386][21194] Updated weights for policy 1, policy_version 46720 (0.0010) +[2023-10-08 17:37:32,122][21195] Updated weights for policy 0, policy_version 47080 (0.0009) +[2023-10-08 17:37:32,486][21195] Updated weights for policy 0, policy_version 47090 (0.0008) +[2023-10-08 17:37:32,855][21195] Updated weights for policy 0, policy_version 47100 (0.0007) +[2023-10-08 17:37:33,461][21194] Updated weights for policy 1, policy_version 46730 (0.0007) +[2023-10-08 17:37:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96075776. Throughput: 0: 1724.3, 1: 1712.1. Samples: 24027898. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:33,803][19739] Avg episode reward: [(0, '675.240'), (1, '884.720')] +[2023-10-08 17:37:33,833][21194] Updated weights for policy 1, policy_version 46740 (0.0007) +[2023-10-08 17:37:34,196][21194] Updated weights for policy 1, policy_version 46750 (0.0008) +[2023-10-08 17:37:36,673][21195] Updated weights for policy 0, policy_version 47110 (0.0009) +[2023-10-08 17:37:37,041][21195] Updated weights for policy 0, policy_version 47120 (0.0008) +[2023-10-08 17:37:37,404][21195] Updated weights for policy 0, policy_version 47130 (0.0007) +[2023-10-08 17:37:37,984][21194] Updated weights for policy 1, policy_version 46760 (0.0009) +[2023-10-08 17:37:38,352][21194] Updated weights for policy 1, policy_version 46770 (0.0009) +[2023-10-08 17:37:38,720][21194] Updated weights for policy 1, policy_version 46780 (0.0010) +[2023-10-08 17:37:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96141312. Throughput: 0: 1746.2, 1: 1731.8. Samples: 24044410. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:38,803][19739] Avg episode reward: [(0, '675.240'), (1, '883.960')] +[2023-10-08 17:37:41,354][21195] Updated weights for policy 0, policy_version 47140 (0.0009) +[2023-10-08 17:37:41,723][21195] Updated weights for policy 0, policy_version 47150 (0.0008) +[2023-10-08 17:37:42,092][21195] Updated weights for policy 0, policy_version 47160 (0.0007) +[2023-10-08 17:37:42,768][21194] Updated weights for policy 1, policy_version 46790 (0.0007) +[2023-10-08 17:37:43,144][21194] Updated weights for policy 1, policy_version 46800 (0.0007) +[2023-10-08 17:37:43,519][21194] Updated weights for policy 1, policy_version 46810 (0.0007) +[2023-10-08 17:37:43,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 96239616. Throughput: 0: 1720.3, 1: 1718.4. Samples: 24064286. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:43,803][19739] Avg episode reward: [(0, '690.290'), (1, '883.960')] +[2023-10-08 17:37:45,880][21195] Updated weights for policy 0, policy_version 47170 (0.0008) +[2023-10-08 17:37:46,249][21195] Updated weights for policy 0, policy_version 47180 (0.0009) +[2023-10-08 17:37:46,617][21195] Updated weights for policy 0, policy_version 47190 (0.0007) +[2023-10-08 17:37:46,995][21195] Updated weights for policy 0, policy_version 47200 (0.0007) +[2023-10-08 17:37:47,387][21194] Updated weights for policy 1, policy_version 46820 (0.0010) +[2023-10-08 17:37:47,763][21194] Updated weights for policy 1, policy_version 46830 (0.0008) +[2023-10-08 17:37:48,127][21194] Updated weights for policy 1, policy_version 46840 (0.0008) +[2023-10-08 17:37:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 96305152. Throughput: 0: 1734.1, 1: 1726.7. Samples: 24080186. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 17:37:48,803][19739] Avg episode reward: [(0, '690.290'), (1, '883.960')] +[2023-10-08 17:37:50,933][21195] Updated weights for policy 0, policy_version 47210 (0.0008) +[2023-10-08 17:37:51,306][21195] Updated weights for policy 0, policy_version 47220 (0.0008) +[2023-10-08 17:37:51,684][21195] Updated weights for policy 0, policy_version 47230 (0.0008) +[2023-10-08 17:37:52,244][21194] Updated weights for policy 1, policy_version 46850 (0.0008) +[2023-10-08 17:37:52,657][21194] Updated weights for policy 1, policy_version 46860 (0.0008) +[2023-10-08 17:37:53,018][21194] Updated weights for policy 1, policy_version 46870 (0.0009) +[2023-10-08 17:37:53,385][21194] Updated weights for policy 1, policy_version 46880 (0.0010) +[2023-10-08 17:37:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 96370688. Throughput: 0: 1723.0, 1: 1725.7. Samples: 24095444. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:37:53,804][19739] Avg episode reward: [(0, '690.290'), (1, '883.960')] +[2023-10-08 17:37:55,497][21195] Updated weights for policy 0, policy_version 47240 (0.0011) +[2023-10-08 17:37:55,856][21195] Updated weights for policy 0, policy_version 47250 (0.0010) +[2023-10-08 17:37:56,234][21195] Updated weights for policy 0, policy_version 47260 (0.0009) +[2023-10-08 17:37:57,267][21194] Updated weights for policy 1, policy_version 46890 (0.0009) +[2023-10-08 17:37:57,633][21194] Updated weights for policy 1, policy_version 46900 (0.0010) +[2023-10-08 17:37:58,013][21194] Updated weights for policy 1, policy_version 46910 (0.0009) +[2023-10-08 17:37:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 96436224. Throughput: 0: 1722.9, 1: 1698.9. Samples: 24115644. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:37:58,803][19739] Avg episode reward: [(0, '690.290'), (1, '883.960')] +[2023-10-08 17:38:00,315][21195] Updated weights for policy 0, policy_version 47270 (0.0010) +[2023-10-08 17:38:00,676][21195] Updated weights for policy 0, policy_version 47280 (0.0007) +[2023-10-08 17:38:01,051][21195] Updated weights for policy 0, policy_version 47290 (0.0008) +[2023-10-08 17:38:02,245][21194] Updated weights for policy 1, policy_version 46920 (0.0009) +[2023-10-08 17:38:02,614][21194] Updated weights for policy 1, policy_version 46930 (0.0008) +[2023-10-08 17:38:02,975][21194] Updated weights for policy 1, policy_version 46940 (0.0008) +[2023-10-08 17:38:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 96501760. Throughput: 0: 1745.2, 1: 1722.7. Samples: 24131992. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:38:03,803][19739] Avg episode reward: [(0, '690.290'), (1, '883.960')] +[2023-10-08 17:38:05,064][21195] Updated weights for policy 0, policy_version 47300 (0.0009) +[2023-10-08 17:38:05,440][21195] Updated weights for policy 0, policy_version 47310 (0.0008) +[2023-10-08 17:38:05,802][21195] Updated weights for policy 0, policy_version 47320 (0.0008) +[2023-10-08 17:38:06,795][21194] Updated weights for policy 1, policy_version 46950 (0.0008) +[2023-10-08 17:38:07,166][21194] Updated weights for policy 1, policy_version 46960 (0.0009) +[2023-10-08 17:38:07,537][21194] Updated weights for policy 1, policy_version 46970 (0.0008) +[2023-10-08 17:38:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 96567296. Throughput: 0: 1711.0, 1: 1715.3. Samples: 24147028. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:38:08,804][19739] Avg episode reward: [(0, '690.290'), (1, '887.080')] +[2023-10-08 17:38:09,702][21195] Updated weights for policy 0, policy_version 47330 (0.0007) +[2023-10-08 17:38:10,073][21195] Updated weights for policy 0, policy_version 47340 (0.0008) +[2023-10-08 17:38:10,445][21195] Updated weights for policy 0, policy_version 47350 (0.0009) +[2023-10-08 17:38:10,813][21195] Updated weights for policy 0, policy_version 47360 (0.0008) +[2023-10-08 17:38:11,418][21194] Updated weights for policy 1, policy_version 46980 (0.0008) +[2023-10-08 17:38:11,787][21194] Updated weights for policy 1, policy_version 46990 (0.0008) +[2023-10-08 17:38:12,157][21194] Updated weights for policy 1, policy_version 47000 (0.0010) +[2023-10-08 17:38:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 96632832. Throughput: 0: 1732.4, 1: 1696.1. Samples: 24167576. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:38:13,803][19739] Avg episode reward: [(0, '690.290'), (1, '887.080')] +[2023-10-08 17:38:14,843][21195] Updated weights for policy 0, policy_version 47370 (0.0008) +[2023-10-08 17:38:15,215][21195] Updated weights for policy 0, policy_version 47380 (0.0009) +[2023-10-08 17:38:15,583][21195] Updated weights for policy 0, policy_version 47390 (0.0009) +[2023-10-08 17:38:15,975][21194] Updated weights for policy 1, policy_version 47010 (0.0008) +[2023-10-08 17:38:16,344][21194] Updated weights for policy 1, policy_version 47020 (0.0008) +[2023-10-08 17:38:16,705][21194] Updated weights for policy 1, policy_version 47030 (0.0007) +[2023-10-08 17:38:17,069][21194] Updated weights for policy 1, policy_version 47040 (0.0008) +[2023-10-08 17:38:18,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96698368. Throughput: 0: 1741.4, 1: 1733.3. Samples: 24184260. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:38:18,803][19739] Avg episode reward: [(0, '690.290'), (1, '887.080')] +[2023-10-08 17:38:19,427][21195] Updated weights for policy 0, policy_version 47400 (0.0008) +[2023-10-08 17:38:19,790][21195] Updated weights for policy 0, policy_version 47410 (0.0008) +[2023-10-08 17:38:20,153][21195] Updated weights for policy 0, policy_version 47420 (0.0007) +[2023-10-08 17:38:21,104][21194] Updated weights for policy 1, policy_version 47050 (0.0009) +[2023-10-08 17:38:21,470][21194] Updated weights for policy 1, policy_version 47060 (0.0007) +[2023-10-08 17:38:21,829][21194] Updated weights for policy 1, policy_version 47070 (0.0011) +[2023-10-08 17:38:23,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.2, 300 sec: 13773.7). Total num frames: 96763904. Throughput: 0: 1721.1, 1: 1699.3. Samples: 24198328. Policy #0 lag: (min: 9.0, avg: 22.9, max: 41.0) +[2023-10-08 17:38:23,804][19739] Avg episode reward: [(0, '690.290'), (1, '887.080')] +[2023-10-08 17:38:24,022][21195] Updated weights for policy 0, policy_version 47430 (0.0008) +[2023-10-08 17:38:24,395][21195] Updated weights for policy 0, policy_version 47440 (0.0009) +[2023-10-08 17:38:24,765][21195] Updated weights for policy 0, policy_version 47450 (0.0010) +[2023-10-08 17:38:25,955][21194] Updated weights for policy 1, policy_version 47080 (0.0012) +[2023-10-08 17:38:26,323][21194] Updated weights for policy 1, policy_version 47090 (0.0007) +[2023-10-08 17:38:26,703][21194] Updated weights for policy 1, policy_version 47100 (0.0010) +[2023-10-08 17:38:28,665][21195] Updated weights for policy 0, policy_version 47460 (0.0011) +[2023-10-08 17:38:28,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96829440. Throughput: 0: 1742.1, 1: 1707.5. Samples: 24219520. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:38:28,803][19739] Avg episode reward: [(0, '690.290'), (1, '901.980')] +[2023-10-08 17:38:29,040][21195] Updated weights for policy 0, policy_version 47470 (0.0010) +[2023-10-08 17:38:29,417][21195] Updated weights for policy 0, policy_version 47480 (0.0010) +[2023-10-08 17:38:30,466][21194] Updated weights for policy 1, policy_version 47110 (0.0010) +[2023-10-08 17:38:30,832][21194] Updated weights for policy 1, policy_version 47120 (0.0011) +[2023-10-08 17:38:31,199][21194] Updated weights for policy 1, policy_version 47130 (0.0010) +[2023-10-08 17:38:33,476][21195] Updated weights for policy 0, policy_version 47490 (0.0010) +[2023-10-08 17:38:33,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96894976. Throughput: 0: 1725.9, 1: 1712.2. Samples: 24234900. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:38:33,803][19739] Avg episode reward: [(0, '690.290'), (1, '913.870')] +[2023-10-08 17:38:33,854][21195] Updated weights for policy 0, policy_version 47500 (0.0010) +[2023-10-08 17:38:34,215][21195] Updated weights for policy 0, policy_version 47510 (0.0009) +[2023-10-08 17:38:34,591][21195] Updated weights for policy 0, policy_version 47520 (0.0008) +[2023-10-08 17:38:35,079][21194] Updated weights for policy 1, policy_version 47140 (0.0010) +[2023-10-08 17:38:35,438][21194] Updated weights for policy 1, policy_version 47150 (0.0010) +[2023-10-08 17:38:35,805][21194] Updated weights for policy 1, policy_version 47160 (0.0009) +[2023-10-08 17:38:38,492][21195] Updated weights for policy 0, policy_version 47530 (0.0011) +[2023-10-08 17:38:38,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 96960512. Throughput: 0: 1736.3, 1: 1708.9. Samples: 24250476. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:38:38,803][19739] Avg episode reward: [(0, '690.290'), (1, '913.870')] +[2023-10-08 17:38:38,866][21195] Updated weights for policy 0, policy_version 47540 (0.0009) +[2023-10-08 17:38:39,221][21195] Updated weights for policy 0, policy_version 47550 (0.0010) +[2023-10-08 17:38:39,951][21194] Updated weights for policy 1, policy_version 47170 (0.0010) +[2023-10-08 17:38:40,364][21194] Updated weights for policy 1, policy_version 47180 (0.0009) +[2023-10-08 17:38:40,733][21194] Updated weights for policy 1, policy_version 47190 (0.0012) +[2023-10-08 17:38:41,100][21194] Updated weights for policy 1, policy_version 47200 (0.0009) +[2023-10-08 17:38:43,144][21195] Updated weights for policy 0, policy_version 47560 (0.0008) +[2023-10-08 17:38:43,518][21195] Updated weights for policy 0, policy_version 47570 (0.0007) +[2023-10-08 17:38:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 97026048. Throughput: 0: 1735.9, 1: 1734.1. Samples: 24271794. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:38:43,803][19739] Avg episode reward: [(0, '690.290'), (1, '911.180')] +[2023-10-08 17:38:43,881][21195] Updated weights for policy 0, policy_version 47580 (0.0007) +[2023-10-08 17:38:44,823][21194] Updated weights for policy 1, policy_version 47210 (0.0009) +[2023-10-08 17:38:45,189][21194] Updated weights for policy 1, policy_version 47220 (0.0009) +[2023-10-08 17:38:45,553][21194] Updated weights for policy 1, policy_version 47230 (0.0007) +[2023-10-08 17:38:47,774][21195] Updated weights for policy 0, policy_version 47590 (0.0008) +[2023-10-08 17:38:48,142][21195] Updated weights for policy 0, policy_version 47600 (0.0008) +[2023-10-08 17:38:48,501][21195] Updated weights for policy 0, policy_version 47610 (0.0008) +[2023-10-08 17:38:48,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 97124352. Throughput: 0: 1711.0, 1: 1712.5. Samples: 24286050. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:38:48,803][19739] Avg episode reward: [(0, '699.460'), (1, '894.080')] +[2023-10-08 17:38:49,566][21194] Updated weights for policy 1, policy_version 47240 (0.0008) +[2023-10-08 17:38:49,928][21194] Updated weights for policy 1, policy_version 47250 (0.0008) +[2023-10-08 17:38:50,298][21194] Updated weights for policy 1, policy_version 47260 (0.0007) +[2023-10-08 17:38:52,467][21195] Updated weights for policy 0, policy_version 47620 (0.0007) +[2023-10-08 17:38:52,834][21195] Updated weights for policy 0, policy_version 47630 (0.0009) +[2023-10-08 17:38:53,209][21195] Updated weights for policy 0, policy_version 47640 (0.0008) +[2023-10-08 17:38:53,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 97189888. Throughput: 0: 1739.5, 1: 1722.5. Samples: 24302816. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 17:38:53,803][19739] Avg episode reward: [(0, '714.270'), (1, '894.080')] +[2023-10-08 17:38:54,265][21194] Updated weights for policy 1, policy_version 47270 (0.0009) +[2023-10-08 17:38:54,624][21194] Updated weights for policy 1, policy_version 47280 (0.0008) +[2023-10-08 17:38:54,985][21194] Updated weights for policy 1, policy_version 47290 (0.0010) +[2023-10-08 17:38:56,954][21195] Updated weights for policy 0, policy_version 47650 (0.0008) +[2023-10-08 17:38:57,311][21195] Updated weights for policy 0, policy_version 47660 (0.0008) +[2023-10-08 17:38:57,682][21195] Updated weights for policy 0, policy_version 47670 (0.0009) +[2023-10-08 17:38:58,046][21195] Updated weights for policy 0, policy_version 47680 (0.0008) +[2023-10-08 17:38:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 97255424. Throughput: 0: 1726.5, 1: 1741.7. Samples: 24323644. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:38:58,803][19739] Avg episode reward: [(0, '729.250'), (1, '894.080')] +[2023-10-08 17:38:58,961][21194] Updated weights for policy 1, policy_version 47300 (0.0010) +[2023-10-08 17:38:59,322][21194] Updated weights for policy 1, policy_version 47310 (0.0008) +[2023-10-08 17:38:59,686][21194] Updated weights for policy 1, policy_version 47320 (0.0007) +[2023-10-08 17:39:01,889][21195] Updated weights for policy 0, policy_version 47690 (0.0009) +[2023-10-08 17:39:02,258][21195] Updated weights for policy 0, policy_version 47700 (0.0008) +[2023-10-08 17:39:02,642][21195] Updated weights for policy 0, policy_version 47710 (0.0009) +[2023-10-08 17:39:03,439][21194] Updated weights for policy 1, policy_version 47330 (0.0008) +[2023-10-08 17:39:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 97320960. Throughput: 0: 1723.4, 1: 1710.3. Samples: 24338776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:39:03,804][19739] Avg episode reward: [(0, '729.250'), (1, '879.580')] +[2023-10-08 17:39:03,807][21194] Updated weights for policy 1, policy_version 47340 (0.0009) +[2023-10-08 17:39:04,168][21194] Updated weights for policy 1, policy_version 47350 (0.0009) +[2023-10-08 17:39:04,538][21194] Updated weights for policy 1, policy_version 47360 (0.0008) +[2023-10-08 17:39:06,559][21195] Updated weights for policy 0, policy_version 47720 (0.0009) +[2023-10-08 17:39:06,922][21195] Updated weights for policy 0, policy_version 47730 (0.0008) +[2023-10-08 17:39:07,295][21195] Updated weights for policy 0, policy_version 47740 (0.0009) +[2023-10-08 17:39:08,396][21194] Updated weights for policy 1, policy_version 47370 (0.0010) +[2023-10-08 17:39:08,767][21194] Updated weights for policy 1, policy_version 47380 (0.0007) +[2023-10-08 17:39:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 97386496. Throughput: 0: 1740.4, 1: 1746.9. Samples: 24355256. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:39:08,803][19739] Avg episode reward: [(0, '744.150'), (1, '879.670')] +[2023-10-08 17:39:09,133][21194] Updated weights for policy 1, policy_version 47390 (0.0009) +[2023-10-08 17:39:11,152][21195] Updated weights for policy 0, policy_version 47750 (0.0008) +[2023-10-08 17:39:11,521][21195] Updated weights for policy 0, policy_version 47760 (0.0008) +[2023-10-08 17:39:11,894][21195] Updated weights for policy 0, policy_version 47770 (0.0009) +[2023-10-08 17:39:13,117][21194] Updated weights for policy 1, policy_version 47400 (0.0010) +[2023-10-08 17:39:13,478][21194] Updated weights for policy 1, policy_version 47410 (0.0010) +[2023-10-08 17:39:13,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 97452032. Throughput: 0: 1721.4, 1: 1745.6. Samples: 24375536. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:39:13,803][19739] Avg episode reward: [(0, '760.330'), (1, '865.080')] +[2023-10-08 17:39:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000047776_48922624.pth... +[2023-10-08 17:39:13,843][21194] Updated weights for policy 1, policy_version 47420 (0.0010) +[2023-10-08 17:39:13,844][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000046144_47251456.pth +[2023-10-08 17:39:13,986][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000047424_48562176.pth... +[2023-10-08 17:39:14,028][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000045792_46891008.pth +[2023-10-08 17:39:15,776][21195] Updated weights for policy 0, policy_version 47780 (0.0009) +[2023-10-08 17:39:16,143][21195] Updated weights for policy 0, policy_version 47790 (0.0008) +[2023-10-08 17:39:16,514][21195] Updated weights for policy 0, policy_version 47800 (0.0007) +[2023-10-08 17:39:17,753][21194] Updated weights for policy 1, policy_version 47430 (0.0008) +[2023-10-08 17:39:18,122][21194] Updated weights for policy 1, policy_version 47440 (0.0009) +[2023-10-08 17:39:18,480][21194] Updated weights for policy 1, policy_version 47450 (0.0009) +[2023-10-08 17:39:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 97550336. Throughput: 0: 1741.8, 1: 1735.6. Samples: 24391384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:39:18,803][19739] Avg episode reward: [(0, '760.390'), (1, '865.080')] +[2023-10-08 17:39:20,321][21195] Updated weights for policy 0, policy_version 47810 (0.0007) +[2023-10-08 17:39:20,687][21195] Updated weights for policy 0, policy_version 47820 (0.0007) +[2023-10-08 17:39:21,058][21195] Updated weights for policy 0, policy_version 47830 (0.0008) +[2023-10-08 17:39:21,429][21195] Updated weights for policy 0, policy_version 47840 (0.0007) +[2023-10-08 17:39:22,275][21194] Updated weights for policy 1, policy_version 47460 (0.0009) +[2023-10-08 17:39:22,638][21194] Updated weights for policy 1, policy_version 47470 (0.0008) +[2023-10-08 17:39:22,996][21194] Updated weights for policy 1, policy_version 47480 (0.0009) +[2023-10-08 17:39:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 97615872. Throughput: 0: 1736.7, 1: 1741.1. Samples: 24406974. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:39:23,803][19739] Avg episode reward: [(0, '760.390'), (1, '835.260')] +[2023-10-08 17:39:25,311][21195] Updated weights for policy 0, policy_version 47850 (0.0007) +[2023-10-08 17:39:25,692][21195] Updated weights for policy 0, policy_version 47860 (0.0010) +[2023-10-08 17:39:26,051][21195] Updated weights for policy 0, policy_version 47870 (0.0008) +[2023-10-08 17:39:27,085][21194] Updated weights for policy 1, policy_version 47490 (0.0010) +[2023-10-08 17:39:27,490][21194] Updated weights for policy 1, policy_version 47500 (0.0008) +[2023-10-08 17:39:27,854][21194] Updated weights for policy 1, policy_version 47510 (0.0007) +[2023-10-08 17:39:28,214][21194] Updated weights for policy 1, policy_version 47520 (0.0010) +[2023-10-08 17:39:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 97681408. Throughput: 0: 1741.8, 1: 1718.7. Samples: 24427518. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:39:28,803][19739] Avg episode reward: [(0, '760.390'), (1, '835.260')] +[2023-10-08 17:39:29,868][21195] Updated weights for policy 0, policy_version 47880 (0.0009) +[2023-10-08 17:39:30,235][21195] Updated weights for policy 0, policy_version 47890 (0.0008) +[2023-10-08 17:39:30,605][21195] Updated weights for policy 0, policy_version 47900 (0.0009) +[2023-10-08 17:39:32,159][21194] Updated weights for policy 1, policy_version 47530 (0.0008) +[2023-10-08 17:39:32,522][21194] Updated weights for policy 1, policy_version 47540 (0.0008) +[2023-10-08 17:39:32,889][21194] Updated weights for policy 1, policy_version 47550 (0.0008) +[2023-10-08 17:39:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 97746944. Throughput: 0: 1772.1, 1: 1740.5. Samples: 24444118. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:39:33,803][19739] Avg episode reward: [(0, '760.390'), (1, '835.260')] +[2023-10-08 17:39:34,645][21195] Updated weights for policy 0, policy_version 47910 (0.0008) +[2023-10-08 17:39:35,005][21195] Updated weights for policy 0, policy_version 47920 (0.0009) +[2023-10-08 17:39:35,378][21195] Updated weights for policy 0, policy_version 47930 (0.0009) +[2023-10-08 17:39:36,953][21194] Updated weights for policy 1, policy_version 47560 (0.0008) +[2023-10-08 17:39:37,320][21194] Updated weights for policy 1, policy_version 47570 (0.0007) +[2023-10-08 17:39:37,685][21194] Updated weights for policy 1, policy_version 47580 (0.0010) +[2023-10-08 17:39:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 97812480. Throughput: 0: 1744.7, 1: 1729.6. Samples: 24459160. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:39:38,803][19739] Avg episode reward: [(0, '760.390'), (1, '835.260')] +[2023-10-08 17:39:39,114][21195] Updated weights for policy 0, policy_version 47940 (0.0008) +[2023-10-08 17:39:39,489][21195] Updated weights for policy 0, policy_version 47950 (0.0008) +[2023-10-08 17:39:39,861][21195] Updated weights for policy 0, policy_version 47960 (0.0008) +[2023-10-08 17:39:41,674][21194] Updated weights for policy 1, policy_version 47590 (0.0009) +[2023-10-08 17:39:42,042][21194] Updated weights for policy 1, policy_version 47600 (0.0007) +[2023-10-08 17:39:42,396][21194] Updated weights for policy 1, policy_version 47610 (0.0007) +[2023-10-08 17:39:43,624][21195] Updated weights for policy 0, policy_version 47970 (0.0008) +[2023-10-08 17:39:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 97878016. Throughput: 0: 1761.6, 1: 1709.6. Samples: 24479848. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:39:43,804][19739] Avg episode reward: [(0, '760.390'), (1, '829.560')] +[2023-10-08 17:39:43,992][21195] Updated weights for policy 0, policy_version 47980 (0.0009) +[2023-10-08 17:39:44,370][21195] Updated weights for policy 0, policy_version 47990 (0.0008) +[2023-10-08 17:39:44,745][21195] Updated weights for policy 0, policy_version 48000 (0.0008) +[2023-10-08 17:39:46,323][21194] Updated weights for policy 1, policy_version 47620 (0.0007) +[2023-10-08 17:39:46,699][21194] Updated weights for policy 1, policy_version 47630 (0.0008) +[2023-10-08 17:39:47,060][21194] Updated weights for policy 1, policy_version 47640 (0.0007) +[2023-10-08 17:39:48,734][21195] Updated weights for policy 0, policy_version 48010 (0.0011) +[2023-10-08 17:39:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 97943552. Throughput: 0: 1756.5, 1: 1738.5. Samples: 24496054. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:39:48,803][19739] Avg episode reward: [(0, '746.880'), (1, '829.560')] +[2023-10-08 17:39:49,103][21195] Updated weights for policy 0, policy_version 48020 (0.0009) +[2023-10-08 17:39:49,472][21195] Updated weights for policy 0, policy_version 48030 (0.0009) +[2023-10-08 17:39:51,023][21194] Updated weights for policy 1, policy_version 47650 (0.0008) +[2023-10-08 17:39:51,392][21194] Updated weights for policy 1, policy_version 47660 (0.0009) +[2023-10-08 17:39:51,749][21194] Updated weights for policy 1, policy_version 47670 (0.0008) +[2023-10-08 17:39:52,122][21194] Updated weights for policy 1, policy_version 47680 (0.0008) +[2023-10-08 17:39:53,297][21195] Updated weights for policy 0, policy_version 48040 (0.0010) +[2023-10-08 17:39:53,665][21195] Updated weights for policy 0, policy_version 48050 (0.0009) +[2023-10-08 17:39:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 98009088. Throughput: 0: 1750.4, 1: 1706.2. Samples: 24510804. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:39:53,804][19739] Avg episode reward: [(0, '747.040'), (1, '829.560')] +[2023-10-08 17:39:54,038][21195] Updated weights for policy 0, policy_version 48060 (0.0011) +[2023-10-08 17:39:56,024][21194] Updated weights for policy 1, policy_version 47690 (0.0008) +[2023-10-08 17:39:56,406][21194] Updated weights for policy 1, policy_version 47700 (0.0009) +[2023-10-08 17:39:56,761][21194] Updated weights for policy 1, policy_version 47710 (0.0007) +[2023-10-08 17:39:58,108][21195] Updated weights for policy 0, policy_version 48070 (0.0010) +[2023-10-08 17:39:58,487][21195] Updated weights for policy 0, policy_version 48080 (0.0008) +[2023-10-08 17:39:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 98074624. Throughput: 0: 1771.3, 1: 1708.1. Samples: 24532110. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:39:58,803][19739] Avg episode reward: [(0, '761.050'), (1, '829.560')] +[2023-10-08 17:39:58,864][21195] Updated weights for policy 0, policy_version 48090 (0.0008) +[2023-10-08 17:40:00,727][21194] Updated weights for policy 1, policy_version 47720 (0.0007) +[2023-10-08 17:40:01,096][21194] Updated weights for policy 1, policy_version 47730 (0.0007) +[2023-10-08 17:40:01,450][21194] Updated weights for policy 1, policy_version 47740 (0.0009) +[2023-10-08 17:40:02,767][21195] Updated weights for policy 0, policy_version 48100 (0.0008) +[2023-10-08 17:40:03,142][21195] Updated weights for policy 0, policy_version 48110 (0.0007) +[2023-10-08 17:40:03,511][21195] Updated weights for policy 0, policy_version 48120 (0.0009) +[2023-10-08 17:40:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 98140160. Throughput: 0: 1737.2, 1: 1720.2. Samples: 24546970. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 17:40:03,803][19739] Avg episode reward: [(0, '734.370'), (1, '834.840')] +[2023-10-08 17:40:05,449][21194] Updated weights for policy 1, policy_version 47750 (0.0009) +[2023-10-08 17:40:05,805][21194] Updated weights for policy 1, policy_version 47760 (0.0010) +[2023-10-08 17:40:06,174][21194] Updated weights for policy 1, policy_version 47770 (0.0010) +[2023-10-08 17:40:07,362][21195] Updated weights for policy 0, policy_version 48130 (0.0009) +[2023-10-08 17:40:07,733][21195] Updated weights for policy 0, policy_version 48140 (0.0008) +[2023-10-08 17:40:08,107][21195] Updated weights for policy 0, policy_version 48150 (0.0007) +[2023-10-08 17:40:08,476][21195] Updated weights for policy 0, policy_version 48160 (0.0009) +[2023-10-08 17:40:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 98238464. Throughput: 0: 1764.0, 1: 1700.0. Samples: 24562858. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:40:08,803][19739] Avg episode reward: [(0, '704.570'), (1, '834.840')] +[2023-10-08 17:40:10,082][21194] Updated weights for policy 1, policy_version 47780 (0.0010) +[2023-10-08 17:40:10,447][21194] Updated weights for policy 1, policy_version 47790 (0.0009) +[2023-10-08 17:40:10,804][21194] Updated weights for policy 1, policy_version 47800 (0.0009) +[2023-10-08 17:40:12,416][21195] Updated weights for policy 0, policy_version 48170 (0.0009) +[2023-10-08 17:40:12,785][21195] Updated weights for policy 0, policy_version 48180 (0.0007) +[2023-10-08 17:40:13,160][21195] Updated weights for policy 0, policy_version 48190 (0.0010) +[2023-10-08 17:40:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 98304000. Throughput: 0: 1740.3, 1: 1727.8. Samples: 24583584. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:40:13,803][19739] Avg episode reward: [(0, '704.570'), (1, '834.840')] +[2023-10-08 17:40:14,921][21194] Updated weights for policy 1, policy_version 47810 (0.0011) +[2023-10-08 17:40:15,333][21194] Updated weights for policy 1, policy_version 47820 (0.0010) +[2023-10-08 17:40:15,694][21194] Updated weights for policy 1, policy_version 47830 (0.0008) +[2023-10-08 17:40:16,060][21194] Updated weights for policy 1, policy_version 47840 (0.0009) +[2023-10-08 17:40:16,965][21195] Updated weights for policy 0, policy_version 48200 (0.0009) +[2023-10-08 17:40:17,338][21195] Updated weights for policy 0, policy_version 48210 (0.0007) +[2023-10-08 17:40:17,709][21195] Updated weights for policy 0, policy_version 48220 (0.0007) +[2023-10-08 17:40:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 98369536. Throughput: 0: 1725.4, 1: 1703.4. Samples: 24598414. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:40:18,803][19739] Avg episode reward: [(0, '691.480'), (1, '834.840')] +[2023-10-08 17:40:20,075][21194] Updated weights for policy 1, policy_version 47850 (0.0008) +[2023-10-08 17:40:20,437][21194] Updated weights for policy 1, policy_version 47860 (0.0009) +[2023-10-08 17:40:20,805][21194] Updated weights for policy 1, policy_version 47870 (0.0011) +[2023-10-08 17:40:21,661][21195] Updated weights for policy 0, policy_version 48230 (0.0008) +[2023-10-08 17:40:22,032][21195] Updated weights for policy 0, policy_version 48240 (0.0008) +[2023-10-08 17:40:22,408][21195] Updated weights for policy 0, policy_version 48250 (0.0010) +[2023-10-08 17:40:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 98435072. Throughput: 0: 1744.3, 1: 1706.6. Samples: 24614450. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:40:23,804][19739] Avg episode reward: [(0, '691.480'), (1, '834.840')] +[2023-10-08 17:40:24,882][21194] Updated weights for policy 1, policy_version 47880 (0.0010) +[2023-10-08 17:40:25,245][21194] Updated weights for policy 1, policy_version 47890 (0.0010) +[2023-10-08 17:40:25,613][21194] Updated weights for policy 1, policy_version 47900 (0.0011) +[2023-10-08 17:40:26,223][21195] Updated weights for policy 0, policy_version 48260 (0.0008) +[2023-10-08 17:40:26,586][21195] Updated weights for policy 0, policy_version 48270 (0.0007) +[2023-10-08 17:40:26,945][21195] Updated weights for policy 0, policy_version 48280 (0.0007) +[2023-10-08 17:40:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 98500608. Throughput: 0: 1724.0, 1: 1724.1. Samples: 24635012. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:40:28,803][19739] Avg episode reward: [(0, '691.480'), (1, '834.840')] +[2023-10-08 17:40:29,514][21194] Updated weights for policy 1, policy_version 47910 (0.0010) +[2023-10-08 17:40:29,879][21194] Updated weights for policy 1, policy_version 47920 (0.0007) +[2023-10-08 17:40:30,243][21194] Updated weights for policy 1, policy_version 47930 (0.0008) +[2023-10-08 17:40:30,903][21195] Updated weights for policy 0, policy_version 48290 (0.0007) +[2023-10-08 17:40:31,269][21195] Updated weights for policy 0, policy_version 48300 (0.0008) +[2023-10-08 17:40:31,641][21195] Updated weights for policy 0, policy_version 48310 (0.0009) +[2023-10-08 17:40:32,010][21195] Updated weights for policy 0, policy_version 48320 (0.0008) +[2023-10-08 17:40:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 98566144. Throughput: 0: 1731.7, 1: 1696.3. Samples: 24650312. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:40:33,804][19739] Avg episode reward: [(0, '691.480'), (1, '834.640')] +[2023-10-08 17:40:33,987][21194] Updated weights for policy 1, policy_version 47940 (0.0010) +[2023-10-08 17:40:34,354][21194] Updated weights for policy 1, policy_version 47950 (0.0009) +[2023-10-08 17:40:34,723][21194] Updated weights for policy 1, policy_version 47960 (0.0009) +[2023-10-08 17:40:36,112][21195] Updated weights for policy 0, policy_version 48330 (0.0007) +[2023-10-08 17:40:36,486][21195] Updated weights for policy 0, policy_version 48340 (0.0008) +[2023-10-08 17:40:36,856][21195] Updated weights for policy 0, policy_version 48350 (0.0008) +[2023-10-08 17:40:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 98631680. Throughput: 0: 1718.2, 1: 1727.6. Samples: 24665864. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:40:38,803][19739] Avg episode reward: [(0, '691.340'), (1, '834.640')] +[2023-10-08 17:40:38,841][21194] Updated weights for policy 1, policy_version 47970 (0.0008) +[2023-10-08 17:40:39,206][21194] Updated weights for policy 1, policy_version 47980 (0.0009) +[2023-10-08 17:40:39,565][21194] Updated weights for policy 1, policy_version 47990 (0.0010) +[2023-10-08 17:40:39,937][21194] Updated weights for policy 1, policy_version 48000 (0.0010) +[2023-10-08 17:40:40,632][21195] Updated weights for policy 0, policy_version 48360 (0.0009) +[2023-10-08 17:40:40,995][21195] Updated weights for policy 0, policy_version 48370 (0.0010) +[2023-10-08 17:40:41,370][21195] Updated weights for policy 0, policy_version 48380 (0.0009) +[2023-10-08 17:40:43,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 98697216. Throughput: 0: 1716.2, 1: 1725.2. Samples: 24686976. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:40:43,803][19739] Avg episode reward: [(0, '691.340'), (1, '834.430')] +[2023-10-08 17:40:44,008][21194] Updated weights for policy 1, policy_version 48010 (0.0007) +[2023-10-08 17:40:44,372][21194] Updated weights for policy 1, policy_version 48020 (0.0007) +[2023-10-08 17:40:44,736][21194] Updated weights for policy 1, policy_version 48030 (0.0009) +[2023-10-08 17:40:45,364][21195] Updated weights for policy 0, policy_version 48390 (0.0009) +[2023-10-08 17:40:45,729][21195] Updated weights for policy 0, policy_version 48400 (0.0008) +[2023-10-08 17:40:46,106][21195] Updated weights for policy 0, policy_version 48410 (0.0008) +[2023-10-08 17:40:48,734][21194] Updated weights for policy 1, policy_version 48040 (0.0008) +[2023-10-08 17:40:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 98762752. Throughput: 0: 1739.6, 1: 1708.8. Samples: 24702144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:40:48,803][19739] Avg episode reward: [(0, '691.340'), (1, '834.430')] +[2023-10-08 17:40:49,103][21194] Updated weights for policy 1, policy_version 48050 (0.0010) +[2023-10-08 17:40:49,471][21194] Updated weights for policy 1, policy_version 48060 (0.0009) +[2023-10-08 17:40:50,055][21195] Updated weights for policy 0, policy_version 48420 (0.0008) +[2023-10-08 17:40:50,426][21195] Updated weights for policy 0, policy_version 48430 (0.0010) +[2023-10-08 17:40:50,787][21195] Updated weights for policy 0, policy_version 48440 (0.0010) +[2023-10-08 17:40:53,433][21194] Updated weights for policy 1, policy_version 48070 (0.0010) +[2023-10-08 17:40:53,800][21194] Updated weights for policy 1, policy_version 48080 (0.0008) +[2023-10-08 17:40:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 98828288. Throughput: 0: 1711.2, 1: 1730.8. Samples: 24717744. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:40:53,803][19739] Avg episode reward: [(0, '677.780'), (1, '834.430')] +[2023-10-08 17:40:54,173][21194] Updated weights for policy 1, policy_version 48090 (0.0009) +[2023-10-08 17:40:54,748][21195] Updated weights for policy 0, policy_version 48450 (0.0007) +[2023-10-08 17:40:55,111][21195] Updated weights for policy 0, policy_version 48460 (0.0008) +[2023-10-08 17:40:55,489][21195] Updated weights for policy 0, policy_version 48470 (0.0008) +[2023-10-08 17:40:55,856][21195] Updated weights for policy 0, policy_version 48480 (0.0009) +[2023-10-08 17:40:58,013][21194] Updated weights for policy 1, policy_version 48100 (0.0008) +[2023-10-08 17:40:58,390][21194] Updated weights for policy 1, policy_version 48110 (0.0009) +[2023-10-08 17:40:58,755][21194] Updated weights for policy 1, policy_version 48120 (0.0008) +[2023-10-08 17:40:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 98893824. Throughput: 0: 1730.9, 1: 1728.9. Samples: 24739276. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:40:58,803][19739] Avg episode reward: [(0, '677.780'), (1, '834.430')] +[2023-10-08 17:40:59,599][21195] Updated weights for policy 0, policy_version 48490 (0.0007) +[2023-10-08 17:40:59,974][21195] Updated weights for policy 0, policy_version 48500 (0.0007) +[2023-10-08 17:41:00,331][21195] Updated weights for policy 0, policy_version 48510 (0.0007) +[2023-10-08 17:41:02,829][21194] Updated weights for policy 1, policy_version 48130 (0.0009) +[2023-10-08 17:41:03,233][21194] Updated weights for policy 1, policy_version 48140 (0.0007) +[2023-10-08 17:41:03,592][21194] Updated weights for policy 1, policy_version 48150 (0.0007) +[2023-10-08 17:41:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 98959360. Throughput: 0: 1743.0, 1: 1735.5. Samples: 24754944. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:41:03,804][19739] Avg episode reward: [(0, '677.780'), (1, '835.690')] +[2023-10-08 17:41:03,962][21194] Updated weights for policy 1, policy_version 48160 (0.0011) +[2023-10-08 17:41:04,241][21195] Updated weights for policy 0, policy_version 48520 (0.0009) +[2023-10-08 17:41:04,618][21195] Updated weights for policy 0, policy_version 48530 (0.0009) +[2023-10-08 17:41:04,985][21195] Updated weights for policy 0, policy_version 48540 (0.0008) +[2023-10-08 17:41:07,837][21194] Updated weights for policy 1, policy_version 48170 (0.0008) +[2023-10-08 17:41:08,198][21194] Updated weights for policy 1, policy_version 48180 (0.0007) +[2023-10-08 17:41:08,563][21194] Updated weights for policy 1, policy_version 48190 (0.0007) +[2023-10-08 17:41:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 99057664. Throughput: 0: 1718.6, 1: 1733.4. Samples: 24769790. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:41:08,803][19739] Avg episode reward: [(0, '677.780'), (1, '850.670')] +[2023-10-08 17:41:09,122][21195] Updated weights for policy 0, policy_version 48550 (0.0009) +[2023-10-08 17:41:09,499][21195] Updated weights for policy 0, policy_version 48560 (0.0011) +[2023-10-08 17:41:09,871][21195] Updated weights for policy 0, policy_version 48570 (0.0008) +[2023-10-08 17:41:12,428][21194] Updated weights for policy 1, policy_version 48200 (0.0008) +[2023-10-08 17:41:12,784][21194] Updated weights for policy 1, policy_version 48210 (0.0009) +[2023-10-08 17:41:13,151][21194] Updated weights for policy 1, policy_version 48220 (0.0011) +[2023-10-08 17:41:13,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 99123200. Throughput: 0: 1733.7, 1: 1718.1. Samples: 24790344. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 17:41:13,803][19739] Avg episode reward: [(0, '677.780'), (1, '854.600')] +[2023-10-08 17:41:13,809][21195] Updated weights for policy 0, policy_version 48580 (0.0010) +[2023-10-08 17:41:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000048224_49381376.pth... +[2023-10-08 17:41:13,845][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000046592_47710208.pth +[2023-10-08 17:41:13,849][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000048224_49381376.pth +[2023-10-08 17:41:14,178][21195] Updated weights for policy 0, policy_version 48590 (0.0008) +[2023-10-08 17:41:14,546][21195] Updated weights for policy 0, policy_version 48600 (0.0007) +[2023-10-08 17:41:14,832][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000048608_49774592.pth... +[2023-10-08 17:41:14,861][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000046976_48103424.pth +[2023-10-08 17:41:14,864][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000048608_49774592.pth +[2023-10-08 17:41:17,202][21194] Updated weights for policy 1, policy_version 48230 (0.0010) +[2023-10-08 17:41:17,565][21194] Updated weights for policy 1, policy_version 48240 (0.0011) +[2023-10-08 17:41:17,939][21194] Updated weights for policy 1, policy_version 48250 (0.0010) +[2023-10-08 17:41:18,663][21195] Updated weights for policy 0, policy_version 48610 (0.0008) +[2023-10-08 17:41:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 99188736. Throughput: 0: 1734.1, 1: 1737.2. Samples: 24806518. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 17:41:18,803][19739] Avg episode reward: [(0, '677.780'), (1, '854.600')] +[2023-10-08 17:41:19,026][21195] Updated weights for policy 0, policy_version 48620 (0.0008) +[2023-10-08 17:41:19,394][21195] Updated weights for policy 0, policy_version 48630 (0.0009) +[2023-10-08 17:41:19,769][21195] Updated weights for policy 0, policy_version 48640 (0.0009) +[2023-10-08 17:41:21,891][21194] Updated weights for policy 1, policy_version 48260 (0.0008) +[2023-10-08 17:41:22,255][21194] Updated weights for policy 1, policy_version 48270 (0.0010) +[2023-10-08 17:41:22,627][21194] Updated weights for policy 1, policy_version 48280 (0.0010) +[2023-10-08 17:41:23,696][21195] Updated weights for policy 0, policy_version 48650 (0.0009) +[2023-10-08 17:41:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 99254272. Throughput: 0: 1736.3, 1: 1726.4. Samples: 24821684. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 17:41:23,803][19739] Avg episode reward: [(0, '678.010'), (1, '854.600')] +[2023-10-08 17:41:24,070][21195] Updated weights for policy 0, policy_version 48660 (0.0010) +[2023-10-08 17:41:24,436][21195] Updated weights for policy 0, policy_version 48670 (0.0010) +[2023-10-08 17:41:26,345][21194] Updated weights for policy 1, policy_version 48290 (0.0009) +[2023-10-08 17:41:26,714][21194] Updated weights for policy 1, policy_version 48300 (0.0008) +[2023-10-08 17:41:27,079][21194] Updated weights for policy 1, policy_version 48310 (0.0007) +[2023-10-08 17:41:27,449][21194] Updated weights for policy 1, policy_version 48320 (0.0007) +[2023-10-08 17:41:28,121][21195] Updated weights for policy 0, policy_version 48680 (0.0009) +[2023-10-08 17:41:28,486][21195] Updated weights for policy 0, policy_version 48690 (0.0007) +[2023-10-08 17:41:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 99319808. Throughput: 0: 1746.0, 1: 1708.4. Samples: 24842426. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 17:41:28,803][19739] Avg episode reward: [(0, '692.300'), (1, '854.600')] +[2023-10-08 17:41:28,847][21195] Updated weights for policy 0, policy_version 48700 (0.0009) +[2023-10-08 17:41:31,342][21194] Updated weights for policy 1, policy_version 48330 (0.0009) +[2023-10-08 17:41:31,716][21194] Updated weights for policy 1, policy_version 48340 (0.0009) +[2023-10-08 17:41:32,074][21194] Updated weights for policy 1, policy_version 48350 (0.0009) +[2023-10-08 17:41:32,697][21195] Updated weights for policy 0, policy_version 48710 (0.0010) +[2023-10-08 17:41:33,061][21195] Updated weights for policy 0, policy_version 48720 (0.0010) +[2023-10-08 17:41:33,429][21195] Updated weights for policy 0, policy_version 48730 (0.0007) +[2023-10-08 17:41:33,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 99418112. Throughput: 0: 1718.7, 1: 1737.3. Samples: 24857662. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 17:41:33,804][19739] Avg episode reward: [(0, '692.300'), (1, '854.600')] +[2023-10-08 17:41:36,141][21194] Updated weights for policy 1, policy_version 48360 (0.0007) +[2023-10-08 17:41:36,511][21194] Updated weights for policy 1, policy_version 48370 (0.0008) +[2023-10-08 17:41:36,879][21194] Updated weights for policy 1, policy_version 48380 (0.0007) +[2023-10-08 17:41:37,292][21195] Updated weights for policy 0, policy_version 48740 (0.0008) +[2023-10-08 17:41:37,664][21195] Updated weights for policy 0, policy_version 48750 (0.0010) +[2023-10-08 17:41:38,033][21195] Updated weights for policy 0, policy_version 48760 (0.0009) +[2023-10-08 17:41:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 99483648. Throughput: 0: 1751.2, 1: 1705.0. Samples: 24873274. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 17:41:38,804][19739] Avg episode reward: [(0, '707.170'), (1, '855.210')] +[2023-10-08 17:41:40,769][21194] Updated weights for policy 1, policy_version 48390 (0.0009) +[2023-10-08 17:41:41,137][21194] Updated weights for policy 1, policy_version 48400 (0.0010) +[2023-10-08 17:41:41,507][21194] Updated weights for policy 1, policy_version 48410 (0.0007) +[2023-10-08 17:41:42,003][21195] Updated weights for policy 0, policy_version 48770 (0.0009) +[2023-10-08 17:41:42,364][21195] Updated weights for policy 0, policy_version 48780 (0.0007) +[2023-10-08 17:41:42,731][21195] Updated weights for policy 0, policy_version 48790 (0.0007) +[2023-10-08 17:41:43,109][21195] Updated weights for policy 0, policy_version 48800 (0.0007) +[2023-10-08 17:41:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 99549184. Throughput: 0: 1730.0, 1: 1704.0. Samples: 24893804. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:41:43,804][19739] Avg episode reward: [(0, '707.170'), (1, '869.400')] +[2023-10-08 17:41:45,579][21194] Updated weights for policy 1, policy_version 48420 (0.0009) +[2023-10-08 17:41:45,944][21194] Updated weights for policy 1, policy_version 48430 (0.0010) +[2023-10-08 17:41:46,296][21194] Updated weights for policy 1, policy_version 48440 (0.0008) +[2023-10-08 17:41:47,051][21195] Updated weights for policy 0, policy_version 48810 (0.0008) +[2023-10-08 17:41:47,426][21195] Updated weights for policy 0, policy_version 48820 (0.0010) +[2023-10-08 17:41:47,807][21195] Updated weights for policy 0, policy_version 48830 (0.0009) +[2023-10-08 17:41:48,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 99614720. Throughput: 0: 1717.6, 1: 1711.6. Samples: 24909256. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:41:48,803][19739] Avg episode reward: [(0, '707.170'), (1, '879.420')] +[2023-10-08 17:41:50,392][21194] Updated weights for policy 1, policy_version 48450 (0.0007) +[2023-10-08 17:41:50,759][21194] Updated weights for policy 1, policy_version 48460 (0.0007) +[2023-10-08 17:41:51,127][21194] Updated weights for policy 1, policy_version 48470 (0.0007) +[2023-10-08 17:41:51,489][21194] Updated weights for policy 1, policy_version 48480 (0.0008) +[2023-10-08 17:41:51,843][21195] Updated weights for policy 0, policy_version 48840 (0.0008) +[2023-10-08 17:41:52,209][21195] Updated weights for policy 0, policy_version 48850 (0.0008) +[2023-10-08 17:41:52,573][21195] Updated weights for policy 0, policy_version 48860 (0.0008) +[2023-10-08 17:41:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 99680256. Throughput: 0: 1744.0, 1: 1701.2. Samples: 24924828. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:41:53,804][19739] Avg episode reward: [(0, '722.250'), (1, '879.420')] +[2023-10-08 17:41:55,502][21194] Updated weights for policy 1, policy_version 48490 (0.0009) +[2023-10-08 17:41:55,861][21194] Updated weights for policy 1, policy_version 48500 (0.0007) +[2023-10-08 17:41:56,226][21194] Updated weights for policy 1, policy_version 48510 (0.0007) +[2023-10-08 17:41:56,373][21195] Updated weights for policy 0, policy_version 48870 (0.0009) +[2023-10-08 17:41:56,746][21195] Updated weights for policy 0, policy_version 48880 (0.0008) +[2023-10-08 17:41:57,116][21195] Updated weights for policy 0, policy_version 48890 (0.0009) +[2023-10-08 17:41:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 99745792. Throughput: 0: 1724.3, 1: 1719.9. Samples: 24945330. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:41:58,803][19739] Avg episode reward: [(0, '722.250'), (1, '879.420')] +[2023-10-08 17:42:00,101][21194] Updated weights for policy 1, policy_version 48520 (0.0009) +[2023-10-08 17:42:00,464][21194] Updated weights for policy 1, policy_version 48530 (0.0008) +[2023-10-08 17:42:00,835][21194] Updated weights for policy 1, policy_version 48540 (0.0009) +[2023-10-08 17:42:01,140][21195] Updated weights for policy 0, policy_version 48900 (0.0008) +[2023-10-08 17:42:01,502][21195] Updated weights for policy 0, policy_version 48910 (0.0011) +[2023-10-08 17:42:01,865][21195] Updated weights for policy 0, policy_version 48920 (0.0011) +[2023-10-08 17:42:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 99811328. Throughput: 0: 1724.7, 1: 1700.8. Samples: 24960666. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:42:03,803][19739] Avg episode reward: [(0, '722.250'), (1, '879.420')] +[2023-10-08 17:42:04,882][21194] Updated weights for policy 1, policy_version 48550 (0.0008) +[2023-10-08 17:42:05,251][21194] Updated weights for policy 1, policy_version 48560 (0.0011) +[2023-10-08 17:42:05,614][21194] Updated weights for policy 1, policy_version 48570 (0.0011) +[2023-10-08 17:42:05,825][21195] Updated weights for policy 0, policy_version 48930 (0.0009) +[2023-10-08 17:42:06,197][21195] Updated weights for policy 0, policy_version 48940 (0.0010) +[2023-10-08 17:42:06,566][21195] Updated weights for policy 0, policy_version 48950 (0.0008) +[2023-10-08 17:42:06,942][21195] Updated weights for policy 0, policy_version 48960 (0.0007) +[2023-10-08 17:42:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 99876864. Throughput: 0: 1730.3, 1: 1705.7. Samples: 24976306. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:42:08,803][19739] Avg episode reward: [(0, '723.270'), (1, '871.050')] +[2023-10-08 17:42:09,644][21194] Updated weights for policy 1, policy_version 48580 (0.0009) +[2023-10-08 17:42:10,004][21194] Updated weights for policy 1, policy_version 48590 (0.0009) +[2023-10-08 17:42:10,372][21194] Updated weights for policy 1, policy_version 48600 (0.0008) +[2023-10-08 17:42:10,919][21195] Updated weights for policy 0, policy_version 48970 (0.0007) +[2023-10-08 17:42:11,287][21195] Updated weights for policy 0, policy_version 48980 (0.0007) +[2023-10-08 17:42:11,664][21195] Updated weights for policy 0, policy_version 48990 (0.0007) +[2023-10-08 17:42:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 99942400. Throughput: 0: 1715.7, 1: 1725.6. Samples: 24997288. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 17:42:13,803][19739] Avg episode reward: [(0, '723.270'), (1, '840.800')] +[2023-10-08 17:42:14,427][21194] Updated weights for policy 1, policy_version 48610 (0.0008) +[2023-10-08 17:42:14,797][21194] Updated weights for policy 1, policy_version 48620 (0.0010) +[2023-10-08 17:42:15,155][21194] Updated weights for policy 1, policy_version 48630 (0.0007) +[2023-10-08 17:42:15,447][21195] Updated weights for policy 0, policy_version 49000 (0.0009) +[2023-10-08 17:42:15,524][21194] Updated weights for policy 1, policy_version 48640 (0.0009) +[2023-10-08 17:42:15,811][21195] Updated weights for policy 0, policy_version 49010 (0.0009) +[2023-10-08 17:42:16,183][21195] Updated weights for policy 0, policy_version 49020 (0.0009) +[2023-10-08 17:42:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 100007936. Throughput: 0: 1748.7, 1: 1696.4. Samples: 25012690. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:18,803][19739] Avg episode reward: [(0, '723.270'), (1, '835.150')] +[2023-10-08 17:42:19,342][21194] Updated weights for policy 1, policy_version 48650 (0.0009) +[2023-10-08 17:42:19,709][21194] Updated weights for policy 1, policy_version 48660 (0.0009) +[2023-10-08 17:42:20,018][21195] Updated weights for policy 0, policy_version 49030 (0.0007) +[2023-10-08 17:42:20,072][21194] Updated weights for policy 1, policy_version 48670 (0.0007) +[2023-10-08 17:42:20,379][21195] Updated weights for policy 0, policy_version 49040 (0.0009) +[2023-10-08 17:42:20,750][21195] Updated weights for policy 0, policy_version 49050 (0.0010) +[2023-10-08 17:42:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 100073472. Throughput: 0: 1712.9, 1: 1727.1. Samples: 25028070. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:23,803][19739] Avg episode reward: [(0, '717.200'), (1, '835.330')] +[2023-10-08 17:42:23,838][21194] Updated weights for policy 1, policy_version 48680 (0.0008) +[2023-10-08 17:42:24,208][21194] Updated weights for policy 1, policy_version 48690 (0.0010) +[2023-10-08 17:42:24,575][21194] Updated weights for policy 1, policy_version 48700 (0.0009) +[2023-10-08 17:42:24,739][21195] Updated weights for policy 0, policy_version 49060 (0.0010) +[2023-10-08 17:42:25,107][21195] Updated weights for policy 0, policy_version 49070 (0.0009) +[2023-10-08 17:42:25,470][21195] Updated weights for policy 0, policy_version 49080 (0.0008) +[2023-10-08 17:42:28,517][21194] Updated weights for policy 1, policy_version 48710 (0.0008) +[2023-10-08 17:42:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 100139008. Throughput: 0: 1737.4, 1: 1730.4. Samples: 25049856. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:28,803][19739] Avg episode reward: [(0, '717.200'), (1, '835.270')] +[2023-10-08 17:42:28,878][21194] Updated weights for policy 1, policy_version 48720 (0.0007) +[2023-10-08 17:42:29,255][21194] Updated weights for policy 1, policy_version 48730 (0.0009) +[2023-10-08 17:42:29,385][21195] Updated weights for policy 0, policy_version 49090 (0.0008) +[2023-10-08 17:42:29,750][21195] Updated weights for policy 0, policy_version 49100 (0.0008) +[2023-10-08 17:42:30,113][21195] Updated weights for policy 0, policy_version 49110 (0.0008) +[2023-10-08 17:42:30,480][21195] Updated weights for policy 0, policy_version 49120 (0.0008) +[2023-10-08 17:42:33,081][21194] Updated weights for policy 1, policy_version 48740 (0.0007) +[2023-10-08 17:42:33,453][21194] Updated weights for policy 1, policy_version 48750 (0.0007) +[2023-10-08 17:42:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 100204544. Throughput: 0: 1748.3, 1: 1721.5. Samples: 25065396. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:33,804][19739] Avg episode reward: [(0, '717.200'), (1, '849.690')] +[2023-10-08 17:42:33,813][21194] Updated weights for policy 1, policy_version 48760 (0.0011) +[2023-10-08 17:42:34,398][21195] Updated weights for policy 0, policy_version 49130 (0.0007) +[2023-10-08 17:42:34,773][21195] Updated weights for policy 0, policy_version 49140 (0.0007) +[2023-10-08 17:42:35,146][21195] Updated weights for policy 0, policy_version 49150 (0.0007) +[2023-10-08 17:42:37,633][21194] Updated weights for policy 1, policy_version 48770 (0.0007) +[2023-10-08 17:42:37,996][21194] Updated weights for policy 1, policy_version 48780 (0.0008) +[2023-10-08 17:42:38,354][21194] Updated weights for policy 1, policy_version 48790 (0.0010) +[2023-10-08 17:42:38,725][21194] Updated weights for policy 1, policy_version 48800 (0.0010) +[2023-10-08 17:42:38,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 100302848. Throughput: 0: 1725.9, 1: 1741.5. Samples: 25080858. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:38,803][19739] Avg episode reward: [(0, '717.200'), (1, '849.530')] +[2023-10-08 17:42:39,022][21195] Updated weights for policy 0, policy_version 49160 (0.0009) +[2023-10-08 17:42:39,397][21195] Updated weights for policy 0, policy_version 49170 (0.0009) +[2023-10-08 17:42:39,772][21195] Updated weights for policy 0, policy_version 49180 (0.0008) +[2023-10-08 17:42:42,773][21194] Updated weights for policy 1, policy_version 48810 (0.0009) +[2023-10-08 17:42:43,129][21194] Updated weights for policy 1, policy_version 48820 (0.0007) +[2023-10-08 17:42:43,501][21194] Updated weights for policy 1, policy_version 48830 (0.0007) +[2023-10-08 17:42:43,746][21195] Updated weights for policy 0, policy_version 49190 (0.0008) +[2023-10-08 17:42:43,803][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 100368384. Throughput: 0: 1749.1, 1: 1722.0. Samples: 25101530. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:43,803][19739] Avg episode reward: [(0, '717.200'), (1, '849.530')] +[2023-10-08 17:42:44,114][21195] Updated weights for policy 0, policy_version 49200 (0.0008) +[2023-10-08 17:42:44,477][21195] Updated weights for policy 0, policy_version 49210 (0.0010) +[2023-10-08 17:42:47,555][21194] Updated weights for policy 1, policy_version 48840 (0.0008) +[2023-10-08 17:42:47,926][21194] Updated weights for policy 1, policy_version 48850 (0.0008) +[2023-10-08 17:42:48,284][21194] Updated weights for policy 1, policy_version 48860 (0.0009) +[2023-10-08 17:42:48,357][21195] Updated weights for policy 0, policy_version 49220 (0.0009) +[2023-10-08 17:42:48,726][21195] Updated weights for policy 0, policy_version 49230 (0.0008) +[2023-10-08 17:42:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 100433920. Throughput: 0: 1741.1, 1: 1737.2. Samples: 25117188. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 17:42:48,803][19739] Avg episode reward: [(0, '686.900'), (1, '849.530')] +[2023-10-08 17:42:49,090][21195] Updated weights for policy 0, policy_version 49240 (0.0008) +[2023-10-08 17:42:52,389][21194] Updated weights for policy 1, policy_version 48870 (0.0008) +[2023-10-08 17:42:52,750][21194] Updated weights for policy 1, policy_version 48880 (0.0007) +[2023-10-08 17:42:52,934][21195] Updated weights for policy 0, policy_version 49250 (0.0008) +[2023-10-08 17:42:53,112][21194] Updated weights for policy 1, policy_version 48890 (0.0008) +[2023-10-08 17:42:53,310][21195] Updated weights for policy 0, policy_version 49260 (0.0008) +[2023-10-08 17:42:53,685][21195] Updated weights for policy 0, policy_version 49270 (0.0009) +[2023-10-08 17:42:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 100499456. Throughput: 0: 1745.6, 1: 1736.9. Samples: 25133020. Policy #0 lag: (min: 27.0, avg: 35.3, max: 59.0) +[2023-10-08 17:42:53,804][19739] Avg episode reward: [(0, '672.510'), (1, '849.530')] +[2023-10-08 17:42:54,054][21195] Updated weights for policy 0, policy_version 49280 (0.0008) +[2023-10-08 17:42:57,007][21194] Updated weights for policy 1, policy_version 48900 (0.0009) +[2023-10-08 17:42:57,377][21194] Updated weights for policy 1, policy_version 48910 (0.0009) +[2023-10-08 17:42:57,738][21194] Updated weights for policy 1, policy_version 48920 (0.0008) +[2023-10-08 17:42:58,094][21195] Updated weights for policy 0, policy_version 49290 (0.0008) +[2023-10-08 17:42:58,468][21195] Updated weights for policy 0, policy_version 49300 (0.0007) +[2023-10-08 17:42:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 100564992. Throughput: 0: 1749.2, 1: 1708.9. Samples: 25152904. Policy #0 lag: (min: 27.0, avg: 35.3, max: 59.0) +[2023-10-08 17:42:58,803][19739] Avg episode reward: [(0, '672.510'), (1, '849.530')] +[2023-10-08 17:42:58,840][21195] Updated weights for policy 0, policy_version 49310 (0.0008) +[2023-10-08 17:43:01,724][21194] Updated weights for policy 1, policy_version 48930 (0.0007) +[2023-10-08 17:43:02,079][21194] Updated weights for policy 1, policy_version 48940 (0.0007) +[2023-10-08 17:43:02,439][21194] Updated weights for policy 1, policy_version 48950 (0.0008) +[2023-10-08 17:43:02,708][21195] Updated weights for policy 0, policy_version 49320 (0.0007) +[2023-10-08 17:43:02,795][21194] Updated weights for policy 1, policy_version 48960 (0.0008) +[2023-10-08 17:43:03,075][21195] Updated weights for policy 0, policy_version 49330 (0.0009) +[2023-10-08 17:43:03,450][21195] Updated weights for policy 0, policy_version 49340 (0.0009) +[2023-10-08 17:43:03,802][19739] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 100663296. Throughput: 0: 1717.6, 1: 1740.7. Samples: 25168310. Policy #0 lag: (min: 27.0, avg: 35.3, max: 59.0) +[2023-10-08 17:43:03,803][19739] Avg episode reward: [(0, '685.810'), (1, '849.530')] +[2023-10-08 17:43:06,946][21194] Updated weights for policy 1, policy_version 48970 (0.0009) +[2023-10-08 17:43:07,310][21194] Updated weights for policy 1, policy_version 48980 (0.0008) +[2023-10-08 17:43:07,339][21195] Updated weights for policy 0, policy_version 49350 (0.0010) +[2023-10-08 17:43:07,671][21194] Updated weights for policy 1, policy_version 48990 (0.0009) +[2023-10-08 17:43:07,708][21195] Updated weights for policy 0, policy_version 49360 (0.0009) +[2023-10-08 17:43:08,083][21195] Updated weights for policy 0, policy_version 49370 (0.0010) +[2023-10-08 17:43:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 100728832. Throughput: 0: 1752.4, 1: 1726.1. Samples: 25184604. Policy #0 lag: (min: 27.0, avg: 35.3, max: 59.0) +[2023-10-08 17:43:08,803][19739] Avg episode reward: [(0, '685.100'), (1, '863.310')] +[2023-10-08 17:43:11,495][21194] Updated weights for policy 1, policy_version 49000 (0.0008) +[2023-10-08 17:43:11,877][21194] Updated weights for policy 1, policy_version 49010 (0.0009) +[2023-10-08 17:43:12,067][21195] Updated weights for policy 0, policy_version 49380 (0.0010) +[2023-10-08 17:43:12,245][21194] Updated weights for policy 1, policy_version 49020 (0.0009) +[2023-10-08 17:43:12,444][21195] Updated weights for policy 0, policy_version 49390 (0.0009) +[2023-10-08 17:43:12,814][21195] Updated weights for policy 0, policy_version 49400 (0.0008) +[2023-10-08 17:43:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 100794368. Throughput: 0: 1722.4, 1: 1704.7. Samples: 25204078. Policy #0 lag: (min: 27.0, avg: 35.3, max: 59.0) +[2023-10-08 17:43:13,804][19739] Avg episode reward: [(0, '685.100'), (1, '863.310')] +[2023-10-08 17:43:13,818][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000049408_50593792.pth... +[2023-10-08 17:43:13,818][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000049024_50200576.pth... +[2023-10-08 17:43:13,854][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000047424_48562176.pth +[2023-10-08 17:43:13,862][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000047776_48922624.pth +[2023-10-08 17:43:16,199][21194] Updated weights for policy 1, policy_version 49030 (0.0007) +[2023-10-08 17:43:16,563][21194] Updated weights for policy 1, policy_version 49040 (0.0007) +[2023-10-08 17:43:16,822][21195] Updated weights for policy 0, policy_version 49410 (0.0007) +[2023-10-08 17:43:16,924][21194] Updated weights for policy 1, policy_version 49050 (0.0009) +[2023-10-08 17:43:17,184][21195] Updated weights for policy 0, policy_version 49420 (0.0007) +[2023-10-08 17:43:17,558][21195] Updated weights for policy 0, policy_version 49430 (0.0008) +[2023-10-08 17:43:17,926][21195] Updated weights for policy 0, policy_version 49440 (0.0007) +[2023-10-08 17:43:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 100859904. Throughput: 0: 1709.5, 1: 1731.3. Samples: 25220232. Policy #0 lag: (min: 27.0, avg: 35.3, max: 59.0) +[2023-10-08 17:43:18,803][19739] Avg episode reward: [(0, '685.100'), (1, '866.340')] +[2023-10-08 17:43:21,005][21194] Updated weights for policy 1, policy_version 49060 (0.0008) +[2023-10-08 17:43:21,377][21194] Updated weights for policy 1, policy_version 49070 (0.0008) +[2023-10-08 17:43:21,734][21194] Updated weights for policy 1, policy_version 49080 (0.0009) +[2023-10-08 17:43:21,920][21195] Updated weights for policy 0, policy_version 49450 (0.0009) +[2023-10-08 17:43:22,290][21195] Updated weights for policy 0, policy_version 49460 (0.0008) +[2023-10-08 17:43:22,659][21195] Updated weights for policy 0, policy_version 49470 (0.0008) +[2023-10-08 17:43:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 100925440. Throughput: 0: 1736.0, 1: 1698.2. Samples: 25235398. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:23,803][19739] Avg episode reward: [(0, '677.070'), (1, '866.340')] +[2023-10-08 17:43:25,761][21194] Updated weights for policy 1, policy_version 49090 (0.0008) +[2023-10-08 17:43:26,125][21194] Updated weights for policy 1, policy_version 49100 (0.0010) +[2023-10-08 17:43:26,337][21195] Updated weights for policy 0, policy_version 49480 (0.0008) +[2023-10-08 17:43:26,490][21194] Updated weights for policy 1, policy_version 49110 (0.0010) +[2023-10-08 17:43:26,701][21195] Updated weights for policy 0, policy_version 49490 (0.0007) +[2023-10-08 17:43:26,852][21194] Updated weights for policy 1, policy_version 49120 (0.0008) +[2023-10-08 17:43:27,075][21195] Updated weights for policy 0, policy_version 49500 (0.0007) +[2023-10-08 17:43:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 100990976. Throughput: 0: 1712.1, 1: 1711.6. Samples: 25255598. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:28,804][19739] Avg episode reward: [(0, '693.010'), (1, '866.340')] +[2023-10-08 17:43:30,946][21194] Updated weights for policy 1, policy_version 49130 (0.0008) +[2023-10-08 17:43:31,025][21195] Updated weights for policy 0, policy_version 49510 (0.0007) +[2023-10-08 17:43:31,305][21194] Updated weights for policy 1, policy_version 49140 (0.0009) +[2023-10-08 17:43:31,385][21195] Updated weights for policy 0, policy_version 49520 (0.0008) +[2023-10-08 17:43:31,673][21194] Updated weights for policy 1, policy_version 49150 (0.0009) +[2023-10-08 17:43:31,751][21195] Updated weights for policy 0, policy_version 49530 (0.0007) +[2023-10-08 17:43:33,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 101056512. Throughput: 0: 1723.8, 1: 1708.7. Samples: 25271650. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:33,803][19739] Avg episode reward: [(0, '699.010'), (1, '852.330')] +[2023-10-08 17:43:35,485][21194] Updated weights for policy 1, policy_version 49160 (0.0010) +[2023-10-08 17:43:35,498][21195] Updated weights for policy 0, policy_version 49540 (0.0008) +[2023-10-08 17:43:35,852][21194] Updated weights for policy 1, policy_version 49170 (0.0008) +[2023-10-08 17:43:35,872][21195] Updated weights for policy 0, policy_version 49550 (0.0008) +[2023-10-08 17:43:36,221][21194] Updated weights for policy 1, policy_version 49180 (0.0008) +[2023-10-08 17:43:36,240][21195] Updated weights for policy 0, policy_version 49560 (0.0008) +[2023-10-08 17:43:38,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 101122048. Throughput: 0: 1712.2, 1: 1693.3. Samples: 25286268. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:38,803][19739] Avg episode reward: [(0, '699.010'), (1, '852.330')] +[2023-10-08 17:43:40,134][21195] Updated weights for policy 0, policy_version 49570 (0.0008) +[2023-10-08 17:43:40,176][21194] Updated weights for policy 1, policy_version 49190 (0.0007) +[2023-10-08 17:43:40,498][21195] Updated weights for policy 0, policy_version 49580 (0.0009) +[2023-10-08 17:43:40,535][21194] Updated weights for policy 1, policy_version 49200 (0.0009) +[2023-10-08 17:43:40,867][21195] Updated weights for policy 0, policy_version 49590 (0.0008) +[2023-10-08 17:43:40,911][21194] Updated weights for policy 1, policy_version 49210 (0.0008) +[2023-10-08 17:43:41,244][21195] Updated weights for policy 0, policy_version 49600 (0.0008) +[2023-10-08 17:43:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 101187584. Throughput: 0: 1718.6, 1: 1724.3. Samples: 25307834. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:43,803][19739] Avg episode reward: [(0, '699.010'), (1, '862.740')] +[2023-10-08 17:43:44,754][21194] Updated weights for policy 1, policy_version 49220 (0.0010) +[2023-10-08 17:43:45,110][21194] Updated weights for policy 1, policy_version 49230 (0.0009) +[2023-10-08 17:43:45,211][21195] Updated weights for policy 0, policy_version 49610 (0.0008) +[2023-10-08 17:43:45,480][21194] Updated weights for policy 1, policy_version 49240 (0.0009) +[2023-10-08 17:43:45,574][21195] Updated weights for policy 0, policy_version 49620 (0.0010) +[2023-10-08 17:43:45,939][21195] Updated weights for policy 0, policy_version 49630 (0.0009) +[2023-10-08 17:43:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 101253120. Throughput: 0: 1742.7, 1: 1690.6. Samples: 25322808. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:48,803][19739] Avg episode reward: [(0, '699.010'), (1, '862.740')] +[2023-10-08 17:43:49,621][21194] Updated weights for policy 1, policy_version 49250 (0.0009) +[2023-10-08 17:43:49,987][21194] Updated weights for policy 1, policy_version 49260 (0.0009) +[2023-10-08 17:43:50,008][21195] Updated weights for policy 0, policy_version 49640 (0.0010) +[2023-10-08 17:43:50,350][21194] Updated weights for policy 1, policy_version 49270 (0.0008) +[2023-10-08 17:43:50,374][21195] Updated weights for policy 0, policy_version 49650 (0.0009) +[2023-10-08 17:43:50,717][21194] Updated weights for policy 1, policy_version 49280 (0.0009) +[2023-10-08 17:43:50,744][21195] Updated weights for policy 0, policy_version 49660 (0.0008) +[2023-10-08 17:43:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 101318656. Throughput: 0: 1706.5, 1: 1698.0. Samples: 25337808. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 17:43:53,803][19739] Avg episode reward: [(0, '685.230'), (1, '862.740')] +[2023-10-08 17:43:54,808][21195] Updated weights for policy 0, policy_version 49670 (0.0007) +[2023-10-08 17:43:54,850][21194] Updated weights for policy 1, policy_version 49290 (0.0008) +[2023-10-08 17:43:55,176][21195] Updated weights for policy 0, policy_version 49680 (0.0007) +[2023-10-08 17:43:55,218][21194] Updated weights for policy 1, policy_version 49300 (0.0008) +[2023-10-08 17:43:55,547][21195] Updated weights for policy 0, policy_version 49690 (0.0007) +[2023-10-08 17:43:55,583][21194] Updated weights for policy 1, policy_version 49310 (0.0010) +[2023-10-08 17:43:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 101384192. Throughput: 0: 1728.7, 1: 1715.9. Samples: 25359084. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:43:58,803][19739] Avg episode reward: [(0, '685.230'), (1, '872.090')] +[2023-10-08 17:43:59,460][21194] Updated weights for policy 1, policy_version 49320 (0.0008) +[2023-10-08 17:43:59,542][21195] Updated weights for policy 0, policy_version 49700 (0.0007) +[2023-10-08 17:43:59,828][21194] Updated weights for policy 1, policy_version 49330 (0.0008) +[2023-10-08 17:43:59,912][21195] Updated weights for policy 0, policy_version 49710 (0.0007) +[2023-10-08 17:44:00,189][21194] Updated weights for policy 1, policy_version 49340 (0.0009) +[2023-10-08 17:44:00,273][21195] Updated weights for policy 0, policy_version 49720 (0.0007) +[2023-10-08 17:44:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 101449728. Throughput: 0: 1738.3, 1: 1684.0. Samples: 25374238. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:44:03,803][19739] Avg episode reward: [(0, '698.710'), (1, '857.420')] +[2023-10-08 17:44:04,195][21195] Updated weights for policy 0, policy_version 49730 (0.0008) +[2023-10-08 17:44:04,226][21194] Updated weights for policy 1, policy_version 49350 (0.0008) +[2023-10-08 17:44:04,561][21195] Updated weights for policy 0, policy_version 49740 (0.0008) +[2023-10-08 17:44:04,586][21194] Updated weights for policy 1, policy_version 49360 (0.0009) +[2023-10-08 17:44:04,926][21195] Updated weights for policy 0, policy_version 49750 (0.0008) +[2023-10-08 17:44:04,954][21194] Updated weights for policy 1, policy_version 49370 (0.0008) +[2023-10-08 17:44:05,292][21195] Updated weights for policy 0, policy_version 49760 (0.0007) +[2023-10-08 17:44:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 101515264. Throughput: 0: 1711.2, 1: 1714.4. Samples: 25389552. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:44:08,803][19739] Avg episode reward: [(0, '684.000'), (1, '857.420')] +[2023-10-08 17:44:08,903][21194] Updated weights for policy 1, policy_version 49380 (0.0010) +[2023-10-08 17:44:09,259][21194] Updated weights for policy 1, policy_version 49390 (0.0007) +[2023-10-08 17:44:09,331][21195] Updated weights for policy 0, policy_version 49770 (0.0008) +[2023-10-08 17:44:09,628][21194] Updated weights for policy 1, policy_version 49400 (0.0007) +[2023-10-08 17:44:09,702][21195] Updated weights for policy 0, policy_version 49780 (0.0008) +[2023-10-08 17:44:10,078][21195] Updated weights for policy 0, policy_version 49790 (0.0009) +[2023-10-08 17:44:13,499][21194] Updated weights for policy 1, policy_version 49410 (0.0011) +[2023-10-08 17:44:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 101580800. Throughput: 0: 1725.0, 1: 1719.7. Samples: 25410608. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:44:13,803][19739] Avg episode reward: [(0, '692.720'), (1, '857.420')] +[2023-10-08 17:44:13,854][21194] Updated weights for policy 1, policy_version 49420 (0.0010) +[2023-10-08 17:44:14,222][21194] Updated weights for policy 1, policy_version 49430 (0.0009) +[2023-10-08 17:44:14,251][21195] Updated weights for policy 0, policy_version 49800 (0.0010) +[2023-10-08 17:44:14,587][21194] Updated weights for policy 1, policy_version 49440 (0.0008) +[2023-10-08 17:44:14,625][21195] Updated weights for policy 0, policy_version 49810 (0.0008) +[2023-10-08 17:44:14,991][21195] Updated weights for policy 0, policy_version 49820 (0.0009) +[2023-10-08 17:44:18,632][21194] Updated weights for policy 1, policy_version 49450 (0.0009) +[2023-10-08 17:44:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 101646336. Throughput: 0: 1721.7, 1: 1705.7. Samples: 25425882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:44:18,803][19739] Avg episode reward: [(0, '692.720'), (1, '871.320')] +[2023-10-08 17:44:18,963][21195] Updated weights for policy 0, policy_version 49830 (0.0009) +[2023-10-08 17:44:18,998][21194] Updated weights for policy 1, policy_version 49460 (0.0009) +[2023-10-08 17:44:19,334][21195] Updated weights for policy 0, policy_version 49840 (0.0008) +[2023-10-08 17:44:19,371][21194] Updated weights for policy 1, policy_version 49470 (0.0008) +[2023-10-08 17:44:19,705][21195] Updated weights for policy 0, policy_version 49850 (0.0007) +[2023-10-08 17:44:23,219][21194] Updated weights for policy 1, policy_version 49480 (0.0007) +[2023-10-08 17:44:23,585][21194] Updated weights for policy 1, policy_version 49490 (0.0007) +[2023-10-08 17:44:23,686][21195] Updated weights for policy 0, policy_version 49860 (0.0009) +[2023-10-08 17:44:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 101711872. Throughput: 0: 1719.7, 1: 1725.2. Samples: 25441292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:44:23,803][19739] Avg episode reward: [(0, '692.720'), (1, '871.320')] +[2023-10-08 17:44:23,953][21194] Updated weights for policy 1, policy_version 49500 (0.0007) +[2023-10-08 17:44:24,055][21195] Updated weights for policy 0, policy_version 49870 (0.0007) +[2023-10-08 17:44:24,417][21195] Updated weights for policy 0, policy_version 49880 (0.0009) +[2023-10-08 17:44:27,725][21194] Updated weights for policy 1, policy_version 49510 (0.0008) +[2023-10-08 17:44:28,089][21194] Updated weights for policy 1, policy_version 49520 (0.0010) +[2023-10-08 17:44:28,407][21195] Updated weights for policy 0, policy_version 49890 (0.0008) +[2023-10-08 17:44:28,460][21194] Updated weights for policy 1, policy_version 49530 (0.0009) +[2023-10-08 17:44:28,770][21195] Updated weights for policy 0, policy_version 49900 (0.0012) +[2023-10-08 17:44:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 101810176. Throughput: 0: 1716.9, 1: 1721.2. Samples: 25462548. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:44:28,803][19739] Avg episode reward: [(0, '663.670'), (1, '871.320')] +[2023-10-08 17:44:29,134][21195] Updated weights for policy 0, policy_version 49910 (0.0011) +[2023-10-08 17:44:29,500][21195] Updated weights for policy 0, policy_version 49920 (0.0008) +[2023-10-08 17:44:32,444][21194] Updated weights for policy 1, policy_version 49540 (0.0007) +[2023-10-08 17:44:32,825][21194] Updated weights for policy 1, policy_version 49550 (0.0008) +[2023-10-08 17:44:33,183][21194] Updated weights for policy 1, policy_version 49560 (0.0008) +[2023-10-08 17:44:33,529][21195] Updated weights for policy 0, policy_version 49930 (0.0010) +[2023-10-08 17:44:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 101875712. Throughput: 0: 1700.7, 1: 1735.0. Samples: 25477414. Policy #0 lag: (min: 1.0, avg: 10.3, max: 33.0) +[2023-10-08 17:44:33,803][19739] Avg episode reward: [(0, '663.670'), (1, '871.320')] +[2023-10-08 17:44:33,915][21195] Updated weights for policy 0, policy_version 49940 (0.0009) +[2023-10-08 17:44:34,281][21195] Updated weights for policy 0, policy_version 49950 (0.0009) +[2023-10-08 17:44:37,154][21194] Updated weights for policy 1, policy_version 49570 (0.0010) +[2023-10-08 17:44:37,521][21194] Updated weights for policy 1, policy_version 49580 (0.0007) +[2023-10-08 17:44:37,889][21194] Updated weights for policy 1, policy_version 49590 (0.0010) +[2023-10-08 17:44:38,124][21195] Updated weights for policy 0, policy_version 49960 (0.0008) +[2023-10-08 17:44:38,259][21194] Updated weights for policy 1, policy_version 49600 (0.0008) +[2023-10-08 17:44:38,499][21195] Updated weights for policy 0, policy_version 49970 (0.0008) +[2023-10-08 17:44:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 101941248. Throughput: 0: 1715.1, 1: 1740.6. Samples: 25493312. Policy #0 lag: (min: 1.0, avg: 10.3, max: 33.0) +[2023-10-08 17:44:38,803][19739] Avg episode reward: [(0, '663.670'), (1, '871.320')] +[2023-10-08 17:44:38,859][21195] Updated weights for policy 0, policy_version 49980 (0.0010) +[2023-10-08 17:44:42,202][21194] Updated weights for policy 1, policy_version 49610 (0.0011) +[2023-10-08 17:44:42,565][21194] Updated weights for policy 1, policy_version 49620 (0.0011) +[2023-10-08 17:44:42,776][21195] Updated weights for policy 0, policy_version 49990 (0.0007) +[2023-10-08 17:44:42,937][21194] Updated weights for policy 1, policy_version 49630 (0.0009) +[2023-10-08 17:44:43,146][21195] Updated weights for policy 0, policy_version 50000 (0.0007) +[2023-10-08 17:44:43,508][21195] Updated weights for policy 0, policy_version 50010 (0.0008) +[2023-10-08 17:44:43,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 102039552. Throughput: 0: 1717.0, 1: 1715.1. Samples: 25513528. Policy #0 lag: (min: 1.0, avg: 10.3, max: 33.0) +[2023-10-08 17:44:43,803][19739] Avg episode reward: [(0, '663.670'), (1, '871.320')] +[2023-10-08 17:44:46,919][21194] Updated weights for policy 1, policy_version 49640 (0.0007) +[2023-10-08 17:44:47,287][21194] Updated weights for policy 1, policy_version 49650 (0.0008) +[2023-10-08 17:44:47,350][21195] Updated weights for policy 0, policy_version 50020 (0.0009) +[2023-10-08 17:44:47,655][21194] Updated weights for policy 1, policy_version 49660 (0.0010) +[2023-10-08 17:44:47,719][21195] Updated weights for policy 0, policy_version 50030 (0.0008) +[2023-10-08 17:44:48,081][21195] Updated weights for policy 0, policy_version 50040 (0.0008) +[2023-10-08 17:44:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 102105088. Throughput: 0: 1697.6, 1: 1744.0. Samples: 25529112. Policy #0 lag: (min: 1.0, avg: 10.3, max: 33.0) +[2023-10-08 17:44:48,803][19739] Avg episode reward: [(0, '668.910'), (1, '881.790')] +[2023-10-08 17:44:51,714][21194] Updated weights for policy 1, policy_version 49670 (0.0010) +[2023-10-08 17:44:52,022][21195] Updated weights for policy 0, policy_version 50050 (0.0009) +[2023-10-08 17:44:52,072][21194] Updated weights for policy 1, policy_version 49680 (0.0010) +[2023-10-08 17:44:52,387][21195] Updated weights for policy 0, policy_version 50060 (0.0008) +[2023-10-08 17:44:52,434][21194] Updated weights for policy 1, policy_version 49690 (0.0007) +[2023-10-08 17:44:52,755][21195] Updated weights for policy 0, policy_version 50070 (0.0009) +[2023-10-08 17:44:53,134][21195] Updated weights for policy 0, policy_version 50080 (0.0008) +[2023-10-08 17:44:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 102170624. Throughput: 0: 1727.8, 1: 1724.9. Samples: 25544926. Policy #0 lag: (min: 1.0, avg: 10.3, max: 33.0) +[2023-10-08 17:44:53,803][19739] Avg episode reward: [(0, '668.920'), (1, '881.790')] +[2023-10-08 17:44:56,491][21194] Updated weights for policy 1, policy_version 49700 (0.0008) +[2023-10-08 17:44:56,849][21194] Updated weights for policy 1, policy_version 49710 (0.0007) +[2023-10-08 17:44:56,992][21195] Updated weights for policy 0, policy_version 50090 (0.0007) +[2023-10-08 17:44:57,221][21194] Updated weights for policy 1, policy_version 49720 (0.0009) +[2023-10-08 17:44:57,360][21195] Updated weights for policy 0, policy_version 50100 (0.0007) +[2023-10-08 17:44:57,723][21195] Updated weights for policy 0, policy_version 50110 (0.0007) +[2023-10-08 17:44:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 102236160. Throughput: 0: 1711.1, 1: 1706.6. Samples: 25564404. Policy #0 lag: (min: 1.0, avg: 10.3, max: 33.0) +[2023-10-08 17:44:58,804][19739] Avg episode reward: [(0, '668.920'), (1, '836.040')] +[2023-10-08 17:45:01,254][21194] Updated weights for policy 1, policy_version 49730 (0.0008) +[2023-10-08 17:45:01,452][21195] Updated weights for policy 0, policy_version 50120 (0.0008) +[2023-10-08 17:45:01,615][21194] Updated weights for policy 1, policy_version 49740 (0.0007) +[2023-10-08 17:45:01,818][21195] Updated weights for policy 0, policy_version 50130 (0.0007) +[2023-10-08 17:45:01,982][21194] Updated weights for policy 1, policy_version 49750 (0.0008) +[2023-10-08 17:45:02,182][21195] Updated weights for policy 0, policy_version 50140 (0.0008) +[2023-10-08 17:45:02,342][21194] Updated weights for policy 1, policy_version 49760 (0.0007) +[2023-10-08 17:45:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 102301696. Throughput: 0: 1716.2, 1: 1733.2. Samples: 25581106. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:03,804][19739] Avg episode reward: [(0, '669.430'), (1, '836.040')] +[2023-10-08 17:45:06,209][21195] Updated weights for policy 0, policy_version 50150 (0.0008) +[2023-10-08 17:45:06,394][21194] Updated weights for policy 1, policy_version 49770 (0.0008) +[2023-10-08 17:45:06,577][21195] Updated weights for policy 0, policy_version 50160 (0.0008) +[2023-10-08 17:45:06,767][21194] Updated weights for policy 1, policy_version 49780 (0.0008) +[2023-10-08 17:45:06,943][21195] Updated weights for policy 0, policy_version 50170 (0.0007) +[2023-10-08 17:45:07,138][21194] Updated weights for policy 1, policy_version 49790 (0.0008) +[2023-10-08 17:45:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 102367232. Throughput: 0: 1724.7, 1: 1702.6. Samples: 25595518. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:08,803][19739] Avg episode reward: [(0, '669.430'), (1, '836.040')] +[2023-10-08 17:45:10,785][21195] Updated weights for policy 0, policy_version 50180 (0.0008) +[2023-10-08 17:45:10,934][21194] Updated weights for policy 1, policy_version 49800 (0.0008) +[2023-10-08 17:45:11,153][21195] Updated weights for policy 0, policy_version 50190 (0.0007) +[2023-10-08 17:45:11,294][21194] Updated weights for policy 1, policy_version 49810 (0.0008) +[2023-10-08 17:45:11,514][21195] Updated weights for policy 0, policy_version 50200 (0.0008) +[2023-10-08 17:45:11,658][21194] Updated weights for policy 1, policy_version 49820 (0.0008) +[2023-10-08 17:45:13,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 102432768. Throughput: 0: 1718.6, 1: 1699.9. Samples: 25616378. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:13,803][19739] Avg episode reward: [(0, '669.430'), (1, '836.040')] +[2023-10-08 17:45:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000050208_51412992.pth... +[2023-10-08 17:45:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000049824_51019776.pth... +[2023-10-08 17:45:13,864][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000048224_49381376.pth +[2023-10-08 17:45:13,865][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000048608_49774592.pth +[2023-10-08 17:45:15,540][21194] Updated weights for policy 1, policy_version 49830 (0.0009) +[2023-10-08 17:45:15,590][21195] Updated weights for policy 0, policy_version 50210 (0.0008) +[2023-10-08 17:45:15,905][21194] Updated weights for policy 1, policy_version 49840 (0.0007) +[2023-10-08 17:45:15,962][21195] Updated weights for policy 0, policy_version 50220 (0.0008) +[2023-10-08 17:45:16,271][21194] Updated weights for policy 1, policy_version 49850 (0.0007) +[2023-10-08 17:45:16,331][21195] Updated weights for policy 0, policy_version 50230 (0.0007) +[2023-10-08 17:45:16,707][21195] Updated weights for policy 0, policy_version 50240 (0.0008) +[2023-10-08 17:45:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 102498304. Throughput: 0: 1738.6, 1: 1706.8. Samples: 25632454. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:18,803][19739] Avg episode reward: [(0, '669.430'), (1, '849.190')] +[2023-10-08 17:45:20,280][21194] Updated weights for policy 1, policy_version 49860 (0.0007) +[2023-10-08 17:45:20,639][21195] Updated weights for policy 0, policy_version 50250 (0.0007) +[2023-10-08 17:45:20,650][21194] Updated weights for policy 1, policy_version 49870 (0.0009) +[2023-10-08 17:45:20,999][21195] Updated weights for policy 0, policy_version 50260 (0.0008) +[2023-10-08 17:45:21,006][21194] Updated weights for policy 1, policy_version 49880 (0.0007) +[2023-10-08 17:45:21,375][21195] Updated weights for policy 0, policy_version 50270 (0.0008) +[2023-10-08 17:45:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 102563840. Throughput: 0: 1729.2, 1: 1697.8. Samples: 25647528. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:23,804][19739] Avg episode reward: [(0, '669.430'), (1, '840.320')] +[2023-10-08 17:45:24,849][21194] Updated weights for policy 1, policy_version 49890 (0.0008) +[2023-10-08 17:45:25,221][21194] Updated weights for policy 1, policy_version 49900 (0.0008) +[2023-10-08 17:45:25,488][21195] Updated weights for policy 0, policy_version 50280 (0.0009) +[2023-10-08 17:45:25,580][21194] Updated weights for policy 1, policy_version 49910 (0.0010) +[2023-10-08 17:45:25,869][21195] Updated weights for policy 0, policy_version 50290 (0.0008) +[2023-10-08 17:45:25,944][21194] Updated weights for policy 1, policy_version 49920 (0.0009) +[2023-10-08 17:45:26,229][21195] Updated weights for policy 0, policy_version 50300 (0.0008) +[2023-10-08 17:45:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 102629376. Throughput: 0: 1724.2, 1: 1727.8. Samples: 25668868. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:28,803][19739] Avg episode reward: [(0, '669.430'), (1, '841.280')] +[2023-10-08 17:45:29,776][21194] Updated weights for policy 1, policy_version 49930 (0.0008) +[2023-10-08 17:45:30,139][21194] Updated weights for policy 1, policy_version 49940 (0.0007) +[2023-10-08 17:45:30,225][21195] Updated weights for policy 0, policy_version 50310 (0.0008) +[2023-10-08 17:45:30,513][21194] Updated weights for policy 1, policy_version 49950 (0.0008) +[2023-10-08 17:45:30,597][21195] Updated weights for policy 0, policy_version 50320 (0.0008) +[2023-10-08 17:45:30,968][21195] Updated weights for policy 0, policy_version 50330 (0.0008) +[2023-10-08 17:45:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 102694912. Throughput: 0: 1745.7, 1: 1699.1. Samples: 25684128. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 17:45:33,803][19739] Avg episode reward: [(0, '696.590'), (1, '841.280')] +[2023-10-08 17:45:34,661][21194] Updated weights for policy 1, policy_version 49960 (0.0007) +[2023-10-08 17:45:34,909][21195] Updated weights for policy 0, policy_version 50340 (0.0007) +[2023-10-08 17:45:35,029][21194] Updated weights for policy 1, policy_version 49970 (0.0008) +[2023-10-08 17:45:35,271][21195] Updated weights for policy 0, policy_version 50350 (0.0007) +[2023-10-08 17:45:35,390][21194] Updated weights for policy 1, policy_version 49980 (0.0009) +[2023-10-08 17:45:35,638][21195] Updated weights for policy 0, policy_version 50360 (0.0009) +[2023-10-08 17:45:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 102760448. Throughput: 0: 1715.7, 1: 1719.7. Samples: 25699520. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:45:38,803][19739] Avg episode reward: [(0, '696.590'), (1, '841.280')] +[2023-10-08 17:45:39,320][21194] Updated weights for policy 1, policy_version 49990 (0.0009) +[2023-10-08 17:45:39,530][21195] Updated weights for policy 0, policy_version 50370 (0.0010) +[2023-10-08 17:45:39,683][21194] Updated weights for policy 1, policy_version 50000 (0.0007) +[2023-10-08 17:45:39,898][21195] Updated weights for policy 0, policy_version 50380 (0.0009) +[2023-10-08 17:45:40,043][21194] Updated weights for policy 1, policy_version 50010 (0.0008) +[2023-10-08 17:45:40,262][21195] Updated weights for policy 0, policy_version 50390 (0.0009) +[2023-10-08 17:45:40,630][21195] Updated weights for policy 0, policy_version 50400 (0.0010) +[2023-10-08 17:45:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 102825984. Throughput: 0: 1741.5, 1: 1736.9. Samples: 25720930. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:45:43,803][19739] Avg episode reward: [(0, '696.590'), (1, '841.280')] +[2023-10-08 17:45:44,054][21194] Updated weights for policy 1, policy_version 50020 (0.0010) +[2023-10-08 17:45:44,424][21194] Updated weights for policy 1, policy_version 50030 (0.0008) +[2023-10-08 17:45:44,577][21195] Updated weights for policy 0, policy_version 50410 (0.0009) +[2023-10-08 17:45:44,780][21194] Updated weights for policy 1, policy_version 50040 (0.0007) +[2023-10-08 17:45:44,947][21195] Updated weights for policy 0, policy_version 50420 (0.0008) +[2023-10-08 17:45:45,314][21195] Updated weights for policy 0, policy_version 50430 (0.0010) +[2023-10-08 17:45:48,715][21194] Updated weights for policy 1, policy_version 50050 (0.0007) +[2023-10-08 17:45:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 102891520. Throughput: 0: 1739.4, 1: 1710.6. Samples: 25736354. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:45:48,803][19739] Avg episode reward: [(0, '711.500'), (1, '855.380')] +[2023-10-08 17:45:49,073][21194] Updated weights for policy 1, policy_version 50060 (0.0007) +[2023-10-08 17:45:49,213][21195] Updated weights for policy 0, policy_version 50440 (0.0008) +[2023-10-08 17:45:49,443][21194] Updated weights for policy 1, policy_version 50070 (0.0008) +[2023-10-08 17:45:49,580][21195] Updated weights for policy 0, policy_version 50450 (0.0008) +[2023-10-08 17:45:49,797][21194] Updated weights for policy 1, policy_version 50080 (0.0008) +[2023-10-08 17:45:49,947][21195] Updated weights for policy 0, policy_version 50460 (0.0009) +[2023-10-08 17:45:53,720][21195] Updated weights for policy 0, policy_version 50470 (0.0010) +[2023-10-08 17:45:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 102957056. Throughput: 0: 1731.5, 1: 1738.5. Samples: 25751668. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:45:53,803][19739] Avg episode reward: [(0, '711.500'), (1, '855.380')] +[2023-10-08 17:45:53,910][21194] Updated weights for policy 1, policy_version 50090 (0.0010) +[2023-10-08 17:45:54,097][21195] Updated weights for policy 0, policy_version 50480 (0.0008) +[2023-10-08 17:45:54,278][21194] Updated weights for policy 1, policy_version 50100 (0.0009) +[2023-10-08 17:45:54,462][21195] Updated weights for policy 0, policy_version 50490 (0.0009) +[2023-10-08 17:45:54,650][21194] Updated weights for policy 1, policy_version 50110 (0.0009) +[2023-10-08 17:45:58,282][21195] Updated weights for policy 0, policy_version 50500 (0.0007) +[2023-10-08 17:45:58,537][21194] Updated weights for policy 1, policy_version 50120 (0.0007) +[2023-10-08 17:45:58,648][21195] Updated weights for policy 0, policy_version 50510 (0.0008) +[2023-10-08 17:45:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 103022592. Throughput: 0: 1743.4, 1: 1743.1. Samples: 25773272. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:45:58,803][19739] Avg episode reward: [(0, '711.500'), (1, '855.380')] +[2023-10-08 17:45:58,906][21194] Updated weights for policy 1, policy_version 50130 (0.0007) +[2023-10-08 17:45:59,022][21195] Updated weights for policy 0, policy_version 50520 (0.0010) +[2023-10-08 17:45:59,267][21194] Updated weights for policy 1, policy_version 50140 (0.0007) +[2023-10-08 17:46:02,995][21195] Updated weights for policy 0, policy_version 50530 (0.0008) +[2023-10-08 17:46:03,178][21194] Updated weights for policy 1, policy_version 50150 (0.0009) +[2023-10-08 17:46:03,362][21195] Updated weights for policy 0, policy_version 50540 (0.0008) +[2023-10-08 17:46:03,540][21194] Updated weights for policy 1, policy_version 50160 (0.0007) +[2023-10-08 17:46:03,733][21195] Updated weights for policy 0, policy_version 50550 (0.0008) +[2023-10-08 17:46:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 103088128. Throughput: 0: 1719.1, 1: 1722.0. Samples: 25787300. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:46:03,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.490')] +[2023-10-08 17:46:03,904][21194] Updated weights for policy 1, policy_version 50170 (0.0009) +[2023-10-08 17:46:04,098][21195] Updated weights for policy 0, policy_version 50560 (0.0008) +[2023-10-08 17:46:07,906][21194] Updated weights for policy 1, policy_version 50180 (0.0009) +[2023-10-08 17:46:08,116][21195] Updated weights for policy 0, policy_version 50570 (0.0007) +[2023-10-08 17:46:08,267][21194] Updated weights for policy 1, policy_version 50190 (0.0007) +[2023-10-08 17:46:08,480][21195] Updated weights for policy 0, policy_version 50580 (0.0007) +[2023-10-08 17:46:08,632][21194] Updated weights for policy 1, policy_version 50200 (0.0007) +[2023-10-08 17:46:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 103153664. Throughput: 0: 1736.0, 1: 1731.5. Samples: 25803564. Policy #0 lag: (min: 14.0, avg: 15.8, max: 43.0) +[2023-10-08 17:46:08,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.490')] +[2023-10-08 17:46:08,860][21195] Updated weights for policy 0, policy_version 50590 (0.0008) +[2023-10-08 17:46:12,697][21194] Updated weights for policy 1, policy_version 50210 (0.0010) +[2023-10-08 17:46:12,834][21195] Updated weights for policy 0, policy_version 50600 (0.0008) +[2023-10-08 17:46:13,059][21194] Updated weights for policy 1, policy_version 50220 (0.0008) +[2023-10-08 17:46:13,199][21195] Updated weights for policy 0, policy_version 50610 (0.0009) +[2023-10-08 17:46:13,417][21194] Updated weights for policy 1, policy_version 50230 (0.0008) +[2023-10-08 17:46:13,568][21195] Updated weights for policy 0, policy_version 50620 (0.0008) +[2023-10-08 17:46:13,776][21194] Updated weights for policy 1, policy_version 50240 (0.0009) +[2023-10-08 17:46:13,803][19739] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 103284736. Throughput: 0: 1732.7, 1: 1715.4. Samples: 25824032. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:46:13,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.490')] +[2023-10-08 17:46:17,595][21195] Updated weights for policy 0, policy_version 50630 (0.0007) +[2023-10-08 17:46:17,672][21194] Updated weights for policy 1, policy_version 50250 (0.0010) +[2023-10-08 17:46:17,957][21195] Updated weights for policy 0, policy_version 50640 (0.0007) +[2023-10-08 17:46:18,030][21194] Updated weights for policy 1, policy_version 50260 (0.0009) +[2023-10-08 17:46:18,322][21195] Updated weights for policy 0, policy_version 50650 (0.0009) +[2023-10-08 17:46:18,397][21194] Updated weights for policy 1, policy_version 50270 (0.0008) +[2023-10-08 17:46:18,803][19739] Fps is (10 sec: 19660.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 103350272. Throughput: 0: 1709.6, 1: 1728.3. Samples: 25838832. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:46:18,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.490')] +[2023-10-08 17:46:22,241][21195] Updated weights for policy 0, policy_version 50660 (0.0007) +[2023-10-08 17:46:22,345][21194] Updated weights for policy 1, policy_version 50280 (0.0009) +[2023-10-08 17:46:22,615][21195] Updated weights for policy 0, policy_version 50670 (0.0008) +[2023-10-08 17:46:22,715][21194] Updated weights for policy 1, policy_version 50290 (0.0008) +[2023-10-08 17:46:22,977][21195] Updated weights for policy 0, policy_version 50680 (0.0009) +[2023-10-08 17:46:23,080][21194] Updated weights for policy 1, policy_version 50300 (0.0008) +[2023-10-08 17:46:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 103415808. Throughput: 0: 1737.9, 1: 1728.1. Samples: 25855492. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:46:23,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.380')] +[2023-10-08 17:46:26,931][21195] Updated weights for policy 0, policy_version 50690 (0.0008) +[2023-10-08 17:46:27,001][21194] Updated weights for policy 1, policy_version 50310 (0.0008) +[2023-10-08 17:46:27,288][21195] Updated weights for policy 0, policy_version 50700 (0.0007) +[2023-10-08 17:46:27,371][21194] Updated weights for policy 1, policy_version 50320 (0.0009) +[2023-10-08 17:46:27,657][21195] Updated weights for policy 0, policy_version 50710 (0.0007) +[2023-10-08 17:46:27,735][21194] Updated weights for policy 1, policy_version 50330 (0.0008) +[2023-10-08 17:46:28,025][21195] Updated weights for policy 0, policy_version 50720 (0.0007) +[2023-10-08 17:46:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 103481344. Throughput: 0: 1714.7, 1: 1700.5. Samples: 25874614. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:46:28,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.380')] +[2023-10-08 17:46:31,713][21195] Updated weights for policy 0, policy_version 50730 (0.0008) +[2023-10-08 17:46:31,823][21194] Updated weights for policy 1, policy_version 50340 (0.0007) +[2023-10-08 17:46:32,081][21195] Updated weights for policy 0, policy_version 50740 (0.0009) +[2023-10-08 17:46:32,194][21194] Updated weights for policy 1, policy_version 50350 (0.0010) +[2023-10-08 17:46:32,452][21195] Updated weights for policy 0, policy_version 50750 (0.0010) +[2023-10-08 17:46:32,565][21194] Updated weights for policy 1, policy_version 50360 (0.0007) +[2023-10-08 17:46:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 103546880. Throughput: 0: 1712.8, 1: 1728.4. Samples: 25891208. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:46:33,804][19739] Avg episode reward: [(0, '734.540'), (1, '839.380')] +[2023-10-08 17:46:36,314][21195] Updated weights for policy 0, policy_version 50760 (0.0009) +[2023-10-08 17:46:36,687][21194] Updated weights for policy 1, policy_version 50370 (0.0007) +[2023-10-08 17:46:36,687][21195] Updated weights for policy 0, policy_version 50770 (0.0007) +[2023-10-08 17:46:37,051][21194] Updated weights for policy 1, policy_version 50380 (0.0009) +[2023-10-08 17:46:37,056][21195] Updated weights for policy 0, policy_version 50780 (0.0008) +[2023-10-08 17:46:37,415][21194] Updated weights for policy 1, policy_version 50390 (0.0007) +[2023-10-08 17:46:37,779][21194] Updated weights for policy 1, policy_version 50400 (0.0007) +[2023-10-08 17:46:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 103612416. Throughput: 0: 1727.7, 1: 1712.2. Samples: 25906466. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 17:46:38,803][19739] Avg episode reward: [(0, '734.540'), (1, '839.380')] +[2023-10-08 17:46:40,947][21195] Updated weights for policy 0, policy_version 50790 (0.0009) +[2023-10-08 17:46:41,308][21195] Updated weights for policy 0, policy_version 50800 (0.0009) +[2023-10-08 17:46:41,673][21195] Updated weights for policy 0, policy_version 50810 (0.0008) +[2023-10-08 17:46:41,858][21194] Updated weights for policy 1, policy_version 50410 (0.0008) +[2023-10-08 17:46:42,229][21194] Updated weights for policy 1, policy_version 50420 (0.0008) +[2023-10-08 17:46:42,590][21194] Updated weights for policy 1, policy_version 50430 (0.0009) +[2023-10-08 17:46:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 103677952. Throughput: 0: 1708.7, 1: 1690.1. Samples: 25926218. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:46:43,803][19739] Avg episode reward: [(0, '734.540'), (1, '846.480')] +[2023-10-08 17:46:45,562][21195] Updated weights for policy 0, policy_version 50820 (0.0007) +[2023-10-08 17:46:45,938][21195] Updated weights for policy 0, policy_version 50830 (0.0010) +[2023-10-08 17:46:46,313][21195] Updated weights for policy 0, policy_version 50840 (0.0009) +[2023-10-08 17:46:46,533][21194] Updated weights for policy 1, policy_version 50440 (0.0008) +[2023-10-08 17:46:46,890][21194] Updated weights for policy 1, policy_version 50450 (0.0009) +[2023-10-08 17:46:47,258][21194] Updated weights for policy 1, policy_version 50460 (0.0009) +[2023-10-08 17:46:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 103743488. Throughput: 0: 1736.0, 1: 1720.9. Samples: 25942860. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:46:48,803][19739] Avg episode reward: [(0, '734.540'), (1, '861.430')] +[2023-10-08 17:46:50,232][21195] Updated weights for policy 0, policy_version 50850 (0.0007) +[2023-10-08 17:46:50,604][21195] Updated weights for policy 0, policy_version 50860 (0.0009) +[2023-10-08 17:46:50,973][21195] Updated weights for policy 0, policy_version 50870 (0.0008) +[2023-10-08 17:46:51,285][21194] Updated weights for policy 1, policy_version 50470 (0.0010) +[2023-10-08 17:46:51,342][21195] Updated weights for policy 0, policy_version 50880 (0.0007) +[2023-10-08 17:46:51,641][21194] Updated weights for policy 1, policy_version 50480 (0.0010) +[2023-10-08 17:46:52,014][21194] Updated weights for policy 1, policy_version 50490 (0.0007) +[2023-10-08 17:46:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 103809024. Throughput: 0: 1717.2, 1: 1693.3. Samples: 25957038. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:46:53,803][19739] Avg episode reward: [(0, '734.540'), (1, '861.430')] +[2023-10-08 17:46:55,201][21195] Updated weights for policy 0, policy_version 50890 (0.0009) +[2023-10-08 17:46:55,571][21195] Updated weights for policy 0, policy_version 50900 (0.0007) +[2023-10-08 17:46:55,914][21194] Updated weights for policy 1, policy_version 50500 (0.0008) +[2023-10-08 17:46:55,937][21195] Updated weights for policy 0, policy_version 50910 (0.0008) +[2023-10-08 17:46:56,267][21194] Updated weights for policy 1, policy_version 50510 (0.0010) +[2023-10-08 17:46:56,629][21194] Updated weights for policy 1, policy_version 50520 (0.0008) +[2023-10-08 17:46:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 103874560. Throughput: 0: 1728.8, 1: 1697.5. Samples: 25978216. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:46:58,803][19739] Avg episode reward: [(0, '734.540'), (1, '861.430')] +[2023-10-08 17:46:59,769][21195] Updated weights for policy 0, policy_version 50920 (0.0008) +[2023-10-08 17:47:00,145][21195] Updated weights for policy 0, policy_version 50930 (0.0008) +[2023-10-08 17:47:00,511][21195] Updated weights for policy 0, policy_version 50940 (0.0009) +[2023-10-08 17:47:00,660][21194] Updated weights for policy 1, policy_version 50530 (0.0008) +[2023-10-08 17:47:01,023][21194] Updated weights for policy 1, policy_version 50540 (0.0009) +[2023-10-08 17:47:01,386][21194] Updated weights for policy 1, policy_version 50550 (0.0008) +[2023-10-08 17:47:01,746][21194] Updated weights for policy 1, policy_version 50560 (0.0008) +[2023-10-08 17:47:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 103940096. Throughput: 0: 1758.2, 1: 1702.6. Samples: 25994568. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:47:03,803][19739] Avg episode reward: [(0, '738.330'), (1, '861.430')] +[2023-10-08 17:47:04,370][21195] Updated weights for policy 0, policy_version 50950 (0.0007) +[2023-10-08 17:47:04,741][21195] Updated weights for policy 0, policy_version 50960 (0.0008) +[2023-10-08 17:47:05,113][21195] Updated weights for policy 0, policy_version 50970 (0.0008) +[2023-10-08 17:47:05,708][21194] Updated weights for policy 1, policy_version 50570 (0.0009) +[2023-10-08 17:47:06,075][21194] Updated weights for policy 1, policy_version 50580 (0.0010) +[2023-10-08 17:47:06,437][21194] Updated weights for policy 1, policy_version 50590 (0.0007) +[2023-10-08 17:47:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 104005632. Throughput: 0: 1734.0, 1: 1682.2. Samples: 26009218. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:47:08,803][19739] Avg episode reward: [(0, '738.330'), (1, '861.430')] +[2023-10-08 17:47:09,122][21195] Updated weights for policy 0, policy_version 50980 (0.0009) +[2023-10-08 17:47:09,496][21195] Updated weights for policy 0, policy_version 50990 (0.0010) +[2023-10-08 17:47:09,868][21195] Updated weights for policy 0, policy_version 51000 (0.0011) +[2023-10-08 17:47:10,459][21194] Updated weights for policy 1, policy_version 50600 (0.0010) +[2023-10-08 17:47:10,830][21194] Updated weights for policy 1, policy_version 50610 (0.0010) +[2023-10-08 17:47:11,188][21194] Updated weights for policy 1, policy_version 50620 (0.0010) +[2023-10-08 17:47:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 104071168. Throughput: 0: 1757.0, 1: 1708.5. Samples: 26030562. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 17:47:13,803][19739] Avg episode reward: [(0, '738.330'), (1, '861.430')] +[2023-10-08 17:47:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000050624_51838976.pth... +[2023-10-08 17:47:13,840][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000049024_50200576.pth +[2023-10-08 17:47:13,842][21195] Updated weights for policy 0, policy_version 51010 (0.0009) +[2023-10-08 17:47:14,216][21195] Updated weights for policy 0, policy_version 51020 (0.0008) +[2023-10-08 17:47:14,599][21195] Updated weights for policy 0, policy_version 51030 (0.0009) +[2023-10-08 17:47:14,966][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000051040_52264960.pth... +[2023-10-08 17:47:14,967][21195] Updated weights for policy 0, policy_version 51040 (0.0008) +[2023-10-08 17:47:15,001][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000049408_50593792.pth +[2023-10-08 17:47:15,201][21194] Updated weights for policy 1, policy_version 50630 (0.0008) +[2023-10-08 17:47:15,573][21194] Updated weights for policy 1, policy_version 50640 (0.0008) +[2023-10-08 17:47:15,931][21194] Updated weights for policy 1, policy_version 50650 (0.0008) +[2023-10-08 17:47:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 104136704. Throughput: 0: 1752.7, 1: 1685.3. Samples: 26045920. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:18,803][19739] Avg episode reward: [(0, '743.340'), (1, '861.430')] +[2023-10-08 17:47:19,066][21195] Updated weights for policy 0, policy_version 51050 (0.0007) +[2023-10-08 17:47:19,434][21195] Updated weights for policy 0, policy_version 51060 (0.0008) +[2023-10-08 17:47:19,801][21195] Updated weights for policy 0, policy_version 51070 (0.0009) +[2023-10-08 17:47:19,895][21194] Updated weights for policy 1, policy_version 50660 (0.0009) +[2023-10-08 17:47:20,247][21194] Updated weights for policy 1, policy_version 50670 (0.0010) +[2023-10-08 17:47:20,619][21194] Updated weights for policy 1, policy_version 50680 (0.0010) +[2023-10-08 17:47:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 104202240. Throughput: 0: 1737.7, 1: 1697.6. Samples: 26061056. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:23,803][19739] Avg episode reward: [(0, '674.430'), (1, '861.440')] +[2023-10-08 17:47:23,811][21195] Updated weights for policy 0, policy_version 51080 (0.0009) +[2023-10-08 17:47:24,177][21195] Updated weights for policy 0, policy_version 51090 (0.0010) +[2023-10-08 17:47:24,549][21195] Updated weights for policy 0, policy_version 51100 (0.0007) +[2023-10-08 17:47:24,593][21194] Updated weights for policy 1, policy_version 50690 (0.0009) +[2023-10-08 17:47:24,954][21194] Updated weights for policy 1, policy_version 50700 (0.0011) +[2023-10-08 17:47:25,319][21194] Updated weights for policy 1, policy_version 50710 (0.0008) +[2023-10-08 17:47:25,692][21194] Updated weights for policy 1, policy_version 50720 (0.0009) +[2023-10-08 17:47:28,424][21195] Updated weights for policy 0, policy_version 51110 (0.0009) +[2023-10-08 17:47:28,798][21195] Updated weights for policy 0, policy_version 51120 (0.0010) +[2023-10-08 17:47:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 104267776. Throughput: 0: 1756.8, 1: 1725.6. Samples: 26082924. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:28,803][19739] Avg episode reward: [(0, '674.650'), (1, '862.420')] +[2023-10-08 17:47:29,178][21195] Updated weights for policy 0, policy_version 51130 (0.0010) +[2023-10-08 17:47:29,610][21194] Updated weights for policy 1, policy_version 50730 (0.0007) +[2023-10-08 17:47:29,971][21194] Updated weights for policy 1, policy_version 50740 (0.0007) +[2023-10-08 17:47:30,331][21194] Updated weights for policy 1, policy_version 50750 (0.0007) +[2023-10-08 17:47:33,075][21195] Updated weights for policy 0, policy_version 51140 (0.0008) +[2023-10-08 17:47:33,437][21195] Updated weights for policy 0, policy_version 51150 (0.0008) +[2023-10-08 17:47:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 104333312. Throughput: 0: 1735.8, 1: 1694.0. Samples: 26097200. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:33,803][19739] Avg episode reward: [(0, '674.650'), (1, '862.420')] +[2023-10-08 17:47:33,814][21195] Updated weights for policy 0, policy_version 51160 (0.0009) +[2023-10-08 17:47:34,177][21194] Updated weights for policy 1, policy_version 50760 (0.0008) +[2023-10-08 17:47:34,539][21194] Updated weights for policy 1, policy_version 50770 (0.0009) +[2023-10-08 17:47:34,904][21194] Updated weights for policy 1, policy_version 50780 (0.0008) +[2023-10-08 17:47:37,743][21195] Updated weights for policy 0, policy_version 51170 (0.0007) +[2023-10-08 17:47:38,115][21195] Updated weights for policy 0, policy_version 51180 (0.0007) +[2023-10-08 17:47:38,486][21195] Updated weights for policy 0, policy_version 51190 (0.0008) +[2023-10-08 17:47:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 104398848. Throughput: 0: 1755.0, 1: 1722.0. Samples: 26113504. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:38,803][19739] Avg episode reward: [(0, '689.460'), (1, '847.780')] +[2023-10-08 17:47:38,857][21195] Updated weights for policy 0, policy_version 51200 (0.0008) +[2023-10-08 17:47:38,916][21194] Updated weights for policy 1, policy_version 50790 (0.0008) +[2023-10-08 17:47:39,281][21194] Updated weights for policy 1, policy_version 50800 (0.0010) +[2023-10-08 17:47:39,649][21194] Updated weights for policy 1, policy_version 50810 (0.0009) +[2023-10-08 17:47:42,778][21195] Updated weights for policy 0, policy_version 51210 (0.0007) +[2023-10-08 17:47:43,146][21195] Updated weights for policy 0, policy_version 51220 (0.0008) +[2023-10-08 17:47:43,518][21195] Updated weights for policy 0, policy_version 51230 (0.0007) +[2023-10-08 17:47:43,733][21194] Updated weights for policy 1, policy_version 50820 (0.0009) +[2023-10-08 17:47:43,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 104497152. Throughput: 0: 1737.5, 1: 1731.2. Samples: 26134310. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:43,804][19739] Avg episode reward: [(0, '718.200'), (1, '847.780')] +[2023-10-08 17:47:44,109][21194] Updated weights for policy 1, policy_version 50830 (0.0010) +[2023-10-08 17:47:44,478][21194] Updated weights for policy 1, policy_version 50840 (0.0009) +[2023-10-08 17:47:47,388][21195] Updated weights for policy 0, policy_version 51240 (0.0009) +[2023-10-08 17:47:47,760][21195] Updated weights for policy 0, policy_version 51250 (0.0010) +[2023-10-08 17:47:48,133][21195] Updated weights for policy 0, policy_version 51260 (0.0010) +[2023-10-08 17:47:48,446][21194] Updated weights for policy 1, policy_version 50850 (0.0008) +[2023-10-08 17:47:48,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 104562688. Throughput: 0: 1713.4, 1: 1711.8. Samples: 26148700. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:48,803][19739] Avg episode reward: [(0, '718.200'), (1, '835.850')] +[2023-10-08 17:47:48,806][21194] Updated weights for policy 1, policy_version 50860 (0.0009) +[2023-10-08 17:47:49,187][21194] Updated weights for policy 1, policy_version 50870 (0.0008) +[2023-10-08 17:47:49,555][21194] Updated weights for policy 1, policy_version 50880 (0.0009) +[2023-10-08 17:47:52,049][21195] Updated weights for policy 0, policy_version 51270 (0.0010) +[2023-10-08 17:47:52,414][21195] Updated weights for policy 0, policy_version 51280 (0.0008) +[2023-10-08 17:47:52,784][21195] Updated weights for policy 0, policy_version 51290 (0.0010) +[2023-10-08 17:47:53,536][21194] Updated weights for policy 1, policy_version 50890 (0.0007) +[2023-10-08 17:47:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 104628224. Throughput: 0: 1740.1, 1: 1728.7. Samples: 26165312. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:53,803][19739] Avg episode reward: [(0, '718.200'), (1, '835.850')] +[2023-10-08 17:47:53,894][21194] Updated weights for policy 1, policy_version 50900 (0.0007) +[2023-10-08 17:47:54,271][21194] Updated weights for policy 1, policy_version 50910 (0.0009) +[2023-10-08 17:47:56,598][21195] Updated weights for policy 0, policy_version 51300 (0.0009) +[2023-10-08 17:47:56,966][21195] Updated weights for policy 0, policy_version 51310 (0.0007) +[2023-10-08 17:47:57,341][21195] Updated weights for policy 0, policy_version 51320 (0.0007) +[2023-10-08 17:47:58,217][21194] Updated weights for policy 1, policy_version 50920 (0.0008) +[2023-10-08 17:47:58,587][21194] Updated weights for policy 1, policy_version 50930 (0.0009) +[2023-10-08 17:47:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 104693760. Throughput: 0: 1714.0, 1: 1725.7. Samples: 26185346. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:47:58,803][19739] Avg episode reward: [(0, '732.360'), (1, '830.490')] +[2023-10-08 17:47:58,958][21194] Updated weights for policy 1, policy_version 50940 (0.0010) +[2023-10-08 17:48:01,167][21195] Updated weights for policy 0, policy_version 51330 (0.0007) +[2023-10-08 17:48:01,529][21195] Updated weights for policy 0, policy_version 51340 (0.0008) +[2023-10-08 17:48:01,896][21195] Updated weights for policy 0, policy_version 51350 (0.0010) +[2023-10-08 17:48:02,264][21195] Updated weights for policy 0, policy_version 51360 (0.0011) +[2023-10-08 17:48:02,996][21194] Updated weights for policy 1, policy_version 50950 (0.0008) +[2023-10-08 17:48:03,358][21194] Updated weights for policy 1, policy_version 50960 (0.0007) +[2023-10-08 17:48:03,732][21194] Updated weights for policy 1, policy_version 50970 (0.0008) +[2023-10-08 17:48:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 104759296. Throughput: 0: 1720.8, 1: 1720.9. Samples: 26200800. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:48:03,804][19739] Avg episode reward: [(0, '732.360'), (1, '830.490')] +[2023-10-08 17:48:06,156][21195] Updated weights for policy 0, policy_version 51370 (0.0011) +[2023-10-08 17:48:06,520][21195] Updated weights for policy 0, policy_version 51380 (0.0011) +[2023-10-08 17:48:06,894][21195] Updated weights for policy 0, policy_version 51390 (0.0009) +[2023-10-08 17:48:07,703][21194] Updated weights for policy 1, policy_version 50980 (0.0009) +[2023-10-08 17:48:08,072][21194] Updated weights for policy 1, policy_version 50990 (0.0008) +[2023-10-08 17:48:08,439][21194] Updated weights for policy 1, policy_version 51000 (0.0007) +[2023-10-08 17:48:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 104857600. Throughput: 0: 1726.4, 1: 1727.5. Samples: 26216484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:48:08,803][19739] Avg episode reward: [(0, '689.150'), (1, '830.230')] +[2023-10-08 17:48:10,789][21195] Updated weights for policy 0, policy_version 51400 (0.0007) +[2023-10-08 17:48:11,158][21195] Updated weights for policy 0, policy_version 51410 (0.0007) +[2023-10-08 17:48:11,521][21195] Updated weights for policy 0, policy_version 51420 (0.0007) +[2023-10-08 17:48:12,348][21194] Updated weights for policy 1, policy_version 51010 (0.0009) +[2023-10-08 17:48:12,722][21194] Updated weights for policy 1, policy_version 51020 (0.0008) +[2023-10-08 17:48:13,086][21194] Updated weights for policy 1, policy_version 51030 (0.0008) +[2023-10-08 17:48:13,464][21194] Updated weights for policy 1, policy_version 51040 (0.0008) +[2023-10-08 17:48:13,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 104923136. Throughput: 0: 1718.9, 1: 1708.3. Samples: 26237148. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:48:13,803][19739] Avg episode reward: [(0, '689.150'), (1, '830.230')] +[2023-10-08 17:48:15,523][21195] Updated weights for policy 0, policy_version 51430 (0.0009) +[2023-10-08 17:48:15,886][21195] Updated weights for policy 0, policy_version 51440 (0.0007) +[2023-10-08 17:48:16,257][21195] Updated weights for policy 0, policy_version 51450 (0.0010) +[2023-10-08 17:48:17,436][21194] Updated weights for policy 1, policy_version 51050 (0.0007) +[2023-10-08 17:48:17,814][21194] Updated weights for policy 1, policy_version 51060 (0.0007) +[2023-10-08 17:48:18,178][21194] Updated weights for policy 1, policy_version 51070 (0.0011) +[2023-10-08 17:48:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 104988672. Throughput: 0: 1741.8, 1: 1731.9. Samples: 26253516. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:48:18,803][19739] Avg episode reward: [(0, '674.520'), (1, '830.230')] +[2023-10-08 17:48:20,114][21195] Updated weights for policy 0, policy_version 51460 (0.0009) +[2023-10-08 17:48:20,482][21195] Updated weights for policy 0, policy_version 51470 (0.0008) +[2023-10-08 17:48:20,854][21195] Updated weights for policy 0, policy_version 51480 (0.0008) +[2023-10-08 17:48:21,967][21194] Updated weights for policy 1, policy_version 51080 (0.0010) +[2023-10-08 17:48:22,329][21194] Updated weights for policy 1, policy_version 51090 (0.0008) +[2023-10-08 17:48:22,711][21194] Updated weights for policy 1, policy_version 51100 (0.0007) +[2023-10-08 17:48:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 105054208. Throughput: 0: 1720.4, 1: 1724.4. Samples: 26268520. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:48:23,803][19739] Avg episode reward: [(0, '630.400'), (1, '830.230')] +[2023-10-08 17:48:24,740][21195] Updated weights for policy 0, policy_version 51490 (0.0007) +[2023-10-08 17:48:25,112][21195] Updated weights for policy 0, policy_version 51500 (0.0008) +[2023-10-08 17:48:25,480][21195] Updated weights for policy 0, policy_version 51510 (0.0010) +[2023-10-08 17:48:25,850][21195] Updated weights for policy 0, policy_version 51520 (0.0007) +[2023-10-08 17:48:26,595][21194] Updated weights for policy 1, policy_version 51110 (0.0007) +[2023-10-08 17:48:26,964][21194] Updated weights for policy 1, policy_version 51120 (0.0007) +[2023-10-08 17:48:27,326][21194] Updated weights for policy 1, policy_version 51130 (0.0007) +[2023-10-08 17:48:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 105119744. Throughput: 0: 1732.6, 1: 1701.3. Samples: 26288838. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:48:28,803][19739] Avg episode reward: [(0, '630.400'), (1, '845.380')] +[2023-10-08 17:48:29,907][21195] Updated weights for policy 0, policy_version 51530 (0.0007) +[2023-10-08 17:48:30,271][21195] Updated weights for policy 0, policy_version 51540 (0.0008) +[2023-10-08 17:48:30,637][21195] Updated weights for policy 0, policy_version 51550 (0.0008) +[2023-10-08 17:48:31,326][21194] Updated weights for policy 1, policy_version 51140 (0.0009) +[2023-10-08 17:48:31,699][21194] Updated weights for policy 1, policy_version 51150 (0.0009) +[2023-10-08 17:48:32,068][21194] Updated weights for policy 1, policy_version 51160 (0.0011) +[2023-10-08 17:48:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 105185280. Throughput: 0: 1745.9, 1: 1737.2. Samples: 26305440. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:48:33,803][19739] Avg episode reward: [(0, '630.400'), (1, '845.380')] +[2023-10-08 17:48:34,608][21195] Updated weights for policy 0, policy_version 51560 (0.0008) +[2023-10-08 17:48:34,976][21195] Updated weights for policy 0, policy_version 51570 (0.0008) +[2023-10-08 17:48:35,343][21195] Updated weights for policy 0, policy_version 51580 (0.0007) +[2023-10-08 17:48:35,906][21194] Updated weights for policy 1, policy_version 51170 (0.0011) +[2023-10-08 17:48:36,259][21194] Updated weights for policy 1, policy_version 51180 (0.0010) +[2023-10-08 17:48:36,630][21194] Updated weights for policy 1, policy_version 51190 (0.0011) +[2023-10-08 17:48:36,999][21194] Updated weights for policy 1, policy_version 51200 (0.0010) +[2023-10-08 17:48:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 105250816. Throughput: 0: 1712.7, 1: 1710.9. Samples: 26319372. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:48:38,803][19739] Avg episode reward: [(0, '630.400'), (1, '845.380')] +[2023-10-08 17:48:39,304][21195] Updated weights for policy 0, policy_version 51590 (0.0009) +[2023-10-08 17:48:39,683][21195] Updated weights for policy 0, policy_version 51600 (0.0008) +[2023-10-08 17:48:40,052][21195] Updated weights for policy 0, policy_version 51610 (0.0008) +[2023-10-08 17:48:40,926][21194] Updated weights for policy 1, policy_version 51210 (0.0009) +[2023-10-08 17:48:41,294][21194] Updated weights for policy 1, policy_version 51220 (0.0008) +[2023-10-08 17:48:41,667][21194] Updated weights for policy 1, policy_version 51230 (0.0009) +[2023-10-08 17:48:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 105316352. Throughput: 0: 1740.5, 1: 1709.9. Samples: 26340614. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:48:43,803][19739] Avg episode reward: [(0, '630.400'), (1, '845.380')] +[2023-10-08 17:48:43,881][21195] Updated weights for policy 0, policy_version 51620 (0.0008) +[2023-10-08 17:48:44,251][21195] Updated weights for policy 0, policy_version 51630 (0.0008) +[2023-10-08 17:48:44,610][21195] Updated weights for policy 0, policy_version 51640 (0.0007) +[2023-10-08 17:48:45,651][21194] Updated weights for policy 1, policy_version 51240 (0.0008) +[2023-10-08 17:48:46,010][21194] Updated weights for policy 1, policy_version 51250 (0.0009) +[2023-10-08 17:48:46,377][21194] Updated weights for policy 1, policy_version 51260 (0.0007) +[2023-10-08 17:48:48,331][21195] Updated weights for policy 0, policy_version 51650 (0.0008) +[2023-10-08 17:48:48,701][21195] Updated weights for policy 0, policy_version 51660 (0.0007) +[2023-10-08 17:48:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 105381888. Throughput: 0: 1733.5, 1: 1724.8. Samples: 26356424. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:48:48,803][19739] Avg episode reward: [(0, '630.400'), (1, '845.380')] +[2023-10-08 17:48:49,071][21195] Updated weights for policy 0, policy_version 51670 (0.0007) +[2023-10-08 17:48:49,430][21195] Updated weights for policy 0, policy_version 51680 (0.0007) +[2023-10-08 17:48:50,311][21194] Updated weights for policy 1, policy_version 51270 (0.0008) +[2023-10-08 17:48:50,684][21194] Updated weights for policy 1, policy_version 51280 (0.0008) +[2023-10-08 17:48:51,044][21194] Updated weights for policy 1, policy_version 51290 (0.0009) +[2023-10-08 17:48:53,427][21195] Updated weights for policy 0, policy_version 51690 (0.0010) +[2023-10-08 17:48:53,789][21195] Updated weights for policy 0, policy_version 51700 (0.0011) +[2023-10-08 17:48:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 105447424. Throughput: 0: 1744.9, 1: 1710.2. Samples: 26371964. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 17:48:53,803][19739] Avg episode reward: [(0, '629.920'), (1, '845.380')] +[2023-10-08 17:48:54,155][21195] Updated weights for policy 0, policy_version 51710 (0.0010) +[2023-10-08 17:48:55,037][21194] Updated weights for policy 1, policy_version 51300 (0.0009) +[2023-10-08 17:48:55,403][21194] Updated weights for policy 1, policy_version 51310 (0.0009) +[2023-10-08 17:48:55,768][21194] Updated weights for policy 1, policy_version 51320 (0.0008) +[2023-10-08 17:48:57,913][21195] Updated weights for policy 0, policy_version 51720 (0.0008) +[2023-10-08 17:48:58,286][21195] Updated weights for policy 0, policy_version 51730 (0.0008) +[2023-10-08 17:48:58,654][21195] Updated weights for policy 0, policy_version 51740 (0.0009) +[2023-10-08 17:48:58,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 105545728. Throughput: 0: 1743.6, 1: 1724.9. Samples: 26393230. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:48:58,803][19739] Avg episode reward: [(0, '629.920'), (1, '860.090')] +[2023-10-08 17:48:59,786][21194] Updated weights for policy 1, policy_version 51330 (0.0009) +[2023-10-08 17:49:00,155][21194] Updated weights for policy 1, policy_version 51340 (0.0008) +[2023-10-08 17:49:00,513][21194] Updated weights for policy 1, policy_version 51350 (0.0009) +[2023-10-08 17:49:00,877][21194] Updated weights for policy 1, policy_version 51360 (0.0009) +[2023-10-08 17:49:02,544][21195] Updated weights for policy 0, policy_version 51750 (0.0008) +[2023-10-08 17:49:02,915][21195] Updated weights for policy 0, policy_version 51760 (0.0010) +[2023-10-08 17:49:03,279][21195] Updated weights for policy 0, policy_version 51770 (0.0009) +[2023-10-08 17:49:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 105611264. Throughput: 0: 1715.5, 1: 1705.3. Samples: 26407452. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:49:03,803][19739] Avg episode reward: [(0, '629.920'), (1, '860.090')] +[2023-10-08 17:49:04,970][21194] Updated weights for policy 1, policy_version 51370 (0.0007) +[2023-10-08 17:49:05,333][21194] Updated weights for policy 1, policy_version 51380 (0.0008) +[2023-10-08 17:49:05,701][21194] Updated weights for policy 1, policy_version 51390 (0.0009) +[2023-10-08 17:49:07,254][21195] Updated weights for policy 0, policy_version 51780 (0.0008) +[2023-10-08 17:49:07,628][21195] Updated weights for policy 0, policy_version 51790 (0.0008) +[2023-10-08 17:49:07,996][21195] Updated weights for policy 0, policy_version 51800 (0.0009) +[2023-10-08 17:49:08,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 105676800. Throughput: 0: 1745.6, 1: 1708.7. Samples: 26423964. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:49:08,804][19739] Avg episode reward: [(0, '629.920'), (1, '860.180')] +[2023-10-08 17:49:09,739][21194] Updated weights for policy 1, policy_version 51400 (0.0009) +[2023-10-08 17:49:10,104][21194] Updated weights for policy 1, policy_version 51410 (0.0009) +[2023-10-08 17:49:10,472][21194] Updated weights for policy 1, policy_version 51420 (0.0009) +[2023-10-08 17:49:11,932][21195] Updated weights for policy 0, policy_version 51810 (0.0008) +[2023-10-08 17:49:12,297][21195] Updated weights for policy 0, policy_version 51820 (0.0007) +[2023-10-08 17:49:12,677][21195] Updated weights for policy 0, policy_version 51830 (0.0007) +[2023-10-08 17:49:13,052][21195] Updated weights for policy 0, policy_version 51840 (0.0007) +[2023-10-08 17:49:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 105742336. Throughput: 0: 1725.2, 1: 1735.4. Samples: 26444562. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:49:13,803][19739] Avg episode reward: [(0, '629.920'), (1, '861.020')] +[2023-10-08 17:49:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000051840_53084160.pth... +[2023-10-08 17:49:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000051424_52658176.pth... +[2023-10-08 17:49:13,843][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000049824_51019776.pth +[2023-10-08 17:49:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000050208_51412992.pth +[2023-10-08 17:49:14,324][21194] Updated weights for policy 1, policy_version 51430 (0.0010) +[2023-10-08 17:49:14,696][21194] Updated weights for policy 1, policy_version 51440 (0.0007) +[2023-10-08 17:49:15,064][21194] Updated weights for policy 1, policy_version 51450 (0.0008) +[2023-10-08 17:49:16,923][21195] Updated weights for policy 0, policy_version 51850 (0.0007) +[2023-10-08 17:49:17,290][21195] Updated weights for policy 0, policy_version 51860 (0.0008) +[2023-10-08 17:49:17,654][21195] Updated weights for policy 0, policy_version 51870 (0.0009) +[2023-10-08 17:49:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 105807872. Throughput: 0: 1727.9, 1: 1702.6. Samples: 26459812. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:49:18,803][19739] Avg episode reward: [(0, '629.920'), (1, '861.020')] +[2023-10-08 17:49:18,867][21194] Updated weights for policy 1, policy_version 51460 (0.0008) +[2023-10-08 17:49:19,227][21194] Updated weights for policy 1, policy_version 51470 (0.0010) +[2023-10-08 17:49:19,595][21194] Updated weights for policy 1, policy_version 51480 (0.0008) +[2023-10-08 17:49:21,778][21195] Updated weights for policy 0, policy_version 51880 (0.0007) +[2023-10-08 17:49:22,146][21195] Updated weights for policy 0, policy_version 51890 (0.0007) +[2023-10-08 17:49:22,516][21195] Updated weights for policy 0, policy_version 51900 (0.0008) +[2023-10-08 17:49:23,605][21194] Updated weights for policy 1, policy_version 51490 (0.0008) +[2023-10-08 17:49:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 105873408. Throughput: 0: 1750.8, 1: 1732.5. Samples: 26476120. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:49:23,803][19739] Avg episode reward: [(0, '629.920'), (1, '861.020')] +[2023-10-08 17:49:23,970][21194] Updated weights for policy 1, policy_version 51500 (0.0008) +[2023-10-08 17:49:24,336][21194] Updated weights for policy 1, policy_version 51510 (0.0008) +[2023-10-08 17:49:24,701][21194] Updated weights for policy 1, policy_version 51520 (0.0007) +[2023-10-08 17:49:26,437][21195] Updated weights for policy 0, policy_version 51910 (0.0008) +[2023-10-08 17:49:26,800][21195] Updated weights for policy 0, policy_version 51920 (0.0007) +[2023-10-08 17:49:27,165][21195] Updated weights for policy 0, policy_version 51930 (0.0007) +[2023-10-08 17:49:28,443][21194] Updated weights for policy 1, policy_version 51530 (0.0007) +[2023-10-08 17:49:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 105938944. Throughput: 0: 1725.9, 1: 1746.5. Samples: 26496872. Policy #0 lag: (min: 1.0, avg: 17.7, max: 33.0) +[2023-10-08 17:49:28,803][19739] Avg episode reward: [(0, '629.920'), (1, '861.020')] +[2023-10-08 17:49:28,808][21194] Updated weights for policy 1, policy_version 51540 (0.0008) +[2023-10-08 17:49:29,170][21194] Updated weights for policy 1, policy_version 51550 (0.0008) +[2023-10-08 17:49:31,128][21195] Updated weights for policy 0, policy_version 51940 (0.0008) +[2023-10-08 17:49:31,487][21195] Updated weights for policy 0, policy_version 51950 (0.0007) +[2023-10-08 17:49:31,850][21195] Updated weights for policy 0, policy_version 51960 (0.0007) +[2023-10-08 17:49:33,013][21194] Updated weights for policy 1, policy_version 51560 (0.0008) +[2023-10-08 17:49:33,386][21194] Updated weights for policy 1, policy_version 51570 (0.0010) +[2023-10-08 17:49:33,750][21194] Updated weights for policy 1, policy_version 51580 (0.0007) +[2023-10-08 17:49:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 106004480. Throughput: 0: 1734.5, 1: 1736.1. Samples: 26512604. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:49:33,803][19739] Avg episode reward: [(0, '629.920'), (1, '861.020')] +[2023-10-08 17:49:35,641][21195] Updated weights for policy 0, policy_version 51970 (0.0008) +[2023-10-08 17:49:36,011][21195] Updated weights for policy 0, policy_version 51980 (0.0009) +[2023-10-08 17:49:36,385][21195] Updated weights for policy 0, policy_version 51990 (0.0008) +[2023-10-08 17:49:36,747][21195] Updated weights for policy 0, policy_version 52000 (0.0009) +[2023-10-08 17:49:37,730][21194] Updated weights for policy 1, policy_version 51590 (0.0009) +[2023-10-08 17:49:38,095][21194] Updated weights for policy 1, policy_version 51600 (0.0009) +[2023-10-08 17:49:38,468][21194] Updated weights for policy 1, policy_version 51610 (0.0008) +[2023-10-08 17:49:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 106102784. Throughput: 0: 1719.1, 1: 1751.2. Samples: 26528128. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:49:38,803][19739] Avg episode reward: [(0, '628.740'), (1, '891.210')] +[2023-10-08 17:49:40,758][21195] Updated weights for policy 0, policy_version 52010 (0.0009) +[2023-10-08 17:49:41,126][21195] Updated weights for policy 0, policy_version 52020 (0.0007) +[2023-10-08 17:49:41,500][21195] Updated weights for policy 0, policy_version 52030 (0.0008) +[2023-10-08 17:49:42,422][21194] Updated weights for policy 1, policy_version 51620 (0.0007) +[2023-10-08 17:49:42,781][21194] Updated weights for policy 1, policy_version 51630 (0.0007) +[2023-10-08 17:49:43,146][21194] Updated weights for policy 1, policy_version 51640 (0.0007) +[2023-10-08 17:49:43,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 106168320. Throughput: 0: 1720.1, 1: 1730.8. Samples: 26548522. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:49:43,803][19739] Avg episode reward: [(0, '628.740'), (1, '891.210')] +[2023-10-08 17:49:45,463][21195] Updated weights for policy 0, policy_version 52040 (0.0010) +[2023-10-08 17:49:45,839][21195] Updated weights for policy 0, policy_version 52050 (0.0011) +[2023-10-08 17:49:46,199][21195] Updated weights for policy 0, policy_version 52060 (0.0008) +[2023-10-08 17:49:47,231][21194] Updated weights for policy 1, policy_version 51650 (0.0008) +[2023-10-08 17:49:47,602][21194] Updated weights for policy 1, policy_version 51660 (0.0009) +[2023-10-08 17:49:47,969][21194] Updated weights for policy 1, policy_version 51670 (0.0009) +[2023-10-08 17:49:48,330][21194] Updated weights for policy 1, policy_version 51680 (0.0008) +[2023-10-08 17:49:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 106233856. Throughput: 0: 1743.1, 1: 1749.7. Samples: 26564628. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:49:48,803][19739] Avg episode reward: [(0, '628.740'), (1, '891.210')] +[2023-10-08 17:49:50,141][21195] Updated weights for policy 0, policy_version 52070 (0.0009) +[2023-10-08 17:49:50,506][21195] Updated weights for policy 0, policy_version 52080 (0.0010) +[2023-10-08 17:49:50,876][21195] Updated weights for policy 0, policy_version 52090 (0.0009) +[2023-10-08 17:49:52,470][21194] Updated weights for policy 1, policy_version 51690 (0.0009) +[2023-10-08 17:49:52,833][21194] Updated weights for policy 1, policy_version 51700 (0.0007) +[2023-10-08 17:49:53,199][21194] Updated weights for policy 1, policy_version 51710 (0.0008) +[2023-10-08 17:49:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 106299392. Throughput: 0: 1709.8, 1: 1751.2. Samples: 26579710. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:49:53,803][19739] Avg episode reward: [(0, '628.740'), (1, '891.210')] +[2023-10-08 17:49:54,913][21195] Updated weights for policy 0, policy_version 52100 (0.0009) +[2023-10-08 17:49:55,279][21195] Updated weights for policy 0, policy_version 52110 (0.0008) +[2023-10-08 17:49:55,654][21195] Updated weights for policy 0, policy_version 52120 (0.0008) +[2023-10-08 17:49:57,079][21194] Updated weights for policy 1, policy_version 51720 (0.0007) +[2023-10-08 17:49:57,448][21194] Updated weights for policy 1, policy_version 51730 (0.0007) +[2023-10-08 17:49:57,806][21194] Updated weights for policy 1, policy_version 51740 (0.0008) +[2023-10-08 17:49:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 106364928. Throughput: 0: 1729.5, 1: 1716.4. Samples: 26599626. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:49:58,804][19739] Avg episode reward: [(0, '628.740'), (1, '907.660')] +[2023-10-08 17:49:59,549][21195] Updated weights for policy 0, policy_version 52130 (0.0008) +[2023-10-08 17:49:59,912][21195] Updated weights for policy 0, policy_version 52140 (0.0007) +[2023-10-08 17:50:00,288][21195] Updated weights for policy 0, policy_version 52150 (0.0010) +[2023-10-08 17:50:00,641][21195] Updated weights for policy 0, policy_version 52160 (0.0010) +[2023-10-08 17:50:01,703][21194] Updated weights for policy 1, policy_version 51750 (0.0008) +[2023-10-08 17:50:02,078][21194] Updated weights for policy 1, policy_version 51760 (0.0007) +[2023-10-08 17:50:02,437][21194] Updated weights for policy 1, policy_version 51770 (0.0009) +[2023-10-08 17:50:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 106430464. Throughput: 0: 1733.4, 1: 1746.6. Samples: 26616412. Policy #0 lag: (min: 8.0, avg: 31.4, max: 40.0) +[2023-10-08 17:50:03,803][19739] Avg episode reward: [(0, '643.910'), (1, '908.630')] +[2023-10-08 17:50:04,579][21195] Updated weights for policy 0, policy_version 52170 (0.0010) +[2023-10-08 17:50:04,941][21195] Updated weights for policy 0, policy_version 52180 (0.0008) +[2023-10-08 17:50:05,309][21195] Updated weights for policy 0, policy_version 52190 (0.0010) +[2023-10-08 17:50:06,332][21194] Updated weights for policy 1, policy_version 51780 (0.0009) +[2023-10-08 17:50:06,706][21194] Updated weights for policy 1, policy_version 51790 (0.0008) +[2023-10-08 17:50:07,073][21194] Updated weights for policy 1, policy_version 51800 (0.0008) +[2023-10-08 17:50:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 106496000. Throughput: 0: 1712.4, 1: 1723.0. Samples: 26630712. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:08,803][19739] Avg episode reward: [(0, '643.910'), (1, '908.630')] +[2023-10-08 17:50:09,154][21195] Updated weights for policy 0, policy_version 52200 (0.0009) +[2023-10-08 17:50:09,528][21195] Updated weights for policy 0, policy_version 52210 (0.0009) +[2023-10-08 17:50:09,905][21195] Updated weights for policy 0, policy_version 52220 (0.0008) +[2023-10-08 17:50:10,964][21194] Updated weights for policy 1, policy_version 51810 (0.0009) +[2023-10-08 17:50:11,342][21194] Updated weights for policy 1, policy_version 51820 (0.0011) +[2023-10-08 17:50:11,705][21194] Updated weights for policy 1, policy_version 51830 (0.0011) +[2023-10-08 17:50:12,078][21194] Updated weights for policy 1, policy_version 51840 (0.0007) +[2023-10-08 17:50:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 106561536. Throughput: 0: 1736.3, 1: 1705.2. Samples: 26651738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:13,803][19739] Avg episode reward: [(0, '643.930'), (1, '908.630')] +[2023-10-08 17:50:13,818][21195] Updated weights for policy 0, policy_version 52230 (0.0009) +[2023-10-08 17:50:14,189][21195] Updated weights for policy 0, policy_version 52240 (0.0010) +[2023-10-08 17:50:14,558][21195] Updated weights for policy 0, policy_version 52250 (0.0008) +[2023-10-08 17:50:15,952][21194] Updated weights for policy 1, policy_version 51850 (0.0010) +[2023-10-08 17:50:16,319][21194] Updated weights for policy 1, policy_version 51860 (0.0009) +[2023-10-08 17:50:16,683][21194] Updated weights for policy 1, policy_version 51870 (0.0008) +[2023-10-08 17:50:18,515][21195] Updated weights for policy 0, policy_version 52260 (0.0009) +[2023-10-08 17:50:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 106627072. Throughput: 0: 1726.7, 1: 1718.6. Samples: 26667642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:18,803][19739] Avg episode reward: [(0, '643.930'), (1, '908.690')] +[2023-10-08 17:50:18,878][21195] Updated weights for policy 0, policy_version 52270 (0.0008) +[2023-10-08 17:50:19,251][21195] Updated weights for policy 0, policy_version 52280 (0.0009) +[2023-10-08 17:50:20,707][21194] Updated weights for policy 1, policy_version 51880 (0.0010) +[2023-10-08 17:50:21,080][21194] Updated weights for policy 1, policy_version 51890 (0.0008) +[2023-10-08 17:50:21,442][21194] Updated weights for policy 1, policy_version 51900 (0.0007) +[2023-10-08 17:50:23,180][21195] Updated weights for policy 0, policy_version 52290 (0.0008) +[2023-10-08 17:50:23,557][21195] Updated weights for policy 0, policy_version 52300 (0.0009) +[2023-10-08 17:50:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 106692608. Throughput: 0: 1735.8, 1: 1694.9. Samples: 26682510. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:23,803][19739] Avg episode reward: [(0, '643.930'), (1, '908.690')] +[2023-10-08 17:50:23,924][21195] Updated weights for policy 0, policy_version 52310 (0.0008) +[2023-10-08 17:50:24,292][21195] Updated weights for policy 0, policy_version 52320 (0.0007) +[2023-10-08 17:50:25,362][21194] Updated weights for policy 1, policy_version 51910 (0.0008) +[2023-10-08 17:50:25,722][21194] Updated weights for policy 1, policy_version 51920 (0.0009) +[2023-10-08 17:50:26,090][21194] Updated weights for policy 1, policy_version 51930 (0.0007) +[2023-10-08 17:50:28,099][21195] Updated weights for policy 0, policy_version 52330 (0.0010) +[2023-10-08 17:50:28,464][21195] Updated weights for policy 0, policy_version 52340 (0.0010) +[2023-10-08 17:50:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 106758144. Throughput: 0: 1738.4, 1: 1719.7. Samples: 26704136. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:28,803][19739] Avg episode reward: [(0, '643.930'), (1, '908.690')] +[2023-10-08 17:50:28,843][21195] Updated weights for policy 0, policy_version 52350 (0.0011) +[2023-10-08 17:50:29,949][21194] Updated weights for policy 1, policy_version 51940 (0.0008) +[2023-10-08 17:50:30,318][21194] Updated weights for policy 1, policy_version 51950 (0.0011) +[2023-10-08 17:50:30,690][21194] Updated weights for policy 1, policy_version 51960 (0.0009) +[2023-10-08 17:50:32,769][21195] Updated weights for policy 0, policy_version 52360 (0.0007) +[2023-10-08 17:50:33,134][21195] Updated weights for policy 0, policy_version 52370 (0.0008) +[2023-10-08 17:50:33,501][21195] Updated weights for policy 0, policy_version 52380 (0.0007) +[2023-10-08 17:50:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 106856448. Throughput: 0: 1713.5, 1: 1704.4. Samples: 26718434. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:33,803][19739] Avg episode reward: [(0, '643.930'), (1, '923.620')] +[2023-10-08 17:50:34,424][21194] Updated weights for policy 1, policy_version 51970 (0.0007) +[2023-10-08 17:50:34,788][21194] Updated weights for policy 1, policy_version 51980 (0.0007) +[2023-10-08 17:50:35,157][21194] Updated weights for policy 1, policy_version 51990 (0.0009) +[2023-10-08 17:50:35,517][21194] Updated weights for policy 1, policy_version 52000 (0.0010) +[2023-10-08 17:50:37,513][21195] Updated weights for policy 0, policy_version 52390 (0.0007) +[2023-10-08 17:50:37,891][21195] Updated weights for policy 0, policy_version 52400 (0.0008) +[2023-10-08 17:50:38,256][21195] Updated weights for policy 0, policy_version 52410 (0.0007) +[2023-10-08 17:50:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 106921984. Throughput: 0: 1745.0, 1: 1712.1. Samples: 26735280. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:50:38,803][19739] Avg episode reward: [(0, '643.930'), (1, '923.300')] +[2023-10-08 17:50:39,664][21194] Updated weights for policy 1, policy_version 52010 (0.0007) +[2023-10-08 17:50:40,035][21194] Updated weights for policy 1, policy_version 52020 (0.0009) +[2023-10-08 17:50:40,403][21194] Updated weights for policy 1, policy_version 52030 (0.0008) +[2023-10-08 17:50:42,030][21195] Updated weights for policy 0, policy_version 52420 (0.0007) +[2023-10-08 17:50:42,397][21195] Updated weights for policy 0, policy_version 52430 (0.0007) +[2023-10-08 17:50:42,776][21195] Updated weights for policy 0, policy_version 52440 (0.0007) +[2023-10-08 17:50:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 106987520. Throughput: 0: 1727.2, 1: 1744.5. Samples: 26755850. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:50:43,804][19739] Avg episode reward: [(0, '643.930'), (1, '923.300')] +[2023-10-08 17:50:44,293][21194] Updated weights for policy 1, policy_version 52040 (0.0008) +[2023-10-08 17:50:44,667][21194] Updated weights for policy 1, policy_version 52050 (0.0009) +[2023-10-08 17:50:45,029][21194] Updated weights for policy 1, policy_version 52060 (0.0007) +[2023-10-08 17:50:46,706][21195] Updated weights for policy 0, policy_version 52450 (0.0008) +[2023-10-08 17:50:47,073][21195] Updated weights for policy 0, policy_version 52460 (0.0009) +[2023-10-08 17:50:47,446][21195] Updated weights for policy 0, policy_version 52470 (0.0011) +[2023-10-08 17:50:47,817][21195] Updated weights for policy 0, policy_version 52480 (0.0010) +[2023-10-08 17:50:48,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 107053056. Throughput: 0: 1715.6, 1: 1715.5. Samples: 26770810. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:50:48,803][19739] Avg episode reward: [(0, '643.930'), (1, '923.480')] +[2023-10-08 17:50:48,922][21194] Updated weights for policy 1, policy_version 52070 (0.0008) +[2023-10-08 17:50:49,299][21194] Updated weights for policy 1, policy_version 52080 (0.0010) +[2023-10-08 17:50:49,665][21194] Updated weights for policy 1, policy_version 52090 (0.0010) +[2023-10-08 17:50:51,884][21195] Updated weights for policy 0, policy_version 52490 (0.0008) +[2023-10-08 17:50:52,251][21195] Updated weights for policy 0, policy_version 52500 (0.0007) +[2023-10-08 17:50:52,622][21195] Updated weights for policy 0, policy_version 52510 (0.0011) +[2023-10-08 17:50:53,409][21194] Updated weights for policy 1, policy_version 52100 (0.0007) +[2023-10-08 17:50:53,771][21194] Updated weights for policy 1, policy_version 52110 (0.0008) +[2023-10-08 17:50:53,802][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 107118592. Throughput: 0: 1739.6, 1: 1741.5. Samples: 26787364. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:50:53,803][19739] Avg episode reward: [(0, '643.930'), (1, '923.480')] +[2023-10-08 17:50:54,139][21194] Updated weights for policy 1, policy_version 52120 (0.0008) +[2023-10-08 17:50:56,476][21195] Updated weights for policy 0, policy_version 52520 (0.0010) +[2023-10-08 17:50:56,856][21195] Updated weights for policy 0, policy_version 52530 (0.0009) +[2023-10-08 17:50:57,219][21195] Updated weights for policy 0, policy_version 52540 (0.0008) +[2023-10-08 17:50:57,998][21194] Updated weights for policy 1, policy_version 52130 (0.0011) +[2023-10-08 17:50:58,370][21194] Updated weights for policy 1, policy_version 52140 (0.0007) +[2023-10-08 17:50:58,740][21194] Updated weights for policy 1, policy_version 52150 (0.0008) +[2023-10-08 17:50:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 107184128. Throughput: 0: 1717.7, 1: 1755.1. Samples: 26808012. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:50:58,803][19739] Avg episode reward: [(0, '643.930'), (1, '935.200')] +[2023-10-08 17:50:59,102][21194] Updated weights for policy 1, policy_version 52160 (0.0008) +[2023-10-08 17:51:01,099][21195] Updated weights for policy 0, policy_version 52550 (0.0010) +[2023-10-08 17:51:01,474][21195] Updated weights for policy 0, policy_version 52560 (0.0008) +[2023-10-08 17:51:01,841][21195] Updated weights for policy 0, policy_version 52570 (0.0011) +[2023-10-08 17:51:03,087][21194] Updated weights for policy 1, policy_version 52170 (0.0011) +[2023-10-08 17:51:03,457][21194] Updated weights for policy 1, policy_version 52180 (0.0012) +[2023-10-08 17:51:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 107249664. Throughput: 0: 1727.5, 1: 1738.3. Samples: 26823602. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:51:03,803][19739] Avg episode reward: [(0, '643.930'), (1, '935.200')] +[2023-10-08 17:51:03,835][21194] Updated weights for policy 1, policy_version 52190 (0.0009) +[2023-10-08 17:51:05,760][21195] Updated weights for policy 0, policy_version 52580 (0.0009) +[2023-10-08 17:51:06,123][21195] Updated weights for policy 0, policy_version 52590 (0.0008) +[2023-10-08 17:51:06,507][21195] Updated weights for policy 0, policy_version 52600 (0.0008) +[2023-10-08 17:51:07,758][21194] Updated weights for policy 1, policy_version 52200 (0.0008) +[2023-10-08 17:51:08,114][21194] Updated weights for policy 1, policy_version 52210 (0.0008) +[2023-10-08 17:51:08,477][21194] Updated weights for policy 1, policy_version 52220 (0.0008) +[2023-10-08 17:51:08,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 107347968. Throughput: 0: 1720.2, 1: 1762.2. Samples: 26839218. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:51:08,803][19739] Avg episode reward: [(0, '613.520'), (1, '944.710')] +[2023-10-08 17:51:10,393][21195] Updated weights for policy 0, policy_version 52610 (0.0008) +[2023-10-08 17:51:10,763][21195] Updated weights for policy 0, policy_version 52620 (0.0009) +[2023-10-08 17:51:11,129][21195] Updated weights for policy 0, policy_version 52630 (0.0010) +[2023-10-08 17:51:11,501][21195] Updated weights for policy 0, policy_version 52640 (0.0008) +[2023-10-08 17:51:12,524][21194] Updated weights for policy 1, policy_version 52230 (0.0008) +[2023-10-08 17:51:12,892][21194] Updated weights for policy 1, policy_version 52240 (0.0007) +[2023-10-08 17:51:13,268][21194] Updated weights for policy 1, policy_version 52250 (0.0007) +[2023-10-08 17:51:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 107413504. Throughput: 0: 1722.8, 1: 1741.1. Samples: 26860010. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:51:13,803][19739] Avg episode reward: [(0, '584.120'), (1, '944.710')] +[2023-10-08 17:51:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000052640_53903360.pth... +[2023-10-08 17:51:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000052256_53510144.pth... +[2023-10-08 17:51:13,850][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000051040_52264960.pth +[2023-10-08 17:51:13,858][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000050624_51838976.pth +[2023-10-08 17:51:15,322][21195] Updated weights for policy 0, policy_version 52650 (0.0009) +[2023-10-08 17:51:15,695][21195] Updated weights for policy 0, policy_version 52660 (0.0009) +[2023-10-08 17:51:16,066][21195] Updated weights for policy 0, policy_version 52670 (0.0007) +[2023-10-08 17:51:17,237][21194] Updated weights for policy 1, policy_version 52260 (0.0009) +[2023-10-08 17:51:17,602][21194] Updated weights for policy 1, policy_version 52270 (0.0009) +[2023-10-08 17:51:17,955][21194] Updated weights for policy 1, policy_version 52280 (0.0008) +[2023-10-08 17:51:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 107479040. Throughput: 0: 1757.5, 1: 1754.8. Samples: 26876488. Policy #0 lag: (min: 31.0, avg: 54.0, max: 56.0) +[2023-10-08 17:51:18,803][19739] Avg episode reward: [(0, '584.120'), (1, '944.710')] +[2023-10-08 17:51:19,935][21195] Updated weights for policy 0, policy_version 52680 (0.0008) +[2023-10-08 17:51:20,295][21195] Updated weights for policy 0, policy_version 52690 (0.0008) +[2023-10-08 17:51:20,665][21195] Updated weights for policy 0, policy_version 52700 (0.0009) +[2023-10-08 17:51:21,894][21194] Updated weights for policy 1, policy_version 52290 (0.0008) +[2023-10-08 17:51:22,255][21194] Updated weights for policy 1, policy_version 52300 (0.0010) +[2023-10-08 17:51:22,627][21194] Updated weights for policy 1, policy_version 52310 (0.0010) +[2023-10-08 17:51:23,003][21194] Updated weights for policy 1, policy_version 52320 (0.0010) +[2023-10-08 17:51:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 107544576. Throughput: 0: 1730.0, 1: 1746.7. Samples: 26891734. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:23,803][19739] Avg episode reward: [(0, '584.120'), (1, '944.710')] +[2023-10-08 17:51:24,438][21195] Updated weights for policy 0, policy_version 52710 (0.0009) +[2023-10-08 17:51:24,810][21195] Updated weights for policy 0, policy_version 52720 (0.0010) +[2023-10-08 17:51:25,173][21195] Updated weights for policy 0, policy_version 52730 (0.0010) +[2023-10-08 17:51:27,110][21194] Updated weights for policy 1, policy_version 52330 (0.0009) +[2023-10-08 17:51:27,474][21194] Updated weights for policy 1, policy_version 52340 (0.0010) +[2023-10-08 17:51:27,845][21194] Updated weights for policy 1, policy_version 52350 (0.0008) +[2023-10-08 17:51:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 107610112. Throughput: 0: 1758.9, 1: 1717.8. Samples: 26912298. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:28,803][19739] Avg episode reward: [(0, '614.150'), (1, '944.710')] +[2023-10-08 17:51:29,174][21195] Updated weights for policy 0, policy_version 52740 (0.0008) +[2023-10-08 17:51:29,544][21195] Updated weights for policy 0, policy_version 52750 (0.0007) +[2023-10-08 17:51:29,910][21195] Updated weights for policy 0, policy_version 52760 (0.0007) +[2023-10-08 17:51:31,861][21194] Updated weights for policy 1, policy_version 52360 (0.0007) +[2023-10-08 17:51:32,221][21194] Updated weights for policy 1, policy_version 52370 (0.0007) +[2023-10-08 17:51:32,595][21194] Updated weights for policy 1, policy_version 52380 (0.0007) +[2023-10-08 17:51:33,647][21195] Updated weights for policy 0, policy_version 52770 (0.0008) +[2023-10-08 17:51:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 107675648. Throughput: 0: 1769.0, 1: 1741.3. Samples: 26928776. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:33,803][19739] Avg episode reward: [(0, '614.150'), (1, '946.390')] +[2023-10-08 17:51:34,016][21195] Updated weights for policy 0, policy_version 52780 (0.0008) +[2023-10-08 17:51:34,390][21195] Updated weights for policy 0, policy_version 52790 (0.0008) +[2023-10-08 17:51:34,762][21195] Updated weights for policy 0, policy_version 52800 (0.0008) +[2023-10-08 17:51:36,458][21194] Updated weights for policy 1, policy_version 52390 (0.0007) +[2023-10-08 17:51:36,822][21194] Updated weights for policy 1, policy_version 52400 (0.0008) +[2023-10-08 17:51:37,190][21194] Updated weights for policy 1, policy_version 52410 (0.0008) +[2023-10-08 17:51:38,534][21195] Updated weights for policy 0, policy_version 52810 (0.0008) +[2023-10-08 17:51:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 107741184. Throughput: 0: 1751.5, 1: 1720.1. Samples: 26943586. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:38,803][19739] Avg episode reward: [(0, '629.230'), (1, '946.470')] +[2023-10-08 17:51:38,902][21195] Updated weights for policy 0, policy_version 52820 (0.0008) +[2023-10-08 17:51:39,268][21195] Updated weights for policy 0, policy_version 52830 (0.0009) +[2023-10-08 17:51:41,234][21194] Updated weights for policy 1, policy_version 52420 (0.0008) +[2023-10-08 17:51:41,605][21194] Updated weights for policy 1, policy_version 52430 (0.0009) +[2023-10-08 17:51:41,984][21194] Updated weights for policy 1, policy_version 52440 (0.0010) +[2023-10-08 17:51:43,388][21195] Updated weights for policy 0, policy_version 52840 (0.0010) +[2023-10-08 17:51:43,752][21195] Updated weights for policy 0, policy_version 52850 (0.0010) +[2023-10-08 17:51:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 107806720. Throughput: 0: 1772.6, 1: 1701.6. Samples: 26964348. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:43,803][19739] Avg episode reward: [(0, '629.230'), (1, '946.470')] +[2023-10-08 17:51:44,119][21195] Updated weights for policy 0, policy_version 52860 (0.0009) +[2023-10-08 17:51:45,692][21194] Updated weights for policy 1, policy_version 52450 (0.0008) +[2023-10-08 17:51:46,057][21194] Updated weights for policy 1, policy_version 52460 (0.0009) +[2023-10-08 17:51:46,425][21194] Updated weights for policy 1, policy_version 52470 (0.0009) +[2023-10-08 17:51:46,792][21194] Updated weights for policy 1, policy_version 52480 (0.0009) +[2023-10-08 17:51:48,025][21195] Updated weights for policy 0, policy_version 52870 (0.0009) +[2023-10-08 17:51:48,396][21195] Updated weights for policy 0, policy_version 52880 (0.0009) +[2023-10-08 17:51:48,766][21195] Updated weights for policy 0, policy_version 52890 (0.0008) +[2023-10-08 17:51:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 107872256. Throughput: 0: 1743.6, 1: 1721.1. Samples: 26979512. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:48,803][19739] Avg episode reward: [(0, '629.230'), (1, '946.470')] +[2023-10-08 17:51:50,675][21194] Updated weights for policy 1, policy_version 52490 (0.0008) +[2023-10-08 17:51:51,048][21194] Updated weights for policy 1, policy_version 52500 (0.0007) +[2023-10-08 17:51:51,417][21194] Updated weights for policy 1, policy_version 52510 (0.0008) +[2023-10-08 17:51:52,743][21195] Updated weights for policy 0, policy_version 52900 (0.0008) +[2023-10-08 17:51:53,117][21195] Updated weights for policy 0, policy_version 52910 (0.0007) +[2023-10-08 17:51:53,489][21195] Updated weights for policy 0, policy_version 52920 (0.0008) +[2023-10-08 17:51:53,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 107970560. Throughput: 0: 1763.5, 1: 1698.3. Samples: 26995000. Policy #0 lag: (min: 31.0, avg: 31.6, max: 49.0) +[2023-10-08 17:51:53,803][19739] Avg episode reward: [(0, '657.190'), (1, '946.470')] +[2023-10-08 17:51:55,396][21194] Updated weights for policy 1, policy_version 52520 (0.0008) +[2023-10-08 17:51:55,750][21194] Updated weights for policy 1, policy_version 52530 (0.0009) +[2023-10-08 17:51:56,120][21194] Updated weights for policy 1, policy_version 52540 (0.0008) +[2023-10-08 17:51:57,402][21195] Updated weights for policy 0, policy_version 52930 (0.0008) +[2023-10-08 17:51:57,767][21195] Updated weights for policy 0, policy_version 52940 (0.0007) +[2023-10-08 17:51:58,129][21195] Updated weights for policy 0, policy_version 52950 (0.0008) +[2023-10-08 17:51:58,504][21195] Updated weights for policy 0, policy_version 52960 (0.0009) +[2023-10-08 17:51:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 108036096. Throughput: 0: 1746.7, 1: 1717.9. Samples: 27015916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:51:58,803][19739] Avg episode reward: [(0, '657.170'), (1, '946.470')] +[2023-10-08 17:52:00,012][21194] Updated weights for policy 1, policy_version 52550 (0.0007) +[2023-10-08 17:52:00,374][21194] Updated weights for policy 1, policy_version 52560 (0.0008) +[2023-10-08 17:52:00,751][21194] Updated weights for policy 1, policy_version 52570 (0.0007) +[2023-10-08 17:52:02,298][21195] Updated weights for policy 0, policy_version 52970 (0.0009) +[2023-10-08 17:52:02,668][21195] Updated weights for policy 0, policy_version 52980 (0.0011) +[2023-10-08 17:52:03,033][21195] Updated weights for policy 0, policy_version 52990 (0.0010) +[2023-10-08 17:52:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 108101632. Throughput: 0: 1720.2, 1: 1699.8. Samples: 27030388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:03,804][19739] Avg episode reward: [(0, '657.170'), (1, '946.470')] +[2023-10-08 17:52:04,853][21194] Updated weights for policy 1, policy_version 52580 (0.0008) +[2023-10-08 17:52:05,213][21194] Updated weights for policy 1, policy_version 52590 (0.0008) +[2023-10-08 17:52:05,579][21194] Updated weights for policy 1, policy_version 52600 (0.0010) +[2023-10-08 17:52:07,009][21195] Updated weights for policy 0, policy_version 53000 (0.0009) +[2023-10-08 17:52:07,378][21195] Updated weights for policy 0, policy_version 53010 (0.0008) +[2023-10-08 17:52:07,757][21195] Updated weights for policy 0, policy_version 53020 (0.0010) +[2023-10-08 17:52:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 108167168. Throughput: 0: 1748.1, 1: 1704.8. Samples: 27047116. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:08,803][19739] Avg episode reward: [(0, '657.170'), (1, '946.470')] +[2023-10-08 17:52:09,367][21194] Updated weights for policy 1, policy_version 52610 (0.0008) +[2023-10-08 17:52:09,751][21194] Updated weights for policy 1, policy_version 52620 (0.0009) +[2023-10-08 17:52:10,120][21194] Updated weights for policy 1, policy_version 52630 (0.0009) +[2023-10-08 17:52:10,494][21194] Updated weights for policy 1, policy_version 52640 (0.0009) +[2023-10-08 17:52:11,629][21195] Updated weights for policy 0, policy_version 53030 (0.0009) +[2023-10-08 17:52:11,998][21195] Updated weights for policy 0, policy_version 53040 (0.0008) +[2023-10-08 17:52:12,375][21195] Updated weights for policy 0, policy_version 53050 (0.0009) +[2023-10-08 17:52:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 108232704. Throughput: 0: 1714.1, 1: 1734.0. Samples: 27067464. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:13,803][19739] Avg episode reward: [(0, '657.170'), (1, '946.470')] +[2023-10-08 17:52:14,474][21194] Updated weights for policy 1, policy_version 52650 (0.0009) +[2023-10-08 17:52:14,848][21194] Updated weights for policy 1, policy_version 52660 (0.0009) +[2023-10-08 17:52:15,211][21194] Updated weights for policy 1, policy_version 52670 (0.0008) +[2023-10-08 17:52:16,355][21195] Updated weights for policy 0, policy_version 53060 (0.0008) +[2023-10-08 17:52:16,723][21195] Updated weights for policy 0, policy_version 53070 (0.0007) +[2023-10-08 17:52:17,087][21195] Updated weights for policy 0, policy_version 53080 (0.0007) +[2023-10-08 17:52:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 108298240. Throughput: 0: 1715.1, 1: 1706.3. Samples: 27082738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:18,803][19739] Avg episode reward: [(0, '657.170'), (1, '949.420')] +[2023-10-08 17:52:19,229][21194] Updated weights for policy 1, policy_version 52680 (0.0008) +[2023-10-08 17:52:19,592][21194] Updated weights for policy 1, policy_version 52690 (0.0008) +[2023-10-08 17:52:19,973][21194] Updated weights for policy 1, policy_version 52700 (0.0009) +[2023-10-08 17:52:21,070][21195] Updated weights for policy 0, policy_version 53090 (0.0008) +[2023-10-08 17:52:21,439][21195] Updated weights for policy 0, policy_version 53100 (0.0010) +[2023-10-08 17:52:21,817][21195] Updated weights for policy 0, policy_version 53110 (0.0008) +[2023-10-08 17:52:22,176][21195] Updated weights for policy 0, policy_version 53120 (0.0009) +[2023-10-08 17:52:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 108363776. Throughput: 0: 1715.2, 1: 1720.3. Samples: 27098184. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:23,803][19739] Avg episode reward: [(0, '656.800'), (1, '949.420')] +[2023-10-08 17:52:24,014][21194] Updated weights for policy 1, policy_version 52710 (0.0007) +[2023-10-08 17:52:24,384][21194] Updated weights for policy 1, policy_version 52720 (0.0009) +[2023-10-08 17:52:24,756][21194] Updated weights for policy 1, policy_version 52730 (0.0008) +[2023-10-08 17:52:26,053][21195] Updated weights for policy 0, policy_version 53130 (0.0007) +[2023-10-08 17:52:26,419][21195] Updated weights for policy 0, policy_version 53140 (0.0007) +[2023-10-08 17:52:26,787][21195] Updated weights for policy 0, policy_version 53150 (0.0009) +[2023-10-08 17:52:28,771][21194] Updated weights for policy 1, policy_version 52740 (0.0010) +[2023-10-08 17:52:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 108429312. Throughput: 0: 1706.2, 1: 1731.3. Samples: 27119034. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:28,803][19739] Avg episode reward: [(0, '671.280'), (1, '949.420')] +[2023-10-08 17:52:29,137][21194] Updated weights for policy 1, policy_version 52750 (0.0012) +[2023-10-08 17:52:29,500][21194] Updated weights for policy 1, policy_version 52760 (0.0011) +[2023-10-08 17:52:30,816][21195] Updated weights for policy 0, policy_version 53160 (0.0009) +[2023-10-08 17:52:31,190][21195] Updated weights for policy 0, policy_version 53170 (0.0009) +[2023-10-08 17:52:31,562][21195] Updated weights for policy 0, policy_version 53180 (0.0008) +[2023-10-08 17:52:33,622][21194] Updated weights for policy 1, policy_version 52770 (0.0009) +[2023-10-08 17:52:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 108494848. Throughput: 0: 1732.8, 1: 1707.2. Samples: 27134314. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:33,803][19739] Avg episode reward: [(0, '671.420'), (1, '949.610')] +[2023-10-08 17:52:33,987][21194] Updated weights for policy 1, policy_version 52780 (0.0009) +[2023-10-08 17:52:34,353][21194] Updated weights for policy 1, policy_version 52790 (0.0011) +[2023-10-08 17:52:34,717][21194] Updated weights for policy 1, policy_version 52800 (0.0008) +[2023-10-08 17:52:35,545][21195] Updated weights for policy 0, policy_version 53190 (0.0008) +[2023-10-08 17:52:35,921][21195] Updated weights for policy 0, policy_version 53200 (0.0007) +[2023-10-08 17:52:36,291][21195] Updated weights for policy 0, policy_version 53210 (0.0007) +[2023-10-08 17:52:38,631][21194] Updated weights for policy 1, policy_version 52810 (0.0009) +[2023-10-08 17:52:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 108560384. Throughput: 0: 1711.0, 1: 1728.9. Samples: 27149796. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:38,803][19739] Avg episode reward: [(0, '671.420'), (1, '939.340')] +[2023-10-08 17:52:38,991][21194] Updated weights for policy 1, policy_version 52820 (0.0009) +[2023-10-08 17:52:39,367][21194] Updated weights for policy 1, policy_version 52830 (0.0009) +[2023-10-08 17:52:40,344][21195] Updated weights for policy 0, policy_version 53220 (0.0007) +[2023-10-08 17:52:40,717][21195] Updated weights for policy 0, policy_version 53230 (0.0008) +[2023-10-08 17:52:41,090][21195] Updated weights for policy 0, policy_version 53240 (0.0009) +[2023-10-08 17:52:43,195][21194] Updated weights for policy 1, policy_version 52840 (0.0008) +[2023-10-08 17:52:43,558][21194] Updated weights for policy 1, policy_version 52850 (0.0009) +[2023-10-08 17:52:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 108625920. Throughput: 0: 1723.1, 1: 1725.2. Samples: 27171088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:43,803][19739] Avg episode reward: [(0, '671.420'), (1, '939.340')] +[2023-10-08 17:52:43,921][21194] Updated weights for policy 1, policy_version 52860 (0.0009) +[2023-10-08 17:52:44,891][21195] Updated weights for policy 0, policy_version 53250 (0.0009) +[2023-10-08 17:52:45,254][21195] Updated weights for policy 0, policy_version 53260 (0.0009) +[2023-10-08 17:52:45,633][21195] Updated weights for policy 0, policy_version 53270 (0.0009) +[2023-10-08 17:52:45,995][21195] Updated weights for policy 0, policy_version 53280 (0.0008) +[2023-10-08 17:52:47,721][21194] Updated weights for policy 1, policy_version 52870 (0.0011) +[2023-10-08 17:52:48,090][21194] Updated weights for policy 1, policy_version 52880 (0.0010) +[2023-10-08 17:52:48,454][21194] Updated weights for policy 1, policy_version 52890 (0.0011) +[2023-10-08 17:52:48,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 108724224. Throughput: 0: 1743.9, 1: 1735.6. Samples: 27186964. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:48,803][19739] Avg episode reward: [(0, '671.420'), (1, '939.340')] +[2023-10-08 17:52:49,908][21195] Updated weights for policy 0, policy_version 53290 (0.0008) +[2023-10-08 17:52:50,279][21195] Updated weights for policy 0, policy_version 53300 (0.0008) +[2023-10-08 17:52:50,652][21195] Updated weights for policy 0, policy_version 53310 (0.0009) +[2023-10-08 17:52:52,454][21194] Updated weights for policy 1, policy_version 52900 (0.0008) +[2023-10-08 17:52:52,823][21194] Updated weights for policy 1, policy_version 52910 (0.0008) +[2023-10-08 17:52:53,190][21194] Updated weights for policy 1, policy_version 52920 (0.0007) +[2023-10-08 17:52:53,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 108789760. Throughput: 0: 1715.6, 1: 1730.9. Samples: 27202208. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:53,803][19739] Avg episode reward: [(0, '671.420'), (1, '939.340')] +[2023-10-08 17:52:54,511][21195] Updated weights for policy 0, policy_version 53320 (0.0008) +[2023-10-08 17:52:54,880][21195] Updated weights for policy 0, policy_version 53330 (0.0007) +[2023-10-08 17:52:55,252][21195] Updated weights for policy 0, policy_version 53340 (0.0008) +[2023-10-08 17:52:57,250][21194] Updated weights for policy 1, policy_version 52930 (0.0008) +[2023-10-08 17:52:57,629][21194] Updated weights for policy 1, policy_version 52940 (0.0008) +[2023-10-08 17:52:57,996][21194] Updated weights for policy 1, policy_version 52950 (0.0008) +[2023-10-08 17:52:58,360][21194] Updated weights for policy 1, policy_version 52960 (0.0007) +[2023-10-08 17:52:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 108855296. Throughput: 0: 1743.4, 1: 1702.4. Samples: 27222528. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:52:58,803][19739] Avg episode reward: [(0, '671.590'), (1, '939.340')] +[2023-10-08 17:52:59,189][21195] Updated weights for policy 0, policy_version 53350 (0.0009) +[2023-10-08 17:52:59,558][21195] Updated weights for policy 0, policy_version 53360 (0.0009) +[2023-10-08 17:52:59,925][21195] Updated weights for policy 0, policy_version 53370 (0.0007) +[2023-10-08 17:53:02,430][21194] Updated weights for policy 1, policy_version 52970 (0.0009) +[2023-10-08 17:53:02,797][21194] Updated weights for policy 1, policy_version 52980 (0.0007) +[2023-10-08 17:53:03,158][21194] Updated weights for policy 1, policy_version 52990 (0.0008) +[2023-10-08 17:53:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 108920832. Throughput: 0: 1743.0, 1: 1724.4. Samples: 27238770. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:53:03,804][19739] Avg episode reward: [(0, '671.730'), (1, '939.340')] +[2023-10-08 17:53:03,940][21195] Updated weights for policy 0, policy_version 53380 (0.0010) +[2023-10-08 17:53:04,309][21195] Updated weights for policy 0, policy_version 53390 (0.0009) +[2023-10-08 17:53:04,673][21195] Updated weights for policy 0, policy_version 53400 (0.0009) +[2023-10-08 17:53:07,064][21194] Updated weights for policy 1, policy_version 53000 (0.0007) +[2023-10-08 17:53:07,425][21194] Updated weights for policy 1, policy_version 53010 (0.0007) +[2023-10-08 17:53:07,799][21194] Updated weights for policy 1, policy_version 53020 (0.0010) +[2023-10-08 17:53:08,465][21195] Updated weights for policy 0, policy_version 53410 (0.0010) +[2023-10-08 17:53:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 108986368. Throughput: 0: 1738.6, 1: 1722.1. Samples: 27253914. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:53:08,803][19739] Avg episode reward: [(0, '671.730'), (1, '939.340')] +[2023-10-08 17:53:08,838][21195] Updated weights for policy 0, policy_version 53420 (0.0007) +[2023-10-08 17:53:09,200][21195] Updated weights for policy 0, policy_version 53430 (0.0007) +[2023-10-08 17:53:09,572][21195] Updated weights for policy 0, policy_version 53440 (0.0008) +[2023-10-08 17:53:11,844][21194] Updated weights for policy 1, policy_version 53030 (0.0010) +[2023-10-08 17:53:12,206][21194] Updated weights for policy 1, policy_version 53040 (0.0009) +[2023-10-08 17:53:12,566][21194] Updated weights for policy 1, policy_version 53050 (0.0007) +[2023-10-08 17:53:13,208][21195] Updated weights for policy 0, policy_version 53450 (0.0007) +[2023-10-08 17:53:13,581][21195] Updated weights for policy 0, policy_version 53460 (0.0007) +[2023-10-08 17:53:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 109051904. Throughput: 0: 1756.6, 1: 1701.7. Samples: 27274658. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:53:13,803][19739] Avg episode reward: [(0, '656.930'), (1, '952.000')] +[2023-10-08 17:53:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000053056_54329344.pth... +[2023-10-08 17:53:13,850][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000051424_52658176.pth +[2023-10-08 17:53:13,942][21195] Updated weights for policy 0, policy_version 53470 (0.0011) +[2023-10-08 17:53:14,017][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000053472_54755328.pth... +[2023-10-08 17:53:14,045][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000051840_53084160.pth +[2023-10-08 17:53:16,805][21194] Updated weights for policy 1, policy_version 53060 (0.0007) +[2023-10-08 17:53:17,165][21194] Updated weights for policy 1, policy_version 53070 (0.0008) +[2023-10-08 17:53:17,526][21194] Updated weights for policy 1, policy_version 53080 (0.0007) +[2023-10-08 17:53:17,800][21195] Updated weights for policy 0, policy_version 53480 (0.0008) +[2023-10-08 17:53:18,176][21195] Updated weights for policy 0, policy_version 53490 (0.0007) +[2023-10-08 17:53:18,542][21195] Updated weights for policy 0, policy_version 53500 (0.0007) +[2023-10-08 17:53:18,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 109150208. Throughput: 0: 1728.7, 1: 1730.9. Samples: 27289996. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:18,803][19739] Avg episode reward: [(0, '656.930'), (1, '952.000')] +[2023-10-08 17:53:21,599][21194] Updated weights for policy 1, policy_version 53090 (0.0007) +[2023-10-08 17:53:21,964][21194] Updated weights for policy 1, policy_version 53100 (0.0007) +[2023-10-08 17:53:22,331][21194] Updated weights for policy 1, policy_version 53110 (0.0009) +[2023-10-08 17:53:22,538][21195] Updated weights for policy 0, policy_version 53510 (0.0008) +[2023-10-08 17:53:22,696][21194] Updated weights for policy 1, policy_version 53120 (0.0007) +[2023-10-08 17:53:22,912][21195] Updated weights for policy 0, policy_version 53520 (0.0008) +[2023-10-08 17:53:23,286][21195] Updated weights for policy 0, policy_version 53530 (0.0007) +[2023-10-08 17:53:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 109215744. Throughput: 0: 1754.8, 1: 1712.6. Samples: 27305828. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:23,803][19739] Avg episode reward: [(0, '656.930'), (1, '952.000')] +[2023-10-08 17:53:26,557][21194] Updated weights for policy 1, policy_version 53130 (0.0007) +[2023-10-08 17:53:26,922][21194] Updated weights for policy 1, policy_version 53140 (0.0009) +[2023-10-08 17:53:27,281][21194] Updated weights for policy 1, policy_version 53150 (0.0008) +[2023-10-08 17:53:27,296][21195] Updated weights for policy 0, policy_version 53540 (0.0008) +[2023-10-08 17:53:27,656][21195] Updated weights for policy 0, policy_version 53550 (0.0011) +[2023-10-08 17:53:28,024][21195] Updated weights for policy 0, policy_version 53560 (0.0011) +[2023-10-08 17:53:28,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 109281280. Throughput: 0: 1736.7, 1: 1699.4. Samples: 27325716. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:28,804][19739] Avg episode reward: [(0, '656.930'), (1, '952.290')] +[2023-10-08 17:53:30,951][21194] Updated weights for policy 1, policy_version 53160 (0.0010) +[2023-10-08 17:53:31,309][21194] Updated weights for policy 1, policy_version 53170 (0.0011) +[2023-10-08 17:53:31,670][21194] Updated weights for policy 1, policy_version 53180 (0.0010) +[2023-10-08 17:53:31,862][21195] Updated weights for policy 0, policy_version 53570 (0.0010) +[2023-10-08 17:53:32,229][21195] Updated weights for policy 0, policy_version 53580 (0.0008) +[2023-10-08 17:53:32,609][21195] Updated weights for policy 0, policy_version 53590 (0.0007) +[2023-10-08 17:53:32,976][21195] Updated weights for policy 0, policy_version 53600 (0.0007) +[2023-10-08 17:53:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 109346816. Throughput: 0: 1718.0, 1: 1713.8. Samples: 27341394. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:33,803][19739] Avg episode reward: [(0, '656.930'), (1, '952.290')] +[2023-10-08 17:53:35,592][21194] Updated weights for policy 1, policy_version 53190 (0.0007) +[2023-10-08 17:53:35,953][21194] Updated weights for policy 1, policy_version 53200 (0.0007) +[2023-10-08 17:53:36,325][21194] Updated weights for policy 1, policy_version 53210 (0.0008) +[2023-10-08 17:53:36,919][21195] Updated weights for policy 0, policy_version 53610 (0.0007) +[2023-10-08 17:53:37,286][21195] Updated weights for policy 0, policy_version 53620 (0.0008) +[2023-10-08 17:53:37,650][21195] Updated weights for policy 0, policy_version 53630 (0.0009) +[2023-10-08 17:53:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 109412352. Throughput: 0: 1745.4, 1: 1697.4. Samples: 27357132. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:38,804][19739] Avg episode reward: [(0, '656.930'), (1, '952.290')] +[2023-10-08 17:53:40,154][21194] Updated weights for policy 1, policy_version 53220 (0.0009) +[2023-10-08 17:53:40,515][21194] Updated weights for policy 1, policy_version 53230 (0.0011) +[2023-10-08 17:53:40,877][21194] Updated weights for policy 1, policy_version 53240 (0.0008) +[2023-10-08 17:53:41,761][21195] Updated weights for policy 0, policy_version 53640 (0.0008) +[2023-10-08 17:53:42,129][21195] Updated weights for policy 0, policy_version 53650 (0.0007) +[2023-10-08 17:53:42,497][21195] Updated weights for policy 0, policy_version 53660 (0.0007) +[2023-10-08 17:53:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 109477888. Throughput: 0: 1718.0, 1: 1727.1. Samples: 27377558. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:43,804][19739] Avg episode reward: [(0, '684.950'), (1, '952.290')] +[2023-10-08 17:53:44,772][21194] Updated weights for policy 1, policy_version 53250 (0.0011) +[2023-10-08 17:53:45,131][21194] Updated weights for policy 1, policy_version 53260 (0.0009) +[2023-10-08 17:53:45,498][21194] Updated weights for policy 1, policy_version 53270 (0.0008) +[2023-10-08 17:53:45,863][21194] Updated weights for policy 1, policy_version 53280 (0.0008) +[2023-10-08 17:53:46,328][21195] Updated weights for policy 0, policy_version 53670 (0.0008) +[2023-10-08 17:53:46,691][21195] Updated weights for policy 0, policy_version 53680 (0.0008) +[2023-10-08 17:53:47,060][21195] Updated weights for policy 0, policy_version 53690 (0.0008) +[2023-10-08 17:53:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 109543424. Throughput: 0: 1720.6, 1: 1705.1. Samples: 27392926. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 17:53:48,803][19739] Avg episode reward: [(0, '684.950'), (1, '938.130')] +[2023-10-08 17:53:49,939][21194] Updated weights for policy 1, policy_version 53290 (0.0009) +[2023-10-08 17:53:50,306][21194] Updated weights for policy 1, policy_version 53300 (0.0008) +[2023-10-08 17:53:50,668][21194] Updated weights for policy 1, policy_version 53310 (0.0008) +[2023-10-08 17:53:51,061][21195] Updated weights for policy 0, policy_version 53700 (0.0008) +[2023-10-08 17:53:51,435][21195] Updated weights for policy 0, policy_version 53710 (0.0007) +[2023-10-08 17:53:51,803][21195] Updated weights for policy 0, policy_version 53720 (0.0009) +[2023-10-08 17:53:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 109608960. Throughput: 0: 1729.1, 1: 1712.4. Samples: 27408780. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:53:53,803][19739] Avg episode reward: [(0, '684.950'), (1, '931.260')] +[2023-10-08 17:53:54,716][21194] Updated weights for policy 1, policy_version 53320 (0.0009) +[2023-10-08 17:53:55,089][21194] Updated weights for policy 1, policy_version 53330 (0.0009) +[2023-10-08 17:53:55,459][21194] Updated weights for policy 1, policy_version 53340 (0.0008) +[2023-10-08 17:53:55,678][21195] Updated weights for policy 0, policy_version 53730 (0.0007) +[2023-10-08 17:53:56,041][21195] Updated weights for policy 0, policy_version 53740 (0.0007) +[2023-10-08 17:53:56,407][21195] Updated weights for policy 0, policy_version 53750 (0.0010) +[2023-10-08 17:53:56,774][21195] Updated weights for policy 0, policy_version 53760 (0.0010) +[2023-10-08 17:53:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 109674496. Throughput: 0: 1714.1, 1: 1743.3. Samples: 27430240. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:53:58,803][19739] Avg episode reward: [(0, '684.950'), (1, '901.640')] +[2023-10-08 17:53:59,211][21194] Updated weights for policy 1, policy_version 53350 (0.0007) +[2023-10-08 17:53:59,575][21194] Updated weights for policy 1, policy_version 53360 (0.0010) +[2023-10-08 17:53:59,935][21194] Updated weights for policy 1, policy_version 53370 (0.0007) +[2023-10-08 17:54:00,585][21195] Updated weights for policy 0, policy_version 53770 (0.0007) +[2023-10-08 17:54:00,956][21195] Updated weights for policy 0, policy_version 53780 (0.0008) +[2023-10-08 17:54:01,324][21195] Updated weights for policy 0, policy_version 53790 (0.0007) +[2023-10-08 17:54:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 109740032. Throughput: 0: 1748.3, 1: 1716.5. Samples: 27445914. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:54:03,803][19739] Avg episode reward: [(0, '684.950'), (1, '901.720')] +[2023-10-08 17:54:04,020][21194] Updated weights for policy 1, policy_version 53380 (0.0008) +[2023-10-08 17:54:04,384][21194] Updated weights for policy 1, policy_version 53390 (0.0007) +[2023-10-08 17:54:04,747][21194] Updated weights for policy 1, policy_version 53400 (0.0010) +[2023-10-08 17:54:05,211][21195] Updated weights for policy 0, policy_version 53800 (0.0009) +[2023-10-08 17:54:05,587][21195] Updated weights for policy 0, policy_version 53810 (0.0007) +[2023-10-08 17:54:05,952][21195] Updated weights for policy 0, policy_version 53820 (0.0007) +[2023-10-08 17:54:08,616][21194] Updated weights for policy 1, policy_version 53410 (0.0010) +[2023-10-08 17:54:08,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 109805568. Throughput: 0: 1721.6, 1: 1731.2. Samples: 27461208. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:54:08,804][19739] Avg episode reward: [(0, '684.950'), (1, '901.720')] +[2023-10-08 17:54:08,981][21194] Updated weights for policy 1, policy_version 53420 (0.0012) +[2023-10-08 17:54:09,359][21194] Updated weights for policy 1, policy_version 53430 (0.0009) +[2023-10-08 17:54:09,611][21195] Updated weights for policy 0, policy_version 53830 (0.0008) +[2023-10-08 17:54:09,718][21194] Updated weights for policy 1, policy_version 53440 (0.0009) +[2023-10-08 17:54:09,978][21195] Updated weights for policy 0, policy_version 53840 (0.0009) +[2023-10-08 17:54:10,354][21195] Updated weights for policy 0, policy_version 53850 (0.0008) +[2023-10-08 17:54:13,655][21194] Updated weights for policy 1, policy_version 53450 (0.0010) +[2023-10-08 17:54:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 109871104. Throughput: 0: 1744.1, 1: 1742.4. Samples: 27482604. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:54:13,803][19739] Avg episode reward: [(0, '700.120'), (1, '901.950')] +[2023-10-08 17:54:14,026][21194] Updated weights for policy 1, policy_version 53460 (0.0011) +[2023-10-08 17:54:14,267][21195] Updated weights for policy 0, policy_version 53860 (0.0008) +[2023-10-08 17:54:14,385][21194] Updated weights for policy 1, policy_version 53470 (0.0011) +[2023-10-08 17:54:14,634][21195] Updated weights for policy 0, policy_version 53870 (0.0007) +[2023-10-08 17:54:15,004][21195] Updated weights for policy 0, policy_version 53880 (0.0010) +[2023-10-08 17:54:18,180][21194] Updated weights for policy 1, policy_version 53480 (0.0010) +[2023-10-08 17:54:18,548][21194] Updated weights for policy 1, policy_version 53490 (0.0008) +[2023-10-08 17:54:18,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 109936640. Throughput: 0: 1763.4, 1: 1720.1. Samples: 27498152. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:54:18,803][19739] Avg episode reward: [(0, '700.120'), (1, '901.950')] +[2023-10-08 17:54:18,911][21194] Updated weights for policy 1, policy_version 53500 (0.0009) +[2023-10-08 17:54:18,973][21195] Updated weights for policy 0, policy_version 53890 (0.0010) +[2023-10-08 17:54:19,337][21195] Updated weights for policy 0, policy_version 53900 (0.0010) +[2023-10-08 17:54:19,698][21195] Updated weights for policy 0, policy_version 53910 (0.0011) +[2023-10-08 17:54:20,075][21195] Updated weights for policy 0, policy_version 53920 (0.0010) +[2023-10-08 17:54:22,907][21194] Updated weights for policy 1, policy_version 53510 (0.0007) +[2023-10-08 17:54:23,277][21194] Updated weights for policy 1, policy_version 53520 (0.0009) +[2023-10-08 17:54:23,645][21194] Updated weights for policy 1, policy_version 53530 (0.0010) +[2023-10-08 17:54:23,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 110002176. Throughput: 0: 1734.8, 1: 1742.8. Samples: 27513628. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:54:23,804][19739] Avg episode reward: [(0, '714.120'), (1, '901.950')] +[2023-10-08 17:54:23,981][21195] Updated weights for policy 0, policy_version 53930 (0.0010) +[2023-10-08 17:54:24,342][21195] Updated weights for policy 0, policy_version 53940 (0.0009) +[2023-10-08 17:54:24,718][21195] Updated weights for policy 0, policy_version 53950 (0.0007) +[2023-10-08 17:54:27,576][21194] Updated weights for policy 1, policy_version 53540 (0.0007) +[2023-10-08 17:54:27,939][21194] Updated weights for policy 1, policy_version 53550 (0.0007) +[2023-10-08 17:54:28,303][21194] Updated weights for policy 1, policy_version 53560 (0.0008) +[2023-10-08 17:54:28,479][21195] Updated weights for policy 0, policy_version 53960 (0.0007) +[2023-10-08 17:54:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 110100480. Throughput: 0: 1764.8, 1: 1720.9. Samples: 27534410. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 17:54:28,803][19739] Avg episode reward: [(0, '714.120'), (1, '901.950')] +[2023-10-08 17:54:28,861][21195] Updated weights for policy 0, policy_version 53970 (0.0008) +[2023-10-08 17:54:29,229][21195] Updated weights for policy 0, policy_version 53980 (0.0011) +[2023-10-08 17:54:32,403][21194] Updated weights for policy 1, policy_version 53570 (0.0008) +[2023-10-08 17:54:32,765][21194] Updated weights for policy 1, policy_version 53580 (0.0009) +[2023-10-08 17:54:33,124][21194] Updated weights for policy 1, policy_version 53590 (0.0008) +[2023-10-08 17:54:33,252][21195] Updated weights for policy 0, policy_version 53990 (0.0008) +[2023-10-08 17:54:33,493][21194] Updated weights for policy 1, policy_version 53600 (0.0009) +[2023-10-08 17:54:33,611][21195] Updated weights for policy 0, policy_version 54000 (0.0007) +[2023-10-08 17:54:33,803][19739] Fps is (10 sec: 16384.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 110166016. Throughput: 0: 1742.2, 1: 1736.4. Samples: 27549462. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:54:33,803][19739] Avg episode reward: [(0, '714.120'), (1, '905.370')] +[2023-10-08 17:54:33,983][21195] Updated weights for policy 0, policy_version 54010 (0.0008) +[2023-10-08 17:54:37,639][21194] Updated weights for policy 1, policy_version 53610 (0.0008) +[2023-10-08 17:54:37,859][21195] Updated weights for policy 0, policy_version 54020 (0.0008) +[2023-10-08 17:54:38,015][21194] Updated weights for policy 1, policy_version 53620 (0.0008) +[2023-10-08 17:54:38,231][21195] Updated weights for policy 0, policy_version 54030 (0.0010) +[2023-10-08 17:54:38,374][21194] Updated weights for policy 1, policy_version 53630 (0.0008) +[2023-10-08 17:54:38,594][21195] Updated weights for policy 0, policy_version 54040 (0.0008) +[2023-10-08 17:54:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 110231552. Throughput: 0: 1751.1, 1: 1733.8. Samples: 27565600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:54:38,803][19739] Avg episode reward: [(0, '714.120'), (1, '905.370')] +[2023-10-08 17:54:42,390][21194] Updated weights for policy 1, policy_version 53640 (0.0008) +[2023-10-08 17:54:42,497][21195] Updated weights for policy 0, policy_version 54050 (0.0009) +[2023-10-08 17:54:42,757][21194] Updated weights for policy 1, policy_version 53650 (0.0007) +[2023-10-08 17:54:42,859][21195] Updated weights for policy 0, policy_version 54060 (0.0007) +[2023-10-08 17:54:43,124][21194] Updated weights for policy 1, policy_version 53660 (0.0008) +[2023-10-08 17:54:43,234][21195] Updated weights for policy 0, policy_version 54070 (0.0010) +[2023-10-08 17:54:43,593][21195] Updated weights for policy 0, policy_version 54080 (0.0011) +[2023-10-08 17:54:43,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 110329856. Throughput: 0: 1751.7, 1: 1702.4. Samples: 27585674. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:54:43,803][19739] Avg episode reward: [(0, '714.120'), (1, '919.900')] +[2023-10-08 17:54:47,055][21194] Updated weights for policy 1, policy_version 53670 (0.0008) +[2023-10-08 17:54:47,412][21194] Updated weights for policy 1, policy_version 53680 (0.0009) +[2023-10-08 17:54:47,637][21195] Updated weights for policy 0, policy_version 54090 (0.0010) +[2023-10-08 17:54:47,773][21194] Updated weights for policy 1, policy_version 53690 (0.0008) +[2023-10-08 17:54:47,998][21195] Updated weights for policy 0, policy_version 54100 (0.0007) +[2023-10-08 17:54:48,362][21195] Updated weights for policy 0, policy_version 54110 (0.0007) +[2023-10-08 17:54:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 110395392. Throughput: 0: 1724.3, 1: 1724.6. Samples: 27601116. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:54:48,803][19739] Avg episode reward: [(0, '714.120'), (1, '933.880')] +[2023-10-08 17:54:51,775][21194] Updated weights for policy 1, policy_version 53700 (0.0008) +[2023-10-08 17:54:52,132][21194] Updated weights for policy 1, policy_version 53710 (0.0007) +[2023-10-08 17:54:52,419][21195] Updated weights for policy 0, policy_version 54120 (0.0007) +[2023-10-08 17:54:52,496][21194] Updated weights for policy 1, policy_version 53720 (0.0007) +[2023-10-08 17:54:52,792][21195] Updated weights for policy 0, policy_version 54130 (0.0007) +[2023-10-08 17:54:53,156][21195] Updated weights for policy 0, policy_version 54140 (0.0011) +[2023-10-08 17:54:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 110460928. Throughput: 0: 1751.8, 1: 1716.1. Samples: 27617266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:54:53,804][19739] Avg episode reward: [(0, '714.120'), (1, '934.200')] +[2023-10-08 17:54:56,521][21194] Updated weights for policy 1, policy_version 53730 (0.0009) +[2023-10-08 17:54:56,885][21194] Updated weights for policy 1, policy_version 53740 (0.0009) +[2023-10-08 17:54:57,143][21195] Updated weights for policy 0, policy_version 54150 (0.0008) +[2023-10-08 17:54:57,254][21194] Updated weights for policy 1, policy_version 53750 (0.0009) +[2023-10-08 17:54:57,501][21195] Updated weights for policy 0, policy_version 54160 (0.0009) +[2023-10-08 17:54:57,619][21194] Updated weights for policy 1, policy_version 53760 (0.0009) +[2023-10-08 17:54:57,879][21195] Updated weights for policy 0, policy_version 54170 (0.0010) +[2023-10-08 17:54:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 110526464. Throughput: 0: 1723.6, 1: 1697.0. Samples: 27636530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:54:58,803][19739] Avg episode reward: [(0, '714.120'), (1, '934.200')] +[2023-10-08 17:55:01,557][21194] Updated weights for policy 1, policy_version 53770 (0.0010) +[2023-10-08 17:55:01,900][21195] Updated weights for policy 0, policy_version 54180 (0.0009) +[2023-10-08 17:55:01,922][21194] Updated weights for policy 1, policy_version 53780 (0.0009) +[2023-10-08 17:55:02,281][21195] Updated weights for policy 0, policy_version 54190 (0.0008) +[2023-10-08 17:55:02,284][21194] Updated weights for policy 1, policy_version 53790 (0.0008) +[2023-10-08 17:55:02,644][21195] Updated weights for policy 0, policy_version 54200 (0.0008) +[2023-10-08 17:55:03,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 110592000. Throughput: 0: 1710.8, 1: 1725.2. Samples: 27652768. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:55:03,803][19739] Avg episode reward: [(0, '714.120'), (1, '934.120')] +[2023-10-08 17:55:06,355][21194] Updated weights for policy 1, policy_version 53800 (0.0009) +[2023-10-08 17:55:06,537][21195] Updated weights for policy 0, policy_version 54210 (0.0009) +[2023-10-08 17:55:06,718][21194] Updated weights for policy 1, policy_version 53810 (0.0007) +[2023-10-08 17:55:06,903][21195] Updated weights for policy 0, policy_version 54220 (0.0009) +[2023-10-08 17:55:07,083][21194] Updated weights for policy 1, policy_version 53820 (0.0008) +[2023-10-08 17:55:07,271][21195] Updated weights for policy 0, policy_version 54230 (0.0007) +[2023-10-08 17:55:07,642][21195] Updated weights for policy 0, policy_version 54240 (0.0009) +[2023-10-08 17:55:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 110657536. Throughput: 0: 1737.0, 1: 1690.3. Samples: 27667854. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:08,803][19739] Avg episode reward: [(0, '714.120'), (1, '934.120')] +[2023-10-08 17:55:11,110][21194] Updated weights for policy 1, policy_version 53830 (0.0007) +[2023-10-08 17:55:11,468][21194] Updated weights for policy 1, policy_version 53840 (0.0009) +[2023-10-08 17:55:11,560][21195] Updated weights for policy 0, policy_version 54250 (0.0008) +[2023-10-08 17:55:11,830][21194] Updated weights for policy 1, policy_version 53850 (0.0009) +[2023-10-08 17:55:11,937][21195] Updated weights for policy 0, policy_version 54260 (0.0007) +[2023-10-08 17:55:12,297][21195] Updated weights for policy 0, policy_version 54270 (0.0009) +[2023-10-08 17:55:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 110723072. Throughput: 0: 1710.5, 1: 1704.5. Samples: 27688086. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:13,803][19739] Avg episode reward: [(0, '714.120'), (1, '934.120')] +[2023-10-08 17:55:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000054272_55574528.pth... +[2023-10-08 17:55:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000053856_55148544.pth... +[2023-10-08 17:55:13,859][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000052256_53510144.pth +[2023-10-08 17:55:13,861][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000052640_53903360.pth +[2023-10-08 17:55:15,873][21194] Updated weights for policy 1, policy_version 53860 (0.0007) +[2023-10-08 17:55:16,145][21195] Updated weights for policy 0, policy_version 54280 (0.0008) +[2023-10-08 17:55:16,237][21194] Updated weights for policy 1, policy_version 53870 (0.0008) +[2023-10-08 17:55:16,517][21195] Updated weights for policy 0, policy_version 54290 (0.0007) +[2023-10-08 17:55:16,596][21194] Updated weights for policy 1, policy_version 53880 (0.0009) +[2023-10-08 17:55:16,890][21195] Updated weights for policy 0, policy_version 54300 (0.0007) +[2023-10-08 17:55:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 110788608. Throughput: 0: 1732.6, 1: 1710.8. Samples: 27704416. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:18,803][19739] Avg episode reward: [(0, '714.120'), (1, '934.120')] +[2023-10-08 17:55:20,441][21194] Updated weights for policy 1, policy_version 53890 (0.0008) +[2023-10-08 17:55:20,809][21194] Updated weights for policy 1, policy_version 53900 (0.0007) +[2023-10-08 17:55:20,957][21195] Updated weights for policy 0, policy_version 54310 (0.0009) +[2023-10-08 17:55:21,173][21194] Updated weights for policy 1, policy_version 53910 (0.0008) +[2023-10-08 17:55:21,325][21195] Updated weights for policy 0, policy_version 54320 (0.0008) +[2023-10-08 17:55:21,536][21194] Updated weights for policy 1, policy_version 53920 (0.0008) +[2023-10-08 17:55:21,695][21195] Updated weights for policy 0, policy_version 54330 (0.0007) +[2023-10-08 17:55:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 110854144. Throughput: 0: 1717.6, 1: 1686.4. Samples: 27718784. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:23,803][19739] Avg episode reward: [(0, '729.050'), (1, '934.120')] +[2023-10-08 17:55:25,183][21194] Updated weights for policy 1, policy_version 53930 (0.0009) +[2023-10-08 17:55:25,513][21195] Updated weights for policy 0, policy_version 54340 (0.0008) +[2023-10-08 17:55:25,550][21194] Updated weights for policy 1, policy_version 53940 (0.0008) +[2023-10-08 17:55:25,874][21195] Updated weights for policy 0, policy_version 54350 (0.0008) +[2023-10-08 17:55:25,908][21194] Updated weights for policy 1, policy_version 53950 (0.0008) +[2023-10-08 17:55:26,242][21195] Updated weights for policy 0, policy_version 54360 (0.0008) +[2023-10-08 17:55:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 110919680. Throughput: 0: 1724.3, 1: 1715.8. Samples: 27740478. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:28,803][19739] Avg episode reward: [(0, '726.260'), (1, '934.120')] +[2023-10-08 17:55:29,946][21194] Updated weights for policy 1, policy_version 53960 (0.0009) +[2023-10-08 17:55:30,079][21195] Updated weights for policy 0, policy_version 54370 (0.0009) +[2023-10-08 17:55:30,315][21194] Updated weights for policy 1, policy_version 53970 (0.0008) +[2023-10-08 17:55:30,448][21195] Updated weights for policy 0, policy_version 54380 (0.0008) +[2023-10-08 17:55:30,674][21194] Updated weights for policy 1, policy_version 53980 (0.0009) +[2023-10-08 17:55:30,813][21195] Updated weights for policy 0, policy_version 54390 (0.0011) +[2023-10-08 17:55:31,196][21195] Updated weights for policy 0, policy_version 54400 (0.0008) +[2023-10-08 17:55:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 110985216. Throughput: 0: 1741.9, 1: 1692.3. Samples: 27755654. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:33,804][19739] Avg episode reward: [(0, '726.260'), (1, '934.120')] +[2023-10-08 17:55:34,668][21194] Updated weights for policy 1, policy_version 53990 (0.0007) +[2023-10-08 17:55:35,029][21194] Updated weights for policy 1, policy_version 54000 (0.0008) +[2023-10-08 17:55:35,169][21195] Updated weights for policy 0, policy_version 54410 (0.0007) +[2023-10-08 17:55:35,393][21194] Updated weights for policy 1, policy_version 54010 (0.0008) +[2023-10-08 17:55:35,532][21195] Updated weights for policy 0, policy_version 54420 (0.0010) +[2023-10-08 17:55:35,901][21195] Updated weights for policy 0, policy_version 54430 (0.0008) +[2023-10-08 17:55:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 111050752. Throughput: 0: 1714.1, 1: 1705.7. Samples: 27771160. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:38,803][19739] Avg episode reward: [(0, '726.260'), (1, '934.120')] +[2023-10-08 17:55:39,364][21194] Updated weights for policy 1, policy_version 54020 (0.0007) +[2023-10-08 17:55:39,728][21194] Updated weights for policy 1, policy_version 54030 (0.0008) +[2023-10-08 17:55:39,895][21195] Updated weights for policy 0, policy_version 54440 (0.0008) +[2023-10-08 17:55:40,098][21194] Updated weights for policy 1, policy_version 54040 (0.0007) +[2023-10-08 17:55:40,261][21195] Updated weights for policy 0, policy_version 54450 (0.0007) +[2023-10-08 17:55:40,630][21195] Updated weights for policy 0, policy_version 54460 (0.0009) +[2023-10-08 17:55:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 111116288. Throughput: 0: 1741.2, 1: 1730.3. Samples: 27792748. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 17:55:43,803][19739] Avg episode reward: [(0, '702.460'), (1, '948.790')] +[2023-10-08 17:55:43,996][21194] Updated weights for policy 1, policy_version 54050 (0.0007) +[2023-10-08 17:55:44,358][21194] Updated weights for policy 1, policy_version 54060 (0.0008) +[2023-10-08 17:55:44,434][21195] Updated weights for policy 0, policy_version 54470 (0.0008) +[2023-10-08 17:55:44,729][21194] Updated weights for policy 1, policy_version 54070 (0.0008) +[2023-10-08 17:55:44,796][21195] Updated weights for policy 0, policy_version 54480 (0.0008) +[2023-10-08 17:55:45,087][21194] Updated weights for policy 1, policy_version 54080 (0.0008) +[2023-10-08 17:55:45,171][21195] Updated weights for policy 0, policy_version 54490 (0.0009) +[2023-10-08 17:55:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 111181824. Throughput: 0: 1751.6, 1: 1701.1. Samples: 27808140. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:55:48,803][19739] Avg episode reward: [(0, '701.130'), (1, '963.510')] +[2023-10-08 17:55:49,089][21194] Updated weights for policy 1, policy_version 54090 (0.0008) +[2023-10-08 17:55:49,109][21195] Updated weights for policy 0, policy_version 54500 (0.0009) +[2023-10-08 17:55:49,448][21194] Updated weights for policy 1, policy_version 54100 (0.0008) +[2023-10-08 17:55:49,484][21195] Updated weights for policy 0, policy_version 54510 (0.0007) +[2023-10-08 17:55:49,817][21194] Updated weights for policy 1, policy_version 54110 (0.0007) +[2023-10-08 17:55:49,853][21195] Updated weights for policy 0, policy_version 54520 (0.0009) +[2023-10-08 17:55:53,726][21195] Updated weights for policy 0, policy_version 54530 (0.0009) +[2023-10-08 17:55:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 111247360. Throughput: 0: 1726.4, 1: 1730.8. Samples: 27823430. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:55:53,803][19739] Avg episode reward: [(0, '701.130'), (1, '954.580')] +[2023-10-08 17:55:53,857][21194] Updated weights for policy 1, policy_version 54120 (0.0008) +[2023-10-08 17:55:54,095][21195] Updated weights for policy 0, policy_version 54540 (0.0009) +[2023-10-08 17:55:54,226][21194] Updated weights for policy 1, policy_version 54130 (0.0007) +[2023-10-08 17:55:54,455][21195] Updated weights for policy 0, policy_version 54550 (0.0007) +[2023-10-08 17:55:54,588][21194] Updated weights for policy 1, policy_version 54140 (0.0008) +[2023-10-08 17:55:54,822][21195] Updated weights for policy 0, policy_version 54560 (0.0009) +[2023-10-08 17:55:58,710][21195] Updated weights for policy 0, policy_version 54570 (0.0008) +[2023-10-08 17:55:58,718][21194] Updated weights for policy 1, policy_version 54150 (0.0008) +[2023-10-08 17:55:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 111312896. Throughput: 0: 1754.4, 1: 1734.0. Samples: 27845066. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:55:58,803][19739] Avg episode reward: [(0, '715.030'), (1, '954.580')] +[2023-10-08 17:55:59,084][21195] Updated weights for policy 0, policy_version 54580 (0.0008) +[2023-10-08 17:55:59,085][21194] Updated weights for policy 1, policy_version 54160 (0.0009) +[2023-10-08 17:55:59,447][21194] Updated weights for policy 1, policy_version 54170 (0.0008) +[2023-10-08 17:55:59,450][21195] Updated weights for policy 0, policy_version 54590 (0.0007) +[2023-10-08 17:56:03,297][21195] Updated weights for policy 0, policy_version 54600 (0.0008) +[2023-10-08 17:56:03,339][21194] Updated weights for policy 1, policy_version 54180 (0.0009) +[2023-10-08 17:56:03,663][21195] Updated weights for policy 0, policy_version 54610 (0.0007) +[2023-10-08 17:56:03,710][21194] Updated weights for policy 1, policy_version 54190 (0.0009) +[2023-10-08 17:56:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 111378432. Throughput: 0: 1733.0, 1: 1711.4. Samples: 27859414. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:56:03,803][19739] Avg episode reward: [(0, '715.220'), (1, '939.770')] +[2023-10-08 17:56:04,043][21195] Updated weights for policy 0, policy_version 54620 (0.0010) +[2023-10-08 17:56:04,088][21194] Updated weights for policy 1, policy_version 54200 (0.0008) +[2023-10-08 17:56:08,020][21195] Updated weights for policy 0, policy_version 54630 (0.0010) +[2023-10-08 17:56:08,137][21194] Updated weights for policy 1, policy_version 54210 (0.0008) +[2023-10-08 17:56:08,390][21195] Updated weights for policy 0, policy_version 54640 (0.0007) +[2023-10-08 17:56:08,513][21194] Updated weights for policy 1, policy_version 54220 (0.0007) +[2023-10-08 17:56:08,762][21195] Updated weights for policy 0, policy_version 54650 (0.0007) +[2023-10-08 17:56:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 111443968. Throughput: 0: 1749.4, 1: 1738.2. Samples: 27875726. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:56:08,803][19739] Avg episode reward: [(0, '717.520'), (1, '939.770')] +[2023-10-08 17:56:08,889][21194] Updated weights for policy 1, policy_version 54230 (0.0009) +[2023-10-08 17:56:09,252][21194] Updated weights for policy 1, policy_version 54240 (0.0008) +[2023-10-08 17:56:12,660][21195] Updated weights for policy 0, policy_version 54660 (0.0007) +[2023-10-08 17:56:13,025][21195] Updated weights for policy 0, policy_version 54670 (0.0007) +[2023-10-08 17:56:13,194][21194] Updated weights for policy 1, policy_version 54250 (0.0009) +[2023-10-08 17:56:13,393][21195] Updated weights for policy 0, policy_version 54680 (0.0007) +[2023-10-08 17:56:13,554][21194] Updated weights for policy 1, policy_version 54260 (0.0009) +[2023-10-08 17:56:13,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 111542272. Throughput: 0: 1741.0, 1: 1726.5. Samples: 27896518. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:56:13,803][19739] Avg episode reward: [(0, '702.650'), (1, '939.770')] +[2023-10-08 17:56:13,925][21194] Updated weights for policy 1, policy_version 54270 (0.0010) +[2023-10-08 17:56:17,278][21195] Updated weights for policy 0, policy_version 54690 (0.0007) +[2023-10-08 17:56:17,652][21195] Updated weights for policy 0, policy_version 54700 (0.0008) +[2023-10-08 17:56:17,870][21194] Updated weights for policy 1, policy_version 54280 (0.0009) +[2023-10-08 17:56:18,017][21195] Updated weights for policy 0, policy_version 54710 (0.0007) +[2023-10-08 17:56:18,228][21194] Updated weights for policy 1, policy_version 54290 (0.0008) +[2023-10-08 17:56:18,385][21195] Updated weights for policy 0, policy_version 54720 (0.0007) +[2023-10-08 17:56:18,594][21194] Updated weights for policy 1, policy_version 54300 (0.0008) +[2023-10-08 17:56:18,803][19739] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 111640576. Throughput: 0: 1723.1, 1: 1730.1. Samples: 27911046. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 17:56:18,803][19739] Avg episode reward: [(0, '702.650'), (1, '939.770')] +[2023-10-08 17:56:22,269][21195] Updated weights for policy 0, policy_version 54730 (0.0008) +[2023-10-08 17:56:22,646][21195] Updated weights for policy 0, policy_version 54740 (0.0008) +[2023-10-08 17:56:22,682][21194] Updated weights for policy 1, policy_version 54310 (0.0010) +[2023-10-08 17:56:23,018][21195] Updated weights for policy 0, policy_version 54750 (0.0008) +[2023-10-08 17:56:23,049][21194] Updated weights for policy 1, policy_version 54320 (0.0007) +[2023-10-08 17:56:23,404][21194] Updated weights for policy 1, policy_version 54330 (0.0007) +[2023-10-08 17:56:23,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 111706112. Throughput: 0: 1751.2, 1: 1722.4. Samples: 27927472. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:23,803][19739] Avg episode reward: [(0, '702.650'), (1, '939.770')] +[2023-10-08 17:56:27,026][21195] Updated weights for policy 0, policy_version 54760 (0.0007) +[2023-10-08 17:56:27,398][21195] Updated weights for policy 0, policy_version 54770 (0.0007) +[2023-10-08 17:56:27,461][21194] Updated weights for policy 1, policy_version 54340 (0.0008) +[2023-10-08 17:56:27,763][21195] Updated weights for policy 0, policy_version 54780 (0.0009) +[2023-10-08 17:56:27,831][21194] Updated weights for policy 1, policy_version 54350 (0.0008) +[2023-10-08 17:56:28,194][21194] Updated weights for policy 1, policy_version 54360 (0.0009) +[2023-10-08 17:56:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 111771648. Throughput: 0: 1719.1, 1: 1705.2. Samples: 27946838. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:28,803][19739] Avg episode reward: [(0, '702.940'), (1, '940.150')] +[2023-10-08 17:56:31,644][21195] Updated weights for policy 0, policy_version 54790 (0.0010) +[2023-10-08 17:56:32,008][21195] Updated weights for policy 0, policy_version 54800 (0.0008) +[2023-10-08 17:56:32,041][21194] Updated weights for policy 1, policy_version 54370 (0.0007) +[2023-10-08 17:56:32,383][21195] Updated weights for policy 0, policy_version 54810 (0.0007) +[2023-10-08 17:56:32,412][21194] Updated weights for policy 1, policy_version 54380 (0.0008) +[2023-10-08 17:56:32,776][21194] Updated weights for policy 1, policy_version 54390 (0.0007) +[2023-10-08 17:56:33,135][21194] Updated weights for policy 1, policy_version 54400 (0.0007) +[2023-10-08 17:56:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 111837184. Throughput: 0: 1715.3, 1: 1721.1. Samples: 27962778. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:33,803][19739] Avg episode reward: [(0, '702.940'), (1, '940.150')] +[2023-10-08 17:56:36,397][21195] Updated weights for policy 0, policy_version 54820 (0.0009) +[2023-10-08 17:56:36,763][21195] Updated weights for policy 0, policy_version 54830 (0.0011) +[2023-10-08 17:56:37,059][21194] Updated weights for policy 1, policy_version 54410 (0.0007) +[2023-10-08 17:56:37,132][21195] Updated weights for policy 0, policy_version 54840 (0.0009) +[2023-10-08 17:56:37,417][21194] Updated weights for policy 1, policy_version 54420 (0.0008) +[2023-10-08 17:56:37,787][21194] Updated weights for policy 1, policy_version 54430 (0.0011) +[2023-10-08 17:56:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 111902720. Throughput: 0: 1729.2, 1: 1716.1. Samples: 27978470. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:38,803][19739] Avg episode reward: [(0, '707.760'), (1, '940.150')] +[2023-10-08 17:56:41,120][21195] Updated weights for policy 0, policy_version 54850 (0.0008) +[2023-10-08 17:56:41,481][21195] Updated weights for policy 0, policy_version 54860 (0.0007) +[2023-10-08 17:56:41,854][21195] Updated weights for policy 0, policy_version 54870 (0.0007) +[2023-10-08 17:56:41,907][21194] Updated weights for policy 1, policy_version 54440 (0.0009) +[2023-10-08 17:56:42,216][21195] Updated weights for policy 0, policy_version 54880 (0.0010) +[2023-10-08 17:56:42,272][21194] Updated weights for policy 1, policy_version 54450 (0.0007) +[2023-10-08 17:56:42,634][21194] Updated weights for policy 1, policy_version 54460 (0.0007) +[2023-10-08 17:56:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 111968256. Throughput: 0: 1705.6, 1: 1690.5. Samples: 27997890. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:43,803][19739] Avg episode reward: [(0, '707.760'), (1, '940.150')] +[2023-10-08 17:56:46,161][21195] Updated weights for policy 0, policy_version 54890 (0.0008) +[2023-10-08 17:56:46,506][21194] Updated weights for policy 1, policy_version 54470 (0.0007) +[2023-10-08 17:56:46,533][21195] Updated weights for policy 0, policy_version 54900 (0.0007) +[2023-10-08 17:56:46,864][21194] Updated weights for policy 1, policy_version 54480 (0.0007) +[2023-10-08 17:56:46,905][21195] Updated weights for policy 0, policy_version 54910 (0.0009) +[2023-10-08 17:56:47,226][21194] Updated weights for policy 1, policy_version 54490 (0.0009) +[2023-10-08 17:56:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 112033792. Throughput: 0: 1723.2, 1: 1728.8. Samples: 28014750. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:48,803][19739] Avg episode reward: [(0, '707.760'), (1, '940.310')] +[2023-10-08 17:56:50,859][21195] Updated weights for policy 0, policy_version 54920 (0.0009) +[2023-10-08 17:56:51,058][21194] Updated weights for policy 1, policy_version 54500 (0.0007) +[2023-10-08 17:56:51,234][21195] Updated weights for policy 0, policy_version 54930 (0.0007) +[2023-10-08 17:56:51,425][21194] Updated weights for policy 1, policy_version 54510 (0.0007) +[2023-10-08 17:56:51,597][21195] Updated weights for policy 0, policy_version 54940 (0.0009) +[2023-10-08 17:56:51,789][21194] Updated weights for policy 1, policy_version 54520 (0.0008) +[2023-10-08 17:56:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 112099328. Throughput: 0: 1702.9, 1: 1704.6. Samples: 28029064. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:53,803][19739] Avg episode reward: [(0, '707.760'), (1, '940.310')] +[2023-10-08 17:56:55,495][21195] Updated weights for policy 0, policy_version 54950 (0.0008) +[2023-10-08 17:56:55,770][21194] Updated weights for policy 1, policy_version 54530 (0.0008) +[2023-10-08 17:56:55,856][21195] Updated weights for policy 0, policy_version 54960 (0.0009) +[2023-10-08 17:56:56,135][21194] Updated weights for policy 1, policy_version 54540 (0.0009) +[2023-10-08 17:56:56,232][21195] Updated weights for policy 0, policy_version 54970 (0.0009) +[2023-10-08 17:56:56,506][21194] Updated weights for policy 1, policy_version 54550 (0.0009) +[2023-10-08 17:56:56,865][21194] Updated weights for policy 1, policy_version 54560 (0.0008) +[2023-10-08 17:56:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 112164864. Throughput: 0: 1709.9, 1: 1705.6. Samples: 28050218. Policy #0 lag: (min: 13.0, avg: 18.7, max: 45.0) +[2023-10-08 17:56:58,803][19739] Avg episode reward: [(0, '708.210'), (1, '940.310')] +[2023-10-08 17:57:00,242][21195] Updated weights for policy 0, policy_version 54980 (0.0008) +[2023-10-08 17:57:00,616][21195] Updated weights for policy 0, policy_version 54990 (0.0008) +[2023-10-08 17:57:00,754][21194] Updated weights for policy 1, policy_version 54570 (0.0008) +[2023-10-08 17:57:00,977][21195] Updated weights for policy 0, policy_version 55000 (0.0009) +[2023-10-08 17:57:01,116][21194] Updated weights for policy 1, policy_version 54580 (0.0009) +[2023-10-08 17:57:01,492][21194] Updated weights for policy 1, policy_version 54590 (0.0009) +[2023-10-08 17:57:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 112230400. Throughput: 0: 1725.1, 1: 1720.2. Samples: 28066084. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:03,803][19739] Avg episode reward: [(0, '723.350'), (1, '940.310')] +[2023-10-08 17:57:04,922][21195] Updated weights for policy 0, policy_version 55010 (0.0008) +[2023-10-08 17:57:05,291][21195] Updated weights for policy 0, policy_version 55020 (0.0009) +[2023-10-08 17:57:05,493][21194] Updated weights for policy 1, policy_version 54600 (0.0009) +[2023-10-08 17:57:05,657][21195] Updated weights for policy 0, policy_version 55030 (0.0007) +[2023-10-08 17:57:05,864][21194] Updated weights for policy 1, policy_version 54610 (0.0008) +[2023-10-08 17:57:06,026][21195] Updated weights for policy 0, policy_version 55040 (0.0008) +[2023-10-08 17:57:06,230][21194] Updated weights for policy 1, policy_version 54620 (0.0010) +[2023-10-08 17:57:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 112295936. Throughput: 0: 1697.7, 1: 1706.5. Samples: 28080664. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:08,803][19739] Avg episode reward: [(0, '704.050'), (1, '940.310')] +[2023-10-08 17:57:09,985][21195] Updated weights for policy 0, policy_version 55050 (0.0010) +[2023-10-08 17:57:10,258][21194] Updated weights for policy 1, policy_version 54630 (0.0009) +[2023-10-08 17:57:10,354][21195] Updated weights for policy 0, policy_version 55060 (0.0009) +[2023-10-08 17:57:10,625][21194] Updated weights for policy 1, policy_version 54640 (0.0009) +[2023-10-08 17:57:10,722][21195] Updated weights for policy 0, policy_version 55070 (0.0008) +[2023-10-08 17:57:10,999][21194] Updated weights for policy 1, policy_version 54650 (0.0010) +[2023-10-08 17:57:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 112361472. Throughput: 0: 1733.9, 1: 1717.7. Samples: 28102158. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:13,803][19739] Avg episode reward: [(0, '718.600'), (1, '940.310')] +[2023-10-08 17:57:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000054656_55967744.pth... +[2023-10-08 17:57:13,810][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000055072_56393728.pth... +[2023-10-08 17:57:13,843][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000053472_54755328.pth +[2023-10-08 17:57:13,854][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000053056_54329344.pth +[2023-10-08 17:57:14,761][21195] Updated weights for policy 0, policy_version 55080 (0.0009) +[2023-10-08 17:57:14,808][21194] Updated weights for policy 1, policy_version 54660 (0.0010) +[2023-10-08 17:57:15,135][21195] Updated weights for policy 0, policy_version 55090 (0.0007) +[2023-10-08 17:57:15,178][21194] Updated weights for policy 1, policy_version 54670 (0.0007) +[2023-10-08 17:57:15,501][21195] Updated weights for policy 0, policy_version 55100 (0.0007) +[2023-10-08 17:57:15,543][21194] Updated weights for policy 1, policy_version 54680 (0.0009) +[2023-10-08 17:57:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 112427008. Throughput: 0: 1736.1, 1: 1705.5. Samples: 28117650. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:18,803][19739] Avg episode reward: [(0, '691.410'), (1, '940.310')] +[2023-10-08 17:57:19,367][21195] Updated weights for policy 0, policy_version 55110 (0.0007) +[2023-10-08 17:57:19,547][21194] Updated weights for policy 1, policy_version 54690 (0.0007) +[2023-10-08 17:57:19,736][21195] Updated weights for policy 0, policy_version 55120 (0.0007) +[2023-10-08 17:57:19,911][21194] Updated weights for policy 1, policy_version 54700 (0.0007) +[2023-10-08 17:57:20,109][21195] Updated weights for policy 0, policy_version 55130 (0.0007) +[2023-10-08 17:57:20,275][21194] Updated weights for policy 1, policy_version 54710 (0.0008) +[2023-10-08 17:57:20,642][21194] Updated weights for policy 1, policy_version 54720 (0.0009) +[2023-10-08 17:57:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 112492544. Throughput: 0: 1722.8, 1: 1708.1. Samples: 28132862. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:23,803][19739] Avg episode reward: [(0, '691.560'), (1, '940.450')] +[2023-10-08 17:57:23,930][21195] Updated weights for policy 0, policy_version 55140 (0.0009) +[2023-10-08 17:57:24,297][21195] Updated weights for policy 0, policy_version 55150 (0.0008) +[2023-10-08 17:57:24,657][21194] Updated weights for policy 1, policy_version 54730 (0.0008) +[2023-10-08 17:57:24,665][21195] Updated weights for policy 0, policy_version 55160 (0.0007) +[2023-10-08 17:57:25,030][21194] Updated weights for policy 1, policy_version 54740 (0.0008) +[2023-10-08 17:57:25,396][21194] Updated weights for policy 1, policy_version 54750 (0.0008) +[2023-10-08 17:57:28,385][21195] Updated weights for policy 0, policy_version 55170 (0.0008) +[2023-10-08 17:57:28,742][21195] Updated weights for policy 0, policy_version 55180 (0.0010) +[2023-10-08 17:57:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 112558080. Throughput: 0: 1748.0, 1: 1730.2. Samples: 28154410. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:28,803][19739] Avg episode reward: [(0, '691.560'), (1, '940.450')] +[2023-10-08 17:57:29,106][21195] Updated weights for policy 0, policy_version 55190 (0.0010) +[2023-10-08 17:57:29,327][21194] Updated weights for policy 1, policy_version 54760 (0.0008) +[2023-10-08 17:57:29,482][21195] Updated weights for policy 0, policy_version 55200 (0.0007) +[2023-10-08 17:57:29,691][21194] Updated weights for policy 1, policy_version 54770 (0.0007) +[2023-10-08 17:57:30,059][21194] Updated weights for policy 1, policy_version 54780 (0.0008) +[2023-10-08 17:57:33,285][21195] Updated weights for policy 0, policy_version 55210 (0.0007) +[2023-10-08 17:57:33,655][21195] Updated weights for policy 0, policy_version 55220 (0.0007) +[2023-10-08 17:57:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 112623616. Throughput: 0: 1730.1, 1: 1696.5. Samples: 28168948. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:33,803][19739] Avg episode reward: [(0, '691.560'), (1, '940.450')] +[2023-10-08 17:57:34,012][21195] Updated weights for policy 0, policy_version 55230 (0.0007) +[2023-10-08 17:57:34,191][21194] Updated weights for policy 1, policy_version 54790 (0.0009) +[2023-10-08 17:57:34,548][21194] Updated weights for policy 1, policy_version 54800 (0.0007) +[2023-10-08 17:57:34,915][21194] Updated weights for policy 1, policy_version 54810 (0.0007) +[2023-10-08 17:57:38,090][21195] Updated weights for policy 0, policy_version 55240 (0.0007) +[2023-10-08 17:57:38,468][21195] Updated weights for policy 0, policy_version 55250 (0.0007) +[2023-10-08 17:57:38,782][21194] Updated weights for policy 1, policy_version 54820 (0.0007) +[2023-10-08 17:57:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 112689152. Throughput: 0: 1751.5, 1: 1722.0. Samples: 28185370. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 17:57:38,803][19739] Avg episode reward: [(0, '691.560'), (1, '953.420')] +[2023-10-08 17:57:38,833][21195] Updated weights for policy 0, policy_version 55260 (0.0008) +[2023-10-08 17:57:39,144][21194] Updated weights for policy 1, policy_version 54830 (0.0009) +[2023-10-08 17:57:39,511][21194] Updated weights for policy 1, policy_version 54840 (0.0008) +[2023-10-08 17:57:42,598][21195] Updated weights for policy 0, policy_version 55270 (0.0007) +[2023-10-08 17:57:42,961][21195] Updated weights for policy 0, policy_version 55280 (0.0008) +[2023-10-08 17:57:43,327][21195] Updated weights for policy 0, policy_version 55290 (0.0010) +[2023-10-08 17:57:43,524][21194] Updated weights for policy 1, policy_version 54850 (0.0008) +[2023-10-08 17:57:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 112787456. Throughput: 0: 1742.7, 1: 1728.2. Samples: 28206408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:57:43,803][19739] Avg episode reward: [(0, '691.560'), (1, '953.690')] +[2023-10-08 17:57:43,875][21194] Updated weights for policy 1, policy_version 54860 (0.0007) +[2023-10-08 17:57:44,243][21194] Updated weights for policy 1, policy_version 54870 (0.0007) +[2023-10-08 17:57:44,606][21194] Updated weights for policy 1, policy_version 54880 (0.0009) +[2023-10-08 17:57:47,318][21195] Updated weights for policy 0, policy_version 55300 (0.0009) +[2023-10-08 17:57:47,693][21195] Updated weights for policy 0, policy_version 55310 (0.0008) +[2023-10-08 17:57:48,061][21195] Updated weights for policy 0, policy_version 55320 (0.0010) +[2023-10-08 17:57:48,635][21194] Updated weights for policy 1, policy_version 54890 (0.0007) +[2023-10-08 17:57:48,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 112852992. Throughput: 0: 1730.8, 1: 1709.6. Samples: 28220900. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:57:48,803][19739] Avg episode reward: [(0, '691.510'), (1, '953.690')] +[2023-10-08 17:57:48,996][21194] Updated weights for policy 1, policy_version 54900 (0.0008) +[2023-10-08 17:57:49,363][21194] Updated weights for policy 1, policy_version 54910 (0.0009) +[2023-10-08 17:57:52,080][21195] Updated weights for policy 0, policy_version 55330 (0.0009) +[2023-10-08 17:57:52,458][21195] Updated weights for policy 0, policy_version 55340 (0.0009) +[2023-10-08 17:57:52,822][21195] Updated weights for policy 0, policy_version 55350 (0.0011) +[2023-10-08 17:57:53,193][21195] Updated weights for policy 0, policy_version 55360 (0.0008) +[2023-10-08 17:57:53,456][21194] Updated weights for policy 1, policy_version 54920 (0.0009) +[2023-10-08 17:57:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 112918528. Throughput: 0: 1755.8, 1: 1726.5. Samples: 28237370. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:57:53,803][19739] Avg episode reward: [(0, '696.890'), (1, '953.690')] +[2023-10-08 17:57:53,822][21194] Updated weights for policy 1, policy_version 54930 (0.0007) +[2023-10-08 17:57:54,186][21194] Updated weights for policy 1, policy_version 54940 (0.0008) +[2023-10-08 17:57:56,931][21195] Updated weights for policy 0, policy_version 55370 (0.0007) +[2023-10-08 17:57:57,302][21195] Updated weights for policy 0, policy_version 55380 (0.0009) +[2023-10-08 17:57:57,659][21195] Updated weights for policy 0, policy_version 55390 (0.0010) +[2023-10-08 17:57:58,182][21194] Updated weights for policy 1, policy_version 54950 (0.0010) +[2023-10-08 17:57:58,544][21194] Updated weights for policy 1, policy_version 54960 (0.0010) +[2023-10-08 17:57:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 112984064. Throughput: 0: 1721.2, 1: 1729.5. Samples: 28257440. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:57:58,803][19739] Avg episode reward: [(0, '696.890'), (1, '953.690')] +[2023-10-08 17:57:58,917][21194] Updated weights for policy 1, policy_version 54970 (0.0010) +[2023-10-08 17:58:01,765][21195] Updated weights for policy 0, policy_version 55400 (0.0009) +[2023-10-08 17:58:02,148][21195] Updated weights for policy 0, policy_version 55410 (0.0008) +[2023-10-08 17:58:02,513][21195] Updated weights for policy 0, policy_version 55420 (0.0009) +[2023-10-08 17:58:02,939][21194] Updated weights for policy 1, policy_version 54980 (0.0008) +[2023-10-08 17:58:03,300][21194] Updated weights for policy 1, policy_version 54990 (0.0007) +[2023-10-08 17:58:03,660][21194] Updated weights for policy 1, policy_version 55000 (0.0008) +[2023-10-08 17:58:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 113049600. Throughput: 0: 1720.6, 1: 1726.3. Samples: 28272760. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:58:03,804][19739] Avg episode reward: [(0, '696.890'), (1, '953.690')] +[2023-10-08 17:58:06,597][21195] Updated weights for policy 0, policy_version 55430 (0.0007) +[2023-10-08 17:58:06,973][21195] Updated weights for policy 0, policy_version 55440 (0.0009) +[2023-10-08 17:58:07,344][21195] Updated weights for policy 0, policy_version 55450 (0.0007) +[2023-10-08 17:58:07,524][21194] Updated weights for policy 1, policy_version 55010 (0.0008) +[2023-10-08 17:58:07,892][21194] Updated weights for policy 1, policy_version 55020 (0.0009) +[2023-10-08 17:58:08,256][21194] Updated weights for policy 1, policy_version 55030 (0.0008) +[2023-10-08 17:58:08,625][21194] Updated weights for policy 1, policy_version 55040 (0.0009) +[2023-10-08 17:58:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 113147904. Throughput: 0: 1737.0, 1: 1730.4. Samples: 28288898. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:58:08,803][19739] Avg episode reward: [(0, '696.890'), (1, '967.420')] +[2023-10-08 17:58:11,346][21195] Updated weights for policy 0, policy_version 55460 (0.0009) +[2023-10-08 17:58:11,716][21195] Updated weights for policy 0, policy_version 55470 (0.0010) +[2023-10-08 17:58:12,088][21195] Updated weights for policy 0, policy_version 55480 (0.0010) +[2023-10-08 17:58:12,601][21194] Updated weights for policy 1, policy_version 55050 (0.0007) +[2023-10-08 17:58:12,964][21194] Updated weights for policy 1, policy_version 55060 (0.0008) +[2023-10-08 17:58:13,326][21194] Updated weights for policy 1, policy_version 55070 (0.0008) +[2023-10-08 17:58:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 113213440. Throughput: 0: 1709.9, 1: 1714.2. Samples: 28308494. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:58:13,804][19739] Avg episode reward: [(0, '696.890'), (1, '967.420')] +[2023-10-08 17:58:15,926][21195] Updated weights for policy 0, policy_version 55490 (0.0008) +[2023-10-08 17:58:16,304][21195] Updated weights for policy 0, policy_version 55500 (0.0007) +[2023-10-08 17:58:16,677][21195] Updated weights for policy 0, policy_version 55510 (0.0007) +[2023-10-08 17:58:17,042][21195] Updated weights for policy 0, policy_version 55520 (0.0007) +[2023-10-08 17:58:17,296][21194] Updated weights for policy 1, policy_version 55080 (0.0008) +[2023-10-08 17:58:17,667][21194] Updated weights for policy 1, policy_version 55090 (0.0007) +[2023-10-08 17:58:18,030][21194] Updated weights for policy 1, policy_version 55100 (0.0010) +[2023-10-08 17:58:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 113278976. Throughput: 0: 1735.8, 1: 1732.4. Samples: 28325016. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:18,803][19739] Avg episode reward: [(0, '696.890'), (1, '952.650')] +[2023-10-08 17:58:20,865][21195] Updated weights for policy 0, policy_version 55530 (0.0009) +[2023-10-08 17:58:21,225][21195] Updated weights for policy 0, policy_version 55540 (0.0010) +[2023-10-08 17:58:21,597][21195] Updated weights for policy 0, policy_version 55550 (0.0010) +[2023-10-08 17:58:21,871][21194] Updated weights for policy 1, policy_version 55110 (0.0010) +[2023-10-08 17:58:22,239][21194] Updated weights for policy 1, policy_version 55120 (0.0008) +[2023-10-08 17:58:22,601][21194] Updated weights for policy 1, policy_version 55130 (0.0010) +[2023-10-08 17:58:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 113344512. Throughput: 0: 1713.9, 1: 1720.0. Samples: 28339896. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:23,803][19739] Avg episode reward: [(0, '698.550'), (1, '952.650')] +[2023-10-08 17:58:25,390][21195] Updated weights for policy 0, policy_version 55560 (0.0008) +[2023-10-08 17:58:25,759][21195] Updated weights for policy 0, policy_version 55570 (0.0009) +[2023-10-08 17:58:26,139][21195] Updated weights for policy 0, policy_version 55580 (0.0010) +[2023-10-08 17:58:26,337][21194] Updated weights for policy 1, policy_version 55140 (0.0007) +[2023-10-08 17:58:26,705][21194] Updated weights for policy 1, policy_version 55150 (0.0008) +[2023-10-08 17:58:27,063][21194] Updated weights for policy 1, policy_version 55160 (0.0008) +[2023-10-08 17:58:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 113410048. Throughput: 0: 1726.6, 1: 1703.1. Samples: 28360744. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:28,803][19739] Avg episode reward: [(0, '698.550'), (1, '952.540')] +[2023-10-08 17:58:30,056][21195] Updated weights for policy 0, policy_version 55590 (0.0008) +[2023-10-08 17:58:30,430][21195] Updated weights for policy 0, policy_version 55600 (0.0007) +[2023-10-08 17:58:30,800][21195] Updated weights for policy 0, policy_version 55610 (0.0007) +[2023-10-08 17:58:31,168][21194] Updated weights for policy 1, policy_version 55170 (0.0008) +[2023-10-08 17:58:31,533][21194] Updated weights for policy 1, policy_version 55180 (0.0008) +[2023-10-08 17:58:31,896][21194] Updated weights for policy 1, policy_version 55190 (0.0009) +[2023-10-08 17:58:32,263][21194] Updated weights for policy 1, policy_version 55200 (0.0010) +[2023-10-08 17:58:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 113475584. Throughput: 0: 1749.8, 1: 1736.7. Samples: 28377790. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:33,803][19739] Avg episode reward: [(0, '709.950'), (1, '952.540')] +[2023-10-08 17:58:34,697][21195] Updated weights for policy 0, policy_version 55620 (0.0009) +[2023-10-08 17:58:35,064][21195] Updated weights for policy 0, policy_version 55630 (0.0009) +[2023-10-08 17:58:35,429][21195] Updated weights for policy 0, policy_version 55640 (0.0008) +[2023-10-08 17:58:36,060][21194] Updated weights for policy 1, policy_version 55210 (0.0009) +[2023-10-08 17:58:36,436][21194] Updated weights for policy 1, policy_version 55220 (0.0011) +[2023-10-08 17:58:36,795][21194] Updated weights for policy 1, policy_version 55230 (0.0009) +[2023-10-08 17:58:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 113541120. Throughput: 0: 1726.6, 1: 1712.5. Samples: 28392132. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:38,803][19739] Avg episode reward: [(0, '709.950'), (1, '952.540')] +[2023-10-08 17:58:39,296][21195] Updated weights for policy 0, policy_version 55650 (0.0010) +[2023-10-08 17:58:39,664][21195] Updated weights for policy 0, policy_version 55660 (0.0008) +[2023-10-08 17:58:40,036][21195] Updated weights for policy 0, policy_version 55670 (0.0007) +[2023-10-08 17:58:40,398][21195] Updated weights for policy 0, policy_version 55680 (0.0009) +[2023-10-08 17:58:40,938][21194] Updated weights for policy 1, policy_version 55240 (0.0010) +[2023-10-08 17:58:41,309][21194] Updated weights for policy 1, policy_version 55250 (0.0008) +[2023-10-08 17:58:41,683][21194] Updated weights for policy 1, policy_version 55260 (0.0007) +[2023-10-08 17:58:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 113606656. Throughput: 0: 1757.6, 1: 1711.0. Samples: 28413528. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:43,803][19739] Avg episode reward: [(0, '709.950'), (1, '952.540')] +[2023-10-08 17:58:44,208][21195] Updated weights for policy 0, policy_version 55690 (0.0008) +[2023-10-08 17:58:44,576][21195] Updated weights for policy 0, policy_version 55700 (0.0008) +[2023-10-08 17:58:44,949][21195] Updated weights for policy 0, policy_version 55710 (0.0009) +[2023-10-08 17:58:45,664][21194] Updated weights for policy 1, policy_version 55270 (0.0008) +[2023-10-08 17:58:46,026][21194] Updated weights for policy 1, policy_version 55280 (0.0008) +[2023-10-08 17:58:46,390][21194] Updated weights for policy 1, policy_version 55290 (0.0008) +[2023-10-08 17:58:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 113672192. Throughput: 0: 1758.2, 1: 1726.1. Samples: 28429554. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:48,803][19739] Avg episode reward: [(0, '709.950'), (1, '967.230')] +[2023-10-08 17:58:48,992][21195] Updated weights for policy 0, policy_version 55720 (0.0008) +[2023-10-08 17:58:49,361][21195] Updated weights for policy 0, policy_version 55730 (0.0010) +[2023-10-08 17:58:49,734][21195] Updated weights for policy 0, policy_version 55740 (0.0009) +[2023-10-08 17:58:50,283][21194] Updated weights for policy 1, policy_version 55300 (0.0008) +[2023-10-08 17:58:50,653][21194] Updated weights for policy 1, policy_version 55310 (0.0007) +[2023-10-08 17:58:51,021][21194] Updated weights for policy 1, policy_version 55320 (0.0008) +[2023-10-08 17:58:53,394][21195] Updated weights for policy 0, policy_version 55750 (0.0010) +[2023-10-08 17:58:53,759][21195] Updated weights for policy 0, policy_version 55760 (0.0008) +[2023-10-08 17:58:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 113737728. Throughput: 0: 1746.4, 1: 1708.8. Samples: 28444386. Policy #0 lag: (min: 23.0, avg: 23.7, max: 41.0) +[2023-10-08 17:58:53,803][19739] Avg episode reward: [(0, '709.950'), (1, '967.230')] +[2023-10-08 17:58:54,135][21195] Updated weights for policy 0, policy_version 55770 (0.0010) +[2023-10-08 17:58:54,959][21194] Updated weights for policy 1, policy_version 55330 (0.0009) +[2023-10-08 17:58:55,326][21194] Updated weights for policy 1, policy_version 55340 (0.0008) +[2023-10-08 17:58:55,686][21194] Updated weights for policy 1, policy_version 55350 (0.0010) +[2023-10-08 17:58:56,059][21194] Updated weights for policy 1, policy_version 55360 (0.0007) +[2023-10-08 17:58:58,126][21195] Updated weights for policy 0, policy_version 55780 (0.0010) +[2023-10-08 17:58:58,489][21195] Updated weights for policy 0, policy_version 55790 (0.0009) +[2023-10-08 17:58:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 113803264. Throughput: 0: 1764.4, 1: 1733.0. Samples: 28465876. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:58:58,803][19739] Avg episode reward: [(0, '709.950'), (1, '967.230')] +[2023-10-08 17:58:58,860][21195] Updated weights for policy 0, policy_version 55800 (0.0010) +[2023-10-08 17:58:59,994][21194] Updated weights for policy 1, policy_version 55370 (0.0009) +[2023-10-08 17:59:00,367][21194] Updated weights for policy 1, policy_version 55380 (0.0007) +[2023-10-08 17:59:00,733][21194] Updated weights for policy 1, policy_version 55390 (0.0007) +[2023-10-08 17:59:02,819][21195] Updated weights for policy 0, policy_version 55810 (0.0010) +[2023-10-08 17:59:03,192][21195] Updated weights for policy 0, policy_version 55820 (0.0007) +[2023-10-08 17:59:03,554][21195] Updated weights for policy 0, policy_version 55830 (0.0009) +[2023-10-08 17:59:03,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 113868800. Throughput: 0: 1734.2, 1: 1714.6. Samples: 28480210. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:59:03,803][19739] Avg episode reward: [(0, '709.950'), (1, '982.250')] +[2023-10-08 17:59:03,920][21195] Updated weights for policy 0, policy_version 55840 (0.0009) +[2023-10-08 17:59:04,618][21194] Updated weights for policy 1, policy_version 55400 (0.0008) +[2023-10-08 17:59:04,990][21194] Updated weights for policy 1, policy_version 55410 (0.0008) +[2023-10-08 17:59:05,361][21194] Updated weights for policy 1, policy_version 55420 (0.0009) +[2023-10-08 17:59:07,915][21195] Updated weights for policy 0, policy_version 55850 (0.0011) +[2023-10-08 17:59:08,278][21195] Updated weights for policy 0, policy_version 55860 (0.0010) +[2023-10-08 17:59:08,649][21195] Updated weights for policy 0, policy_version 55870 (0.0009) +[2023-10-08 17:59:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 113967104. Throughput: 0: 1760.1, 1: 1724.9. Samples: 28496724. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:59:08,803][19739] Avg episode reward: [(0, '709.950'), (1, '982.250')] +[2023-10-08 17:59:09,178][21194] Updated weights for policy 1, policy_version 55430 (0.0008) +[2023-10-08 17:59:09,544][21194] Updated weights for policy 1, policy_version 55440 (0.0009) +[2023-10-08 17:59:09,916][21194] Updated weights for policy 1, policy_version 55450 (0.0009) +[2023-10-08 17:59:12,545][21195] Updated weights for policy 0, policy_version 55880 (0.0008) +[2023-10-08 17:59:12,922][21195] Updated weights for policy 0, policy_version 55890 (0.0007) +[2023-10-08 17:59:13,289][21195] Updated weights for policy 0, policy_version 55900 (0.0007) +[2023-10-08 17:59:13,790][21194] Updated weights for policy 1, policy_version 55460 (0.0009) +[2023-10-08 17:59:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 114032640. Throughput: 0: 1744.2, 1: 1745.6. Samples: 28517786. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:59:13,803][19739] Avg episode reward: [(0, '709.950'), (1, '1012.390')] +[2023-10-08 17:59:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000055904_57245696.pth... +[2023-10-08 17:59:13,842][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000054272_55574528.pth +[2023-10-08 17:59:14,159][21194] Updated weights for policy 1, policy_version 55470 (0.0011) +[2023-10-08 17:59:14,522][21194] Updated weights for policy 1, policy_version 55480 (0.0011) +[2023-10-08 17:59:14,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000055488_56819712.pth... +[2023-10-08 17:59:14,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000053856_55148544.pth +[2023-10-08 17:59:17,260][21195] Updated weights for policy 0, policy_version 55910 (0.0007) +[2023-10-08 17:59:17,630][21195] Updated weights for policy 0, policy_version 55920 (0.0009) +[2023-10-08 17:59:17,996][21195] Updated weights for policy 0, policy_version 55930 (0.0011) +[2023-10-08 17:59:18,656][21194] Updated weights for policy 1, policy_version 55490 (0.0009) +[2023-10-08 17:59:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 114098176. Throughput: 0: 1723.4, 1: 1711.2. Samples: 28532350. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:59:18,803][19739] Avg episode reward: [(0, '709.950'), (1, '1012.390')] +[2023-10-08 17:59:19,024][21194] Updated weights for policy 1, policy_version 55500 (0.0010) +[2023-10-08 17:59:19,381][21194] Updated weights for policy 1, policy_version 55510 (0.0009) +[2023-10-08 17:59:19,758][21194] Updated weights for policy 1, policy_version 55520 (0.0008) +[2023-10-08 17:59:21,910][21195] Updated weights for policy 0, policy_version 55940 (0.0010) +[2023-10-08 17:59:22,281][21195] Updated weights for policy 0, policy_version 55950 (0.0010) +[2023-10-08 17:59:22,646][21195] Updated weights for policy 0, policy_version 55960 (0.0007) +[2023-10-08 17:59:23,581][21194] Updated weights for policy 1, policy_version 55530 (0.0007) +[2023-10-08 17:59:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 114163712. Throughput: 0: 1749.9, 1: 1734.2. Samples: 28548914. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:59:23,803][19739] Avg episode reward: [(0, '709.950'), (1, '1012.390')] +[2023-10-08 17:59:23,942][21194] Updated weights for policy 1, policy_version 55540 (0.0009) +[2023-10-08 17:59:24,305][21194] Updated weights for policy 1, policy_version 55550 (0.0008) +[2023-10-08 17:59:26,362][21195] Updated weights for policy 0, policy_version 55970 (0.0008) +[2023-10-08 17:59:26,727][21195] Updated weights for policy 0, policy_version 55980 (0.0007) +[2023-10-08 17:59:27,093][21195] Updated weights for policy 0, policy_version 55990 (0.0007) +[2023-10-08 17:59:27,459][21195] Updated weights for policy 0, policy_version 56000 (0.0007) +[2023-10-08 17:59:28,143][21194] Updated weights for policy 1, policy_version 55560 (0.0008) +[2023-10-08 17:59:28,514][21194] Updated weights for policy 1, policy_version 55570 (0.0009) +[2023-10-08 17:59:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 114229248. Throughput: 0: 1722.8, 1: 1736.9. Samples: 28569218. Policy #0 lag: (min: 23.0, avg: 31.0, max: 55.0) +[2023-10-08 17:59:28,803][19739] Avg episode reward: [(0, '709.220'), (1, '1012.390')] +[2023-10-08 17:59:28,886][21194] Updated weights for policy 1, policy_version 55580 (0.0007) +[2023-10-08 17:59:31,389][21195] Updated weights for policy 0, policy_version 56010 (0.0007) +[2023-10-08 17:59:31,763][21195] Updated weights for policy 0, policy_version 56020 (0.0008) +[2023-10-08 17:59:32,132][21195] Updated weights for policy 0, policy_version 56030 (0.0010) +[2023-10-08 17:59:32,967][21194] Updated weights for policy 1, policy_version 55590 (0.0008) +[2023-10-08 17:59:33,345][21194] Updated weights for policy 1, policy_version 55600 (0.0008) +[2023-10-08 17:59:33,715][21194] Updated weights for policy 1, policy_version 55610 (0.0010) +[2023-10-08 17:59:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 114294784. Throughput: 0: 1731.7, 1: 1723.3. Samples: 28585030. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:59:33,803][19739] Avg episode reward: [(0, '709.220'), (1, '1012.390')] +[2023-10-08 17:59:35,839][21195] Updated weights for policy 0, policy_version 56040 (0.0010) +[2023-10-08 17:59:36,207][21195] Updated weights for policy 0, policy_version 56050 (0.0010) +[2023-10-08 17:59:36,582][21195] Updated weights for policy 0, policy_version 56060 (0.0008) +[2023-10-08 17:59:37,624][21194] Updated weights for policy 1, policy_version 55620 (0.0011) +[2023-10-08 17:59:37,993][21194] Updated weights for policy 1, policy_version 55630 (0.0007) +[2023-10-08 17:59:38,354][21194] Updated weights for policy 1, policy_version 55640 (0.0008) +[2023-10-08 17:59:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 114393088. Throughput: 0: 1729.4, 1: 1737.2. Samples: 28600382. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:59:38,803][19739] Avg episode reward: [(0, '709.220'), (1, '1012.390')] +[2023-10-08 17:59:40,635][21195] Updated weights for policy 0, policy_version 56070 (0.0008) +[2023-10-08 17:59:40,998][21195] Updated weights for policy 0, policy_version 56080 (0.0010) +[2023-10-08 17:59:41,367][21195] Updated weights for policy 0, policy_version 56090 (0.0011) +[2023-10-08 17:59:42,399][21194] Updated weights for policy 1, policy_version 55650 (0.0008) +[2023-10-08 17:59:42,763][21194] Updated weights for policy 1, policy_version 55660 (0.0008) +[2023-10-08 17:59:43,129][21194] Updated weights for policy 1, policy_version 55670 (0.0008) +[2023-10-08 17:59:43,500][21194] Updated weights for policy 1, policy_version 55680 (0.0008) +[2023-10-08 17:59:43,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 114458624. Throughput: 0: 1732.9, 1: 1717.9. Samples: 28621162. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:59:43,803][19739] Avg episode reward: [(0, '709.220'), (1, '1012.390')] +[2023-10-08 17:59:45,159][21195] Updated weights for policy 0, policy_version 56100 (0.0010) +[2023-10-08 17:59:45,524][21195] Updated weights for policy 0, policy_version 56110 (0.0009) +[2023-10-08 17:59:45,900][21195] Updated weights for policy 0, policy_version 56120 (0.0008) +[2023-10-08 17:59:47,555][21194] Updated weights for policy 1, policy_version 55690 (0.0010) +[2023-10-08 17:59:47,916][21194] Updated weights for policy 1, policy_version 55700 (0.0010) +[2023-10-08 17:59:48,282][21194] Updated weights for policy 1, policy_version 55710 (0.0007) +[2023-10-08 17:59:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 114524160. Throughput: 0: 1762.1, 1: 1731.9. Samples: 28637438. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:59:48,803][19739] Avg episode reward: [(0, '709.220'), (1, '1012.390')] +[2023-10-08 17:59:49,833][21195] Updated weights for policy 0, policy_version 56130 (0.0007) +[2023-10-08 17:59:50,205][21195] Updated weights for policy 0, policy_version 56140 (0.0009) +[2023-10-08 17:59:50,571][21195] Updated weights for policy 0, policy_version 56150 (0.0008) +[2023-10-08 17:59:50,943][21195] Updated weights for policy 0, policy_version 56160 (0.0011) +[2023-10-08 17:59:52,336][21194] Updated weights for policy 1, policy_version 55720 (0.0011) +[2023-10-08 17:59:52,699][21194] Updated weights for policy 1, policy_version 55730 (0.0009) +[2023-10-08 17:59:53,072][21194] Updated weights for policy 1, policy_version 55740 (0.0007) +[2023-10-08 17:59:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 114589696. Throughput: 0: 1734.3, 1: 1732.2. Samples: 28652716. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:59:53,803][19739] Avg episode reward: [(0, '738.440'), (1, '1026.660')] +[2023-10-08 17:59:54,842][21195] Updated weights for policy 0, policy_version 56170 (0.0007) +[2023-10-08 17:59:55,207][21195] Updated weights for policy 0, policy_version 56180 (0.0007) +[2023-10-08 17:59:55,571][21195] Updated weights for policy 0, policy_version 56190 (0.0010) +[2023-10-08 17:59:57,127][21194] Updated weights for policy 1, policy_version 55750 (0.0007) +[2023-10-08 17:59:57,493][21194] Updated weights for policy 1, policy_version 55760 (0.0007) +[2023-10-08 17:59:57,852][21194] Updated weights for policy 1, policy_version 55770 (0.0007) +[2023-10-08 17:59:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 114655232. Throughput: 0: 1749.5, 1: 1695.0. Samples: 28672790. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 17:59:58,803][19739] Avg episode reward: [(0, '738.440'), (1, '1027.070')] +[2023-10-08 17:59:59,531][21195] Updated weights for policy 0, policy_version 56200 (0.0010) +[2023-10-08 17:59:59,918][21195] Updated weights for policy 0, policy_version 56210 (0.0010) +[2023-10-08 18:00:00,281][21195] Updated weights for policy 0, policy_version 56220 (0.0008) +[2023-10-08 18:00:01,697][21194] Updated weights for policy 1, policy_version 55780 (0.0010) +[2023-10-08 18:00:02,070][21194] Updated weights for policy 1, policy_version 55790 (0.0010) +[2023-10-08 18:00:02,432][21194] Updated weights for policy 1, policy_version 55800 (0.0009) +[2023-10-08 18:00:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 114720768. Throughput: 0: 1767.7, 1: 1726.2. Samples: 28689576. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:00:03,803][19739] Avg episode reward: [(0, '738.720'), (1, '1026.980')] +[2023-10-08 18:00:04,086][21195] Updated weights for policy 0, policy_version 56230 (0.0008) +[2023-10-08 18:00:04,447][21195] Updated weights for policy 0, policy_version 56240 (0.0010) +[2023-10-08 18:00:04,811][21195] Updated weights for policy 0, policy_version 56250 (0.0011) +[2023-10-08 18:00:06,295][21194] Updated weights for policy 1, policy_version 55810 (0.0008) +[2023-10-08 18:00:06,656][21194] Updated weights for policy 1, policy_version 55820 (0.0008) +[2023-10-08 18:00:07,029][21194] Updated weights for policy 1, policy_version 55830 (0.0010) +[2023-10-08 18:00:07,380][21194] Updated weights for policy 1, policy_version 55840 (0.0011) +[2023-10-08 18:00:08,531][21195] Updated weights for policy 0, policy_version 56260 (0.0009) +[2023-10-08 18:00:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 114786304. Throughput: 0: 1738.8, 1: 1707.4. Samples: 28703994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:00:08,803][19739] Avg episode reward: [(0, '754.020'), (1, '1026.980')] +[2023-10-08 18:00:08,906][21195] Updated weights for policy 0, policy_version 56270 (0.0008) +[2023-10-08 18:00:09,278][21195] Updated weights for policy 0, policy_version 56280 (0.0010) +[2023-10-08 18:00:11,662][21194] Updated weights for policy 1, policy_version 55850 (0.0008) +[2023-10-08 18:00:12,028][21194] Updated weights for policy 1, policy_version 55860 (0.0008) +[2023-10-08 18:00:12,392][21194] Updated weights for policy 1, policy_version 55870 (0.0008) +[2023-10-08 18:00:13,240][21195] Updated weights for policy 0, policy_version 56290 (0.0009) +[2023-10-08 18:00:13,620][21195] Updated weights for policy 0, policy_version 56300 (0.0008) +[2023-10-08 18:00:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 114851840. Throughput: 0: 1765.4, 1: 1693.8. Samples: 28724884. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:13,804][19739] Avg episode reward: [(0, '725.010'), (1, '1026.980')] +[2023-10-08 18:00:13,985][21195] Updated weights for policy 0, policy_version 56310 (0.0009) +[2023-10-08 18:00:14,359][21195] Updated weights for policy 0, policy_version 56320 (0.0008) +[2023-10-08 18:00:16,383][21194] Updated weights for policy 1, policy_version 55880 (0.0010) +[2023-10-08 18:00:16,757][21194] Updated weights for policy 1, policy_version 55890 (0.0009) +[2023-10-08 18:00:17,124][21194] Updated weights for policy 1, policy_version 55900 (0.0007) +[2023-10-08 18:00:18,394][21195] Updated weights for policy 0, policy_version 56330 (0.0011) +[2023-10-08 18:00:18,760][21195] Updated weights for policy 0, policy_version 56340 (0.0008) +[2023-10-08 18:00:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 114917376. Throughput: 0: 1738.8, 1: 1720.2. Samples: 28740684. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:18,803][19739] Avg episode reward: [(0, '709.870'), (1, '1026.980')] +[2023-10-08 18:00:19,121][21195] Updated weights for policy 0, policy_version 56350 (0.0010) +[2023-10-08 18:00:21,072][21194] Updated weights for policy 1, policy_version 55910 (0.0008) +[2023-10-08 18:00:21,442][21194] Updated weights for policy 1, policy_version 55920 (0.0007) +[2023-10-08 18:00:21,807][21194] Updated weights for policy 1, policy_version 55930 (0.0010) +[2023-10-08 18:00:23,063][21195] Updated weights for policy 0, policy_version 56360 (0.0008) +[2023-10-08 18:00:23,431][21195] Updated weights for policy 0, policy_version 56370 (0.0007) +[2023-10-08 18:00:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 114982912. Throughput: 0: 1754.7, 1: 1692.7. Samples: 28755516. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:23,803][19739] Avg episode reward: [(0, '724.660'), (1, '1026.980')] +[2023-10-08 18:00:23,805][21195] Updated weights for policy 0, policy_version 56380 (0.0009) +[2023-10-08 18:00:25,499][21194] Updated weights for policy 1, policy_version 55940 (0.0009) +[2023-10-08 18:00:25,849][21194] Updated weights for policy 1, policy_version 55950 (0.0010) +[2023-10-08 18:00:26,211][21194] Updated weights for policy 1, policy_version 55960 (0.0010) +[2023-10-08 18:00:27,795][21195] Updated weights for policy 0, policy_version 56390 (0.0008) +[2023-10-08 18:00:28,158][21195] Updated weights for policy 0, policy_version 56400 (0.0008) +[2023-10-08 18:00:28,520][21195] Updated weights for policy 0, policy_version 56410 (0.0008) +[2023-10-08 18:00:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 115081216. Throughput: 0: 1745.0, 1: 1717.5. Samples: 28776974. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:28,803][19739] Avg episode reward: [(0, '724.660'), (1, '1026.980')] +[2023-10-08 18:00:30,303][21194] Updated weights for policy 1, policy_version 55970 (0.0009) +[2023-10-08 18:00:30,668][21194] Updated weights for policy 1, policy_version 55980 (0.0008) +[2023-10-08 18:00:31,034][21194] Updated weights for policy 1, policy_version 55990 (0.0012) +[2023-10-08 18:00:31,404][21194] Updated weights for policy 1, policy_version 56000 (0.0008) +[2023-10-08 18:00:32,352][21195] Updated weights for policy 0, policy_version 56420 (0.0010) +[2023-10-08 18:00:32,720][21195] Updated weights for policy 0, policy_version 56430 (0.0008) +[2023-10-08 18:00:33,097][21195] Updated weights for policy 0, policy_version 56440 (0.0008) +[2023-10-08 18:00:33,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 115146752. Throughput: 0: 1718.8, 1: 1710.1. Samples: 28791740. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:33,804][19739] Avg episode reward: [(0, '740.040'), (1, '1026.980')] +[2023-10-08 18:00:35,206][21194] Updated weights for policy 1, policy_version 56010 (0.0007) +[2023-10-08 18:00:35,564][21194] Updated weights for policy 1, policy_version 56020 (0.0010) +[2023-10-08 18:00:35,926][21194] Updated weights for policy 1, policy_version 56030 (0.0007) +[2023-10-08 18:00:37,024][21195] Updated weights for policy 0, policy_version 56450 (0.0007) +[2023-10-08 18:00:37,396][21195] Updated weights for policy 0, policy_version 56460 (0.0008) +[2023-10-08 18:00:37,766][21195] Updated weights for policy 0, policy_version 56470 (0.0007) +[2023-10-08 18:00:38,127][21195] Updated weights for policy 0, policy_version 56480 (0.0010) +[2023-10-08 18:00:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 115212288. Throughput: 0: 1750.2, 1: 1703.8. Samples: 28808144. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:38,803][19739] Avg episode reward: [(0, '739.140'), (1, '1026.980')] +[2023-10-08 18:00:39,934][21194] Updated weights for policy 1, policy_version 56040 (0.0007) +[2023-10-08 18:00:40,295][21194] Updated weights for policy 1, policy_version 56050 (0.0009) +[2023-10-08 18:00:40,672][21194] Updated weights for policy 1, policy_version 56060 (0.0009) +[2023-10-08 18:00:42,051][21195] Updated weights for policy 0, policy_version 56490 (0.0009) +[2023-10-08 18:00:42,415][21195] Updated weights for policy 0, policy_version 56500 (0.0010) +[2023-10-08 18:00:42,778][21195] Updated weights for policy 0, policy_version 56510 (0.0011) +[2023-10-08 18:00:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 115277824. Throughput: 0: 1719.2, 1: 1733.3. Samples: 28828156. Policy #0 lag: (min: 11.0, avg: 11.4, max: 26.0) +[2023-10-08 18:00:43,803][19739] Avg episode reward: [(0, '740.400'), (1, '1027.820')] +[2023-10-08 18:00:44,532][21194] Updated weights for policy 1, policy_version 56070 (0.0008) +[2023-10-08 18:00:44,907][21194] Updated weights for policy 1, policy_version 56080 (0.0007) +[2023-10-08 18:00:45,270][21194] Updated weights for policy 1, policy_version 56090 (0.0007) +[2023-10-08 18:00:46,819][21195] Updated weights for policy 0, policy_version 56520 (0.0008) +[2023-10-08 18:00:47,188][21195] Updated weights for policy 0, policy_version 56530 (0.0007) +[2023-10-08 18:00:47,561][21195] Updated weights for policy 0, policy_version 56540 (0.0008) +[2023-10-08 18:00:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 115343360. Throughput: 0: 1711.4, 1: 1705.5. Samples: 28843336. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:00:48,803][19739] Avg episode reward: [(0, '740.930'), (1, '1027.820')] +[2023-10-08 18:00:49,066][21194] Updated weights for policy 1, policy_version 56100 (0.0010) +[2023-10-08 18:00:49,427][21194] Updated weights for policy 1, policy_version 56110 (0.0007) +[2023-10-08 18:00:49,794][21194] Updated weights for policy 1, policy_version 56120 (0.0009) +[2023-10-08 18:00:51,402][21195] Updated weights for policy 0, policy_version 56550 (0.0008) +[2023-10-08 18:00:51,763][21195] Updated weights for policy 0, policy_version 56560 (0.0008) +[2023-10-08 18:00:52,132][21195] Updated weights for policy 0, policy_version 56570 (0.0010) +[2023-10-08 18:00:53,720][21194] Updated weights for policy 1, policy_version 56130 (0.0009) +[2023-10-08 18:00:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 115408896. Throughput: 0: 1728.7, 1: 1732.6. Samples: 28859754. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:00:53,803][19739] Avg episode reward: [(0, '740.930'), (1, '1027.820')] +[2023-10-08 18:00:54,087][21194] Updated weights for policy 1, policy_version 56140 (0.0009) +[2023-10-08 18:00:54,461][21194] Updated weights for policy 1, policy_version 56150 (0.0009) +[2023-10-08 18:00:54,830][21194] Updated weights for policy 1, policy_version 56160 (0.0008) +[2023-10-08 18:00:56,006][21195] Updated weights for policy 0, policy_version 56580 (0.0008) +[2023-10-08 18:00:56,381][21195] Updated weights for policy 0, policy_version 56590 (0.0007) +[2023-10-08 18:00:56,750][21195] Updated weights for policy 0, policy_version 56600 (0.0010) +[2023-10-08 18:00:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 115474432. Throughput: 0: 1714.3, 1: 1745.2. Samples: 28880560. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:00:58,803][19739] Avg episode reward: [(0, '740.930'), (1, '1027.820')] +[2023-10-08 18:00:58,867][21194] Updated weights for policy 1, policy_version 56170 (0.0009) +[2023-10-08 18:00:59,229][21194] Updated weights for policy 1, policy_version 56180 (0.0007) +[2023-10-08 18:00:59,607][21194] Updated weights for policy 1, policy_version 56190 (0.0010) +[2023-10-08 18:01:00,610][21195] Updated weights for policy 0, policy_version 56610 (0.0009) +[2023-10-08 18:01:00,983][21195] Updated weights for policy 0, policy_version 56620 (0.0007) +[2023-10-08 18:01:01,358][21195] Updated weights for policy 0, policy_version 56630 (0.0007) +[2023-10-08 18:01:01,718][21195] Updated weights for policy 0, policy_version 56640 (0.0008) +[2023-10-08 18:01:03,622][21194] Updated weights for policy 1, policy_version 56200 (0.0010) +[2023-10-08 18:01:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 115539968. Throughput: 0: 1734.2, 1: 1715.6. Samples: 28895928. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:03,803][19739] Avg episode reward: [(0, '740.930'), (1, '1028.380')] +[2023-10-08 18:01:04,003][21194] Updated weights for policy 1, policy_version 56210 (0.0010) +[2023-10-08 18:01:04,379][21194] Updated weights for policy 1, policy_version 56220 (0.0007) +[2023-10-08 18:01:05,614][21195] Updated weights for policy 0, policy_version 56650 (0.0011) +[2023-10-08 18:01:05,971][21195] Updated weights for policy 0, policy_version 56660 (0.0010) +[2023-10-08 18:01:06,343][21195] Updated weights for policy 0, policy_version 56670 (0.0010) +[2023-10-08 18:01:08,291][21194] Updated weights for policy 1, policy_version 56230 (0.0009) +[2023-10-08 18:01:08,659][21194] Updated weights for policy 1, policy_version 56240 (0.0007) +[2023-10-08 18:01:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 115605504. Throughput: 0: 1715.2, 1: 1747.0. Samples: 28911314. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:08,803][19739] Avg episode reward: [(0, '755.860'), (1, '1028.380')] +[2023-10-08 18:01:09,023][21194] Updated weights for policy 1, policy_version 56250 (0.0008) +[2023-10-08 18:01:10,356][21195] Updated weights for policy 0, policy_version 56680 (0.0010) +[2023-10-08 18:01:10,722][21195] Updated weights for policy 0, policy_version 56690 (0.0009) +[2023-10-08 18:01:11,103][21195] Updated weights for policy 0, policy_version 56700 (0.0007) +[2023-10-08 18:01:12,896][21194] Updated weights for policy 1, policy_version 56260 (0.0009) +[2023-10-08 18:01:13,263][21194] Updated weights for policy 1, policy_version 56270 (0.0010) +[2023-10-08 18:01:13,641][21194] Updated weights for policy 1, policy_version 56280 (0.0009) +[2023-10-08 18:01:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 115671040. Throughput: 0: 1722.1, 1: 1733.1. Samples: 28932456. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:13,803][19739] Avg episode reward: [(0, '755.860'), (1, '1028.380')] +[2023-10-08 18:01:13,810][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000056704_58064896.pth... +[2023-10-08 18:01:13,839][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000055072_56393728.pth +[2023-10-08 18:01:13,843][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000056704_58064896.pth +[2023-10-08 18:01:13,923][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000056288_57638912.pth... +[2023-10-08 18:01:13,961][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000054656_55967744.pth +[2023-10-08 18:01:13,965][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000056288_57638912.pth +[2023-10-08 18:01:14,920][21195] Updated weights for policy 0, policy_version 56710 (0.0009) +[2023-10-08 18:01:15,298][21195] Updated weights for policy 0, policy_version 56720 (0.0010) +[2023-10-08 18:01:15,671][21195] Updated weights for policy 0, policy_version 56730 (0.0011) +[2023-10-08 18:01:17,587][21194] Updated weights for policy 1, policy_version 56290 (0.0009) +[2023-10-08 18:01:17,957][21194] Updated weights for policy 1, policy_version 56300 (0.0008) +[2023-10-08 18:01:18,321][21194] Updated weights for policy 1, policy_version 56310 (0.0008) +[2023-10-08 18:01:18,686][21194] Updated weights for policy 1, policy_version 56320 (0.0007) +[2023-10-08 18:01:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 115769344. Throughput: 0: 1745.4, 1: 1730.8. Samples: 28948168. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:18,803][19739] Avg episode reward: [(0, '770.630'), (1, '1028.380')] +[2023-10-08 18:01:19,624][21195] Updated weights for policy 0, policy_version 56740 (0.0009) +[2023-10-08 18:01:19,997][21195] Updated weights for policy 0, policy_version 56750 (0.0007) +[2023-10-08 18:01:20,362][21195] Updated weights for policy 0, policy_version 56760 (0.0008) +[2023-10-08 18:01:22,654][21194] Updated weights for policy 1, policy_version 56330 (0.0007) +[2023-10-08 18:01:23,025][21194] Updated weights for policy 1, policy_version 56340 (0.0009) +[2023-10-08 18:01:23,389][21194] Updated weights for policy 1, policy_version 56350 (0.0010) +[2023-10-08 18:01:23,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 115834880. Throughput: 0: 1713.4, 1: 1736.4. Samples: 28963384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:23,803][19739] Avg episode reward: [(0, '756.770'), (1, '1028.380')] +[2023-10-08 18:01:24,455][21195] Updated weights for policy 0, policy_version 56770 (0.0010) +[2023-10-08 18:01:24,826][21195] Updated weights for policy 0, policy_version 56780 (0.0008) +[2023-10-08 18:01:25,201][21195] Updated weights for policy 0, policy_version 56790 (0.0010) +[2023-10-08 18:01:25,560][21195] Updated weights for policy 0, policy_version 56800 (0.0009) +[2023-10-08 18:01:27,395][21194] Updated weights for policy 1, policy_version 56360 (0.0008) +[2023-10-08 18:01:27,763][21194] Updated weights for policy 1, policy_version 56370 (0.0008) +[2023-10-08 18:01:28,131][21194] Updated weights for policy 1, policy_version 56380 (0.0009) +[2023-10-08 18:01:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 115900416. Throughput: 0: 1741.0, 1: 1720.3. Samples: 28983914. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:28,803][19739] Avg episode reward: [(0, '756.770'), (1, '1028.380')] +[2023-10-08 18:01:29,496][21195] Updated weights for policy 0, policy_version 56810 (0.0009) +[2023-10-08 18:01:29,872][21195] Updated weights for policy 0, policy_version 56820 (0.0008) +[2023-10-08 18:01:30,237][21195] Updated weights for policy 0, policy_version 56830 (0.0009) +[2023-10-08 18:01:32,047][21194] Updated weights for policy 1, policy_version 56390 (0.0010) +[2023-10-08 18:01:32,413][21194] Updated weights for policy 1, policy_version 56400 (0.0010) +[2023-10-08 18:01:32,781][21194] Updated weights for policy 1, policy_version 56410 (0.0008) +[2023-10-08 18:01:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 115965952. Throughput: 0: 1744.8, 1: 1742.1. Samples: 29000248. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:33,803][19739] Avg episode reward: [(0, '770.130'), (1, '1029.820')] +[2023-10-08 18:01:34,152][21195] Updated weights for policy 0, policy_version 56840 (0.0009) +[2023-10-08 18:01:34,521][21195] Updated weights for policy 0, policy_version 56850 (0.0009) +[2023-10-08 18:01:34,893][21195] Updated weights for policy 0, policy_version 56860 (0.0008) +[2023-10-08 18:01:36,779][21194] Updated weights for policy 1, policy_version 56420 (0.0008) +[2023-10-08 18:01:37,143][21194] Updated weights for policy 1, policy_version 56430 (0.0009) +[2023-10-08 18:01:37,506][21194] Updated weights for policy 1, policy_version 56440 (0.0010) +[2023-10-08 18:01:38,775][21195] Updated weights for policy 0, policy_version 56870 (0.0008) +[2023-10-08 18:01:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116031488. Throughput: 0: 1729.6, 1: 1723.6. Samples: 29015148. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:38,803][19739] Avg episode reward: [(0, '770.130'), (1, '1029.820')] +[2023-10-08 18:01:39,149][21195] Updated weights for policy 0, policy_version 56880 (0.0009) +[2023-10-08 18:01:39,524][21195] Updated weights for policy 0, policy_version 56890 (0.0010) +[2023-10-08 18:01:41,561][21194] Updated weights for policy 1, policy_version 56450 (0.0009) +[2023-10-08 18:01:41,922][21194] Updated weights for policy 1, policy_version 56460 (0.0008) +[2023-10-08 18:01:42,292][21194] Updated weights for policy 1, policy_version 56470 (0.0010) +[2023-10-08 18:01:42,660][21194] Updated weights for policy 1, policy_version 56480 (0.0007) +[2023-10-08 18:01:43,423][21195] Updated weights for policy 0, policy_version 56900 (0.0009) +[2023-10-08 18:01:43,797][21195] Updated weights for policy 0, policy_version 56910 (0.0009) +[2023-10-08 18:01:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116097024. Throughput: 0: 1744.0, 1: 1703.0. Samples: 29035674. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:43,803][19739] Avg episode reward: [(0, '770.130'), (1, '1029.820')] +[2023-10-08 18:01:44,157][21195] Updated weights for policy 0, policy_version 56920 (0.0011) +[2023-10-08 18:01:46,598][21194] Updated weights for policy 1, policy_version 56490 (0.0007) +[2023-10-08 18:01:46,960][21194] Updated weights for policy 1, policy_version 56500 (0.0007) +[2023-10-08 18:01:47,324][21194] Updated weights for policy 1, policy_version 56510 (0.0007) +[2023-10-08 18:01:48,078][21195] Updated weights for policy 0, policy_version 56930 (0.0010) +[2023-10-08 18:01:48,449][21195] Updated weights for policy 0, policy_version 56940 (0.0009) +[2023-10-08 18:01:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116162560. Throughput: 0: 1726.5, 1: 1731.9. Samples: 29051558. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:48,803][19739] Avg episode reward: [(0, '770.130'), (1, '1029.820')] +[2023-10-08 18:01:48,830][21195] Updated weights for policy 0, policy_version 56950 (0.0007) +[2023-10-08 18:01:49,194][21195] Updated weights for policy 0, policy_version 56960 (0.0009) +[2023-10-08 18:01:51,315][21194] Updated weights for policy 1, policy_version 56520 (0.0008) +[2023-10-08 18:01:51,672][21194] Updated weights for policy 1, policy_version 56530 (0.0008) +[2023-10-08 18:01:52,042][21194] Updated weights for policy 1, policy_version 56540 (0.0010) +[2023-10-08 18:01:53,020][21195] Updated weights for policy 0, policy_version 56970 (0.0008) +[2023-10-08 18:01:53,387][21195] Updated weights for policy 0, policy_version 56980 (0.0009) +[2023-10-08 18:01:53,761][21195] Updated weights for policy 0, policy_version 56990 (0.0009) +[2023-10-08 18:01:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116228096. Throughput: 0: 1747.9, 1: 1704.8. Samples: 29066688. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:53,803][19739] Avg episode reward: [(0, '770.130'), (1, '1030.240')] +[2023-10-08 18:01:56,079][21194] Updated weights for policy 1, policy_version 56550 (0.0009) +[2023-10-08 18:01:56,454][21194] Updated weights for policy 1, policy_version 56560 (0.0007) +[2023-10-08 18:01:56,827][21194] Updated weights for policy 1, policy_version 56570 (0.0007) +[2023-10-08 18:01:57,670][21195] Updated weights for policy 0, policy_version 57000 (0.0008) +[2023-10-08 18:01:58,040][21195] Updated weights for policy 0, policy_version 57010 (0.0007) +[2023-10-08 18:01:58,399][21195] Updated weights for policy 0, policy_version 57020 (0.0008) +[2023-10-08 18:01:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 116326400. Throughput: 0: 1739.0, 1: 1704.0. Samples: 29087388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:01:58,803][19739] Avg episode reward: [(0, '757.230'), (1, '1044.890')] +[2023-10-08 18:01:58,810][20836] Saving new best policy, reward=1044.890! +[2023-10-08 18:02:00,663][21194] Updated weights for policy 1, policy_version 56580 (0.0008) +[2023-10-08 18:02:01,027][21194] Updated weights for policy 1, policy_version 56590 (0.0009) +[2023-10-08 18:02:01,392][21194] Updated weights for policy 1, policy_version 56600 (0.0008) +[2023-10-08 18:02:02,346][21195] Updated weights for policy 0, policy_version 57030 (0.0009) +[2023-10-08 18:02:02,698][21195] Updated weights for policy 0, policy_version 57040 (0.0009) +[2023-10-08 18:02:03,068][21195] Updated weights for policy 0, policy_version 57050 (0.0010) +[2023-10-08 18:02:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 116391936. Throughput: 0: 1716.5, 1: 1717.1. Samples: 29102678. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:03,803][19739] Avg episode reward: [(0, '757.230'), (1, '1044.890')] +[2023-10-08 18:02:05,223][21194] Updated weights for policy 1, policy_version 56610 (0.0009) +[2023-10-08 18:02:05,584][21194] Updated weights for policy 1, policy_version 56620 (0.0010) +[2023-10-08 18:02:05,954][21194] Updated weights for policy 1, policy_version 56630 (0.0008) +[2023-10-08 18:02:06,313][21194] Updated weights for policy 1, policy_version 56640 (0.0008) +[2023-10-08 18:02:07,043][21195] Updated weights for policy 0, policy_version 57060 (0.0010) +[2023-10-08 18:02:07,419][21195] Updated weights for policy 0, policy_version 57070 (0.0008) +[2023-10-08 18:02:07,794][21195] Updated weights for policy 0, policy_version 57080 (0.0010) +[2023-10-08 18:02:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 116457472. Throughput: 0: 1747.2, 1: 1705.6. Samples: 29118764. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:08,803][19739] Avg episode reward: [(0, '742.760'), (1, '1044.890')] +[2023-10-08 18:02:10,166][21194] Updated weights for policy 1, policy_version 56650 (0.0008) +[2023-10-08 18:02:10,535][21194] Updated weights for policy 1, policy_version 56660 (0.0007) +[2023-10-08 18:02:10,909][21194] Updated weights for policy 1, policy_version 56670 (0.0007) +[2023-10-08 18:02:11,722][21195] Updated weights for policy 0, policy_version 57090 (0.0009) +[2023-10-08 18:02:12,091][21195] Updated weights for policy 0, policy_version 57100 (0.0011) +[2023-10-08 18:02:12,451][21195] Updated weights for policy 0, policy_version 57110 (0.0010) +[2023-10-08 18:02:12,818][21195] Updated weights for policy 0, policy_version 57120 (0.0011) +[2023-10-08 18:02:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 116523008. Throughput: 0: 1716.0, 1: 1737.6. Samples: 29139328. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:13,803][19739] Avg episode reward: [(0, '727.770'), (1, '1044.890')] +[2023-10-08 18:02:14,669][21194] Updated weights for policy 1, policy_version 56680 (0.0010) +[2023-10-08 18:02:15,044][21194] Updated weights for policy 1, policy_version 56690 (0.0008) +[2023-10-08 18:02:15,408][21194] Updated weights for policy 1, policy_version 56700 (0.0007) +[2023-10-08 18:02:16,763][21195] Updated weights for policy 0, policy_version 57130 (0.0008) +[2023-10-08 18:02:17,140][21195] Updated weights for policy 0, policy_version 57140 (0.0007) +[2023-10-08 18:02:17,500][21195] Updated weights for policy 0, policy_version 57150 (0.0007) +[2023-10-08 18:02:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 116588544. Throughput: 0: 1714.5, 1: 1712.8. Samples: 29154476. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:18,803][19739] Avg episode reward: [(0, '727.770'), (1, '1079.260')] +[2023-10-08 18:02:18,804][20836] Saving new best policy, reward=1079.260! +[2023-10-08 18:02:19,376][21194] Updated weights for policy 1, policy_version 56710 (0.0009) +[2023-10-08 18:02:19,747][21194] Updated weights for policy 1, policy_version 56720 (0.0010) +[2023-10-08 18:02:20,129][21194] Updated weights for policy 1, policy_version 56730 (0.0008) +[2023-10-08 18:02:21,461][21195] Updated weights for policy 0, policy_version 57160 (0.0008) +[2023-10-08 18:02:21,833][21195] Updated weights for policy 0, policy_version 57170 (0.0009) +[2023-10-08 18:02:22,199][21195] Updated weights for policy 0, policy_version 57180 (0.0010) +[2023-10-08 18:02:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 116654080. Throughput: 0: 1730.4, 1: 1724.6. Samples: 29170624. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:23,803][19739] Avg episode reward: [(0, '727.770'), (1, '1079.260')] +[2023-10-08 18:02:24,134][21194] Updated weights for policy 1, policy_version 56740 (0.0007) +[2023-10-08 18:02:24,502][21194] Updated weights for policy 1, policy_version 56750 (0.0009) +[2023-10-08 18:02:24,883][21194] Updated weights for policy 1, policy_version 56760 (0.0007) +[2023-10-08 18:02:26,020][21195] Updated weights for policy 0, policy_version 57190 (0.0010) +[2023-10-08 18:02:26,394][21195] Updated weights for policy 0, policy_version 57200 (0.0007) +[2023-10-08 18:02:26,771][21195] Updated weights for policy 0, policy_version 57210 (0.0008) +[2023-10-08 18:02:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 116719616. Throughput: 0: 1721.3, 1: 1747.6. Samples: 29191776. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:28,804][19739] Avg episode reward: [(0, '727.770'), (1, '1064.410')] +[2023-10-08 18:02:28,872][21194] Updated weights for policy 1, policy_version 56770 (0.0008) +[2023-10-08 18:02:29,235][21194] Updated weights for policy 1, policy_version 56780 (0.0007) +[2023-10-08 18:02:29,595][21194] Updated weights for policy 1, policy_version 56790 (0.0008) +[2023-10-08 18:02:29,967][21194] Updated weights for policy 1, policy_version 56800 (0.0009) +[2023-10-08 18:02:30,608][21195] Updated weights for policy 0, policy_version 57220 (0.0007) +[2023-10-08 18:02:30,970][21195] Updated weights for policy 0, policy_version 57230 (0.0008) +[2023-10-08 18:02:31,333][21195] Updated weights for policy 0, policy_version 57240 (0.0007) +[2023-10-08 18:02:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 116785152. Throughput: 0: 1740.8, 1: 1719.9. Samples: 29207292. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:33,803][19739] Avg episode reward: [(0, '743.040'), (1, '1079.250')] +[2023-10-08 18:02:33,947][21194] Updated weights for policy 1, policy_version 56810 (0.0009) +[2023-10-08 18:02:34,319][21194] Updated weights for policy 1, policy_version 56820 (0.0011) +[2023-10-08 18:02:34,697][21194] Updated weights for policy 1, policy_version 56830 (0.0010) +[2023-10-08 18:02:35,124][21195] Updated weights for policy 0, policy_version 57250 (0.0008) +[2023-10-08 18:02:35,501][21195] Updated weights for policy 0, policy_version 57260 (0.0010) +[2023-10-08 18:02:35,862][21195] Updated weights for policy 0, policy_version 57270 (0.0008) +[2023-10-08 18:02:36,229][21195] Updated weights for policy 0, policy_version 57280 (0.0008) +[2023-10-08 18:02:38,671][21194] Updated weights for policy 1, policy_version 56840 (0.0011) +[2023-10-08 18:02:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116850688. Throughput: 0: 1723.0, 1: 1744.4. Samples: 29222720. Policy #0 lag: (min: 16.0, avg: 42.6, max: 48.0) +[2023-10-08 18:02:38,803][19739] Avg episode reward: [(0, '743.040'), (1, '1064.210')] +[2023-10-08 18:02:39,039][21194] Updated weights for policy 1, policy_version 56850 (0.0010) +[2023-10-08 18:02:39,404][21194] Updated weights for policy 1, policy_version 56860 (0.0007) +[2023-10-08 18:02:40,135][21195] Updated weights for policy 0, policy_version 57290 (0.0009) +[2023-10-08 18:02:40,498][21195] Updated weights for policy 0, policy_version 57300 (0.0008) +[2023-10-08 18:02:40,861][21195] Updated weights for policy 0, policy_version 57310 (0.0008) +[2023-10-08 18:02:43,426][21194] Updated weights for policy 1, policy_version 56870 (0.0008) +[2023-10-08 18:02:43,796][21194] Updated weights for policy 1, policy_version 56880 (0.0009) +[2023-10-08 18:02:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116916224. Throughput: 0: 1733.1, 1: 1749.6. Samples: 29244112. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:02:43,803][19739] Avg episode reward: [(0, '743.260'), (1, '1064.210')] +[2023-10-08 18:02:44,161][21194] Updated weights for policy 1, policy_version 56890 (0.0009) +[2023-10-08 18:02:44,839][21195] Updated weights for policy 0, policy_version 57320 (0.0009) +[2023-10-08 18:02:45,215][21195] Updated weights for policy 0, policy_version 57330 (0.0009) +[2023-10-08 18:02:45,578][21195] Updated weights for policy 0, policy_version 57340 (0.0008) +[2023-10-08 18:02:47,998][21194] Updated weights for policy 1, policy_version 56900 (0.0008) +[2023-10-08 18:02:48,367][21194] Updated weights for policy 1, policy_version 56910 (0.0008) +[2023-10-08 18:02:48,732][21194] Updated weights for policy 1, policy_version 56920 (0.0007) +[2023-10-08 18:02:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 116981760. Throughput: 0: 1747.2, 1: 1730.0. Samples: 29259154. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:02:48,803][19739] Avg episode reward: [(0, '743.260'), (1, '1050.790')] +[2023-10-08 18:02:49,572][21195] Updated weights for policy 0, policy_version 57350 (0.0009) +[2023-10-08 18:02:49,951][21195] Updated weights for policy 0, policy_version 57360 (0.0010) +[2023-10-08 18:02:50,315][21195] Updated weights for policy 0, policy_version 57370 (0.0011) +[2023-10-08 18:02:52,642][21194] Updated weights for policy 1, policy_version 56930 (0.0010) +[2023-10-08 18:02:53,008][21194] Updated weights for policy 1, policy_version 56940 (0.0007) +[2023-10-08 18:02:53,384][21194] Updated weights for policy 1, policy_version 56950 (0.0009) +[2023-10-08 18:02:53,742][21194] Updated weights for policy 1, policy_version 56960 (0.0008) +[2023-10-08 18:02:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 117080064. Throughput: 0: 1719.6, 1: 1740.8. Samples: 29274484. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:02:53,803][19739] Avg episode reward: [(0, '743.260'), (1, '1050.790')] +[2023-10-08 18:02:54,256][21195] Updated weights for policy 0, policy_version 57380 (0.0010) +[2023-10-08 18:02:54,615][21195] Updated weights for policy 0, policy_version 57390 (0.0011) +[2023-10-08 18:02:54,980][21195] Updated weights for policy 0, policy_version 57400 (0.0010) +[2023-10-08 18:02:57,687][21194] Updated weights for policy 1, policy_version 56970 (0.0009) +[2023-10-08 18:02:58,060][21194] Updated weights for policy 1, policy_version 56980 (0.0009) +[2023-10-08 18:02:58,429][21194] Updated weights for policy 1, policy_version 56990 (0.0009) +[2023-10-08 18:02:58,788][21195] Updated weights for policy 0, policy_version 57410 (0.0008) +[2023-10-08 18:02:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 117145600. Throughput: 0: 1753.7, 1: 1712.2. Samples: 29295292. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:02:58,803][19739] Avg episode reward: [(0, '743.260'), (1, '1076.060')] +[2023-10-08 18:02:59,162][21195] Updated weights for policy 0, policy_version 57420 (0.0010) +[2023-10-08 18:02:59,531][21195] Updated weights for policy 0, policy_version 57430 (0.0010) +[2023-10-08 18:02:59,902][21195] Updated weights for policy 0, policy_version 57440 (0.0010) +[2023-10-08 18:03:02,270][21194] Updated weights for policy 1, policy_version 57000 (0.0008) +[2023-10-08 18:03:02,636][21194] Updated weights for policy 1, policy_version 57010 (0.0007) +[2023-10-08 18:03:03,014][21194] Updated weights for policy 1, policy_version 57020 (0.0008) +[2023-10-08 18:03:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 117211136. Throughput: 0: 1752.5, 1: 1731.8. Samples: 29311270. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:03:03,803][19739] Avg episode reward: [(0, '743.260'), (1, '1061.500')] +[2023-10-08 18:03:03,853][21195] Updated weights for policy 0, policy_version 57450 (0.0009) +[2023-10-08 18:03:04,229][21195] Updated weights for policy 0, policy_version 57460 (0.0008) +[2023-10-08 18:03:04,590][21195] Updated weights for policy 0, policy_version 57470 (0.0007) +[2023-10-08 18:03:06,864][21194] Updated weights for policy 1, policy_version 57030 (0.0010) +[2023-10-08 18:03:07,228][21194] Updated weights for policy 1, policy_version 57040 (0.0007) +[2023-10-08 18:03:07,599][21194] Updated weights for policy 1, policy_version 57050 (0.0007) +[2023-10-08 18:03:08,581][21195] Updated weights for policy 0, policy_version 57480 (0.0008) +[2023-10-08 18:03:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 117276672. Throughput: 0: 1742.2, 1: 1724.9. Samples: 29326642. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:03:08,803][19739] Avg episode reward: [(0, '743.260'), (1, '1076.610')] +[2023-10-08 18:03:08,949][21195] Updated weights for policy 0, policy_version 57490 (0.0008) +[2023-10-08 18:03:09,322][21195] Updated weights for policy 0, policy_version 57500 (0.0008) +[2023-10-08 18:03:11,653][21194] Updated weights for policy 1, policy_version 57060 (0.0008) +[2023-10-08 18:03:12,024][21194] Updated weights for policy 1, policy_version 57070 (0.0007) +[2023-10-08 18:03:12,383][21194] Updated weights for policy 1, policy_version 57080 (0.0007) +[2023-10-08 18:03:13,249][21195] Updated weights for policy 0, policy_version 57510 (0.0009) +[2023-10-08 18:03:13,622][21195] Updated weights for policy 0, policy_version 57520 (0.0010) +[2023-10-08 18:03:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 117342208. Throughput: 0: 1748.9, 1: 1704.8. Samples: 29347190. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:03:13,803][19739] Avg episode reward: [(0, '743.260'), (1, '1076.610')] +[2023-10-08 18:03:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000057088_58458112.pth... +[2023-10-08 18:03:13,845][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000055488_56819712.pth +[2023-10-08 18:03:13,986][21195] Updated weights for policy 0, policy_version 57530 (0.0010) +[2023-10-08 18:03:14,206][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000057536_58916864.pth... +[2023-10-08 18:03:14,234][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000055904_57245696.pth +[2023-10-08 18:03:16,390][21194] Updated weights for policy 1, policy_version 57090 (0.0008) +[2023-10-08 18:03:16,754][21194] Updated weights for policy 1, policy_version 57100 (0.0007) +[2023-10-08 18:03:17,122][21194] Updated weights for policy 1, policy_version 57110 (0.0009) +[2023-10-08 18:03:17,495][21194] Updated weights for policy 1, policy_version 57120 (0.0009) +[2023-10-08 18:03:17,951][21195] Updated weights for policy 0, policy_version 57540 (0.0009) +[2023-10-08 18:03:18,331][21195] Updated weights for policy 0, policy_version 57550 (0.0009) +[2023-10-08 18:03:18,699][21195] Updated weights for policy 0, policy_version 57560 (0.0007) +[2023-10-08 18:03:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 117407744. Throughput: 0: 1720.4, 1: 1734.0. Samples: 29362738. Policy #0 lag: (min: 31.0, avg: 37.4, max: 63.0) +[2023-10-08 18:03:18,803][19739] Avg episode reward: [(0, '743.260'), (1, '1063.200')] +[2023-10-08 18:03:21,399][21194] Updated weights for policy 1, policy_version 57130 (0.0009) +[2023-10-08 18:03:21,775][21194] Updated weights for policy 1, policy_version 57140 (0.0009) +[2023-10-08 18:03:22,149][21194] Updated weights for policy 1, policy_version 57150 (0.0011) +[2023-10-08 18:03:22,601][21195] Updated weights for policy 0, policy_version 57570 (0.0007) +[2023-10-08 18:03:22,958][21195] Updated weights for policy 0, policy_version 57580 (0.0008) +[2023-10-08 18:03:23,335][21195] Updated weights for policy 0, policy_version 57590 (0.0009) +[2023-10-08 18:03:23,704][21195] Updated weights for policy 0, policy_version 57600 (0.0008) +[2023-10-08 18:03:23,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 117506048. Throughput: 0: 1740.0, 1: 1711.4. Samples: 29378032. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:23,803][19739] Avg episode reward: [(0, '743.260'), (1, '1063.550')] +[2023-10-08 18:03:26,103][21194] Updated weights for policy 1, policy_version 57160 (0.0008) +[2023-10-08 18:03:26,465][21194] Updated weights for policy 1, policy_version 57170 (0.0007) +[2023-10-08 18:03:26,828][21194] Updated weights for policy 1, policy_version 57180 (0.0008) +[2023-10-08 18:03:27,772][21195] Updated weights for policy 0, policy_version 57610 (0.0007) +[2023-10-08 18:03:28,137][21195] Updated weights for policy 0, policy_version 57620 (0.0008) +[2023-10-08 18:03:28,509][21195] Updated weights for policy 0, policy_version 57630 (0.0008) +[2023-10-08 18:03:28,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 117571584. Throughput: 0: 1727.9, 1: 1703.8. Samples: 29398538. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:28,803][19739] Avg episode reward: [(0, '743.260'), (1, '1063.550')] +[2023-10-08 18:03:30,995][21194] Updated weights for policy 1, policy_version 57190 (0.0009) +[2023-10-08 18:03:31,391][21194] Updated weights for policy 1, policy_version 57200 (0.0009) +[2023-10-08 18:03:31,751][21194] Updated weights for policy 1, policy_version 57210 (0.0008) +[2023-10-08 18:03:32,411][21195] Updated weights for policy 0, policy_version 57640 (0.0007) +[2023-10-08 18:03:32,794][21195] Updated weights for policy 0, policy_version 57650 (0.0007) +[2023-10-08 18:03:33,164][21195] Updated weights for policy 0, policy_version 57660 (0.0007) +[2023-10-08 18:03:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 117637120. Throughput: 0: 1710.4, 1: 1728.9. Samples: 29413924. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:33,803][19739] Avg episode reward: [(0, '743.610'), (1, '1063.550')] +[2023-10-08 18:03:35,706][21194] Updated weights for policy 1, policy_version 57220 (0.0009) +[2023-10-08 18:03:36,065][21194] Updated weights for policy 1, policy_version 57230 (0.0008) +[2023-10-08 18:03:36,426][21194] Updated weights for policy 1, policy_version 57240 (0.0007) +[2023-10-08 18:03:37,020][21195] Updated weights for policy 0, policy_version 57670 (0.0010) +[2023-10-08 18:03:37,385][21195] Updated weights for policy 0, policy_version 57680 (0.0009) +[2023-10-08 18:03:37,756][21195] Updated weights for policy 0, policy_version 57690 (0.0008) +[2023-10-08 18:03:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 117702656. Throughput: 0: 1742.2, 1: 1708.3. Samples: 29429756. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:38,803][19739] Avg episode reward: [(0, '743.610'), (1, '1063.550')] +[2023-10-08 18:03:40,263][21194] Updated weights for policy 1, policy_version 57250 (0.0008) +[2023-10-08 18:03:40,630][21194] Updated weights for policy 1, policy_version 57260 (0.0008) +[2023-10-08 18:03:40,990][21194] Updated weights for policy 1, policy_version 57270 (0.0008) +[2023-10-08 18:03:41,352][21194] Updated weights for policy 1, policy_version 57280 (0.0008) +[2023-10-08 18:03:41,754][21195] Updated weights for policy 0, policy_version 57700 (0.0009) +[2023-10-08 18:03:42,120][21195] Updated weights for policy 0, policy_version 57710 (0.0008) +[2023-10-08 18:03:42,485][21195] Updated weights for policy 0, policy_version 57720 (0.0009) +[2023-10-08 18:03:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 117768192. Throughput: 0: 1709.7, 1: 1731.7. Samples: 29450154. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:43,803][19739] Avg episode reward: [(0, '743.610'), (1, '1063.550')] +[2023-10-08 18:03:45,123][21194] Updated weights for policy 1, policy_version 57290 (0.0008) +[2023-10-08 18:03:45,487][21194] Updated weights for policy 1, policy_version 57300 (0.0007) +[2023-10-08 18:03:45,856][21194] Updated weights for policy 1, policy_version 57310 (0.0009) +[2023-10-08 18:03:46,433][21195] Updated weights for policy 0, policy_version 57730 (0.0009) +[2023-10-08 18:03:46,804][21195] Updated weights for policy 0, policy_version 57740 (0.0010) +[2023-10-08 18:03:47,181][21195] Updated weights for policy 0, policy_version 57750 (0.0009) +[2023-10-08 18:03:47,557][21195] Updated weights for policy 0, policy_version 57760 (0.0007) +[2023-10-08 18:03:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 117833728. Throughput: 0: 1706.9, 1: 1712.2. Samples: 29465132. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:48,803][19739] Avg episode reward: [(0, '743.610'), (1, '1063.550')] +[2023-10-08 18:03:49,741][21194] Updated weights for policy 1, policy_version 57320 (0.0009) +[2023-10-08 18:03:50,104][21194] Updated weights for policy 1, policy_version 57330 (0.0008) +[2023-10-08 18:03:50,472][21194] Updated weights for policy 1, policy_version 57340 (0.0008) +[2023-10-08 18:03:51,556][21195] Updated weights for policy 0, policy_version 57770 (0.0008) +[2023-10-08 18:03:51,919][21195] Updated weights for policy 0, policy_version 57780 (0.0010) +[2023-10-08 18:03:52,291][21195] Updated weights for policy 0, policy_version 57790 (0.0009) +[2023-10-08 18:03:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 117899264. Throughput: 0: 1716.9, 1: 1722.7. Samples: 29481422. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:03:53,803][19739] Avg episode reward: [(0, '743.610'), (1, '1063.550')] +[2023-10-08 18:03:54,355][21194] Updated weights for policy 1, policy_version 57350 (0.0008) +[2023-10-08 18:03:54,722][21194] Updated weights for policy 1, policy_version 57360 (0.0009) +[2023-10-08 18:03:55,097][21194] Updated weights for policy 1, policy_version 57370 (0.0009) +[2023-10-08 18:03:55,994][21195] Updated weights for policy 0, policy_version 57800 (0.0007) +[2023-10-08 18:03:56,358][21195] Updated weights for policy 0, policy_version 57810 (0.0007) +[2023-10-08 18:03:56,730][21195] Updated weights for policy 0, policy_version 57820 (0.0007) +[2023-10-08 18:03:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 117964800. Throughput: 0: 1710.7, 1: 1745.6. Samples: 29502724. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:03:58,803][19739] Avg episode reward: [(0, '743.620'), (1, '1063.550')] +[2023-10-08 18:03:58,992][21194] Updated weights for policy 1, policy_version 57380 (0.0009) +[2023-10-08 18:03:59,370][21194] Updated weights for policy 1, policy_version 57390 (0.0007) +[2023-10-08 18:03:59,735][21194] Updated weights for policy 1, policy_version 57400 (0.0008) +[2023-10-08 18:04:00,544][21195] Updated weights for policy 0, policy_version 57830 (0.0007) +[2023-10-08 18:04:00,903][21195] Updated weights for policy 0, policy_version 57840 (0.0007) +[2023-10-08 18:04:01,274][21195] Updated weights for policy 0, policy_version 57850 (0.0010) +[2023-10-08 18:04:03,719][21194] Updated weights for policy 1, policy_version 57410 (0.0011) +[2023-10-08 18:04:03,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 118030336. Throughput: 0: 1736.4, 1: 1715.2. Samples: 29518058. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:03,803][19739] Avg episode reward: [(0, '758.150'), (1, '1063.540')] +[2023-10-08 18:04:04,086][21194] Updated weights for policy 1, policy_version 57420 (0.0007) +[2023-10-08 18:04:04,445][21194] Updated weights for policy 1, policy_version 57430 (0.0007) +[2023-10-08 18:04:04,809][21194] Updated weights for policy 1, policy_version 57440 (0.0009) +[2023-10-08 18:04:05,245][21195] Updated weights for policy 0, policy_version 57860 (0.0008) +[2023-10-08 18:04:05,604][21195] Updated weights for policy 0, policy_version 57870 (0.0010) +[2023-10-08 18:04:05,977][21195] Updated weights for policy 0, policy_version 57880 (0.0008) +[2023-10-08 18:04:08,748][21194] Updated weights for policy 1, policy_version 57450 (0.0009) +[2023-10-08 18:04:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 118095872. Throughput: 0: 1713.0, 1: 1735.9. Samples: 29533234. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:08,803][19739] Avg episode reward: [(0, '786.910'), (1, '1077.870')] +[2023-10-08 18:04:09,114][21194] Updated weights for policy 1, policy_version 57460 (0.0008) +[2023-10-08 18:04:09,476][21194] Updated weights for policy 1, policy_version 57470 (0.0008) +[2023-10-08 18:04:10,038][21195] Updated weights for policy 0, policy_version 57890 (0.0007) +[2023-10-08 18:04:10,406][21195] Updated weights for policy 0, policy_version 57900 (0.0009) +[2023-10-08 18:04:10,775][21195] Updated weights for policy 0, policy_version 57910 (0.0007) +[2023-10-08 18:04:11,140][21195] Updated weights for policy 0, policy_version 57920 (0.0009) +[2023-10-08 18:04:13,416][21194] Updated weights for policy 1, policy_version 57480 (0.0009) +[2023-10-08 18:04:13,779][21194] Updated weights for policy 1, policy_version 57490 (0.0009) +[2023-10-08 18:04:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 118161408. Throughput: 0: 1726.7, 1: 1745.7. Samples: 29554796. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:13,803][19739] Avg episode reward: [(0, '786.910'), (1, '1077.870')] +[2023-10-08 18:04:14,153][21194] Updated weights for policy 1, policy_version 57500 (0.0009) +[2023-10-08 18:04:15,044][21195] Updated weights for policy 0, policy_version 57930 (0.0008) +[2023-10-08 18:04:15,417][21195] Updated weights for policy 0, policy_version 57940 (0.0008) +[2023-10-08 18:04:15,778][21195] Updated weights for policy 0, policy_version 57950 (0.0009) +[2023-10-08 18:04:18,051][21194] Updated weights for policy 1, policy_version 57510 (0.0009) +[2023-10-08 18:04:18,425][21194] Updated weights for policy 1, policy_version 57520 (0.0011) +[2023-10-08 18:04:18,791][21194] Updated weights for policy 1, policy_version 57530 (0.0007) +[2023-10-08 18:04:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 118226944. Throughput: 0: 1752.3, 1: 1725.3. Samples: 29570414. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:18,803][19739] Avg episode reward: [(0, '802.280'), (1, '1077.870')] +[2023-10-08 18:04:19,570][21195] Updated weights for policy 0, policy_version 57960 (0.0009) +[2023-10-08 18:04:19,938][21195] Updated weights for policy 0, policy_version 57970 (0.0008) +[2023-10-08 18:04:20,316][21195] Updated weights for policy 0, policy_version 57980 (0.0008) +[2023-10-08 18:04:22,845][21194] Updated weights for policy 1, policy_version 57540 (0.0008) +[2023-10-08 18:04:23,210][21194] Updated weights for policy 1, policy_version 57550 (0.0007) +[2023-10-08 18:04:23,581][21194] Updated weights for policy 1, policy_version 57560 (0.0008) +[2023-10-08 18:04:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 118292480. Throughput: 0: 1720.3, 1: 1745.6. Samples: 29585722. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:23,803][19739] Avg episode reward: [(0, '803.150'), (1, '1077.870')] +[2023-10-08 18:04:24,262][21195] Updated weights for policy 0, policy_version 57990 (0.0010) +[2023-10-08 18:04:24,643][21195] Updated weights for policy 0, policy_version 58000 (0.0009) +[2023-10-08 18:04:25,008][21195] Updated weights for policy 0, policy_version 58010 (0.0008) +[2023-10-08 18:04:27,465][21194] Updated weights for policy 1, policy_version 57570 (0.0008) +[2023-10-08 18:04:27,825][21194] Updated weights for policy 1, policy_version 57580 (0.0010) +[2023-10-08 18:04:28,186][21194] Updated weights for policy 1, policy_version 57590 (0.0008) +[2023-10-08 18:04:28,546][21194] Updated weights for policy 1, policy_version 57600 (0.0012) +[2023-10-08 18:04:28,803][19739] Fps is (10 sec: 16383.5, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 118390784. Throughput: 0: 1747.8, 1: 1724.3. Samples: 29606400. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:28,804][19739] Avg episode reward: [(0, '802.000'), (1, '1077.870')] +[2023-10-08 18:04:28,927][21195] Updated weights for policy 0, policy_version 58020 (0.0009) +[2023-10-08 18:04:29,291][21195] Updated weights for policy 0, policy_version 58030 (0.0008) +[2023-10-08 18:04:29,660][21195] Updated weights for policy 0, policy_version 58040 (0.0009) +[2023-10-08 18:04:32,609][21194] Updated weights for policy 1, policy_version 57610 (0.0008) +[2023-10-08 18:04:32,975][21194] Updated weights for policy 1, policy_version 57620 (0.0007) +[2023-10-08 18:04:33,344][21194] Updated weights for policy 1, policy_version 57630 (0.0009) +[2023-10-08 18:04:33,572][21195] Updated weights for policy 0, policy_version 58050 (0.0009) +[2023-10-08 18:04:33,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 118456320. Throughput: 0: 1750.8, 1: 1741.8. Samples: 29622300. Policy #0 lag: (min: 21.0, avg: 24.1, max: 53.0) +[2023-10-08 18:04:33,803][19739] Avg episode reward: [(0, '789.510'), (1, '1077.870')] +[2023-10-08 18:04:33,945][21195] Updated weights for policy 0, policy_version 58060 (0.0007) +[2023-10-08 18:04:34,321][21195] Updated weights for policy 0, policy_version 58070 (0.0008) +[2023-10-08 18:04:34,690][21195] Updated weights for policy 0, policy_version 58080 (0.0007) +[2023-10-08 18:04:37,358][21194] Updated weights for policy 1, policy_version 57640 (0.0008) +[2023-10-08 18:04:37,734][21194] Updated weights for policy 1, policy_version 57650 (0.0007) +[2023-10-08 18:04:38,093][21194] Updated weights for policy 1, policy_version 57660 (0.0007) +[2023-10-08 18:04:38,615][21195] Updated weights for policy 0, policy_version 58090 (0.0010) +[2023-10-08 18:04:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 118521856. Throughput: 0: 1744.3, 1: 1742.8. Samples: 29638344. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:04:38,804][19739] Avg episode reward: [(0, '774.590'), (1, '1077.870')] +[2023-10-08 18:04:38,981][21195] Updated weights for policy 0, policy_version 58100 (0.0008) +[2023-10-08 18:04:39,336][21195] Updated weights for policy 0, policy_version 58110 (0.0008) +[2023-10-08 18:04:41,931][21194] Updated weights for policy 1, policy_version 57670 (0.0008) +[2023-10-08 18:04:42,312][21194] Updated weights for policy 1, policy_version 57680 (0.0010) +[2023-10-08 18:04:42,673][21194] Updated weights for policy 1, policy_version 57690 (0.0009) +[2023-10-08 18:04:43,272][21195] Updated weights for policy 0, policy_version 58120 (0.0010) +[2023-10-08 18:04:43,637][21195] Updated weights for policy 0, policy_version 58130 (0.0010) +[2023-10-08 18:04:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 118587392. Throughput: 0: 1752.0, 1: 1711.8. Samples: 29658598. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:04:43,803][19739] Avg episode reward: [(0, '774.660'), (1, '1077.870')] +[2023-10-08 18:04:43,994][21195] Updated weights for policy 0, policy_version 58140 (0.0010) +[2023-10-08 18:04:46,543][21194] Updated weights for policy 1, policy_version 57700 (0.0007) +[2023-10-08 18:04:46,908][21194] Updated weights for policy 1, policy_version 57710 (0.0009) +[2023-10-08 18:04:47,271][21194] Updated weights for policy 1, policy_version 57720 (0.0008) +[2023-10-08 18:04:47,745][21195] Updated weights for policy 0, policy_version 58150 (0.0009) +[2023-10-08 18:04:48,114][21195] Updated weights for policy 0, policy_version 58160 (0.0010) +[2023-10-08 18:04:48,489][21195] Updated weights for policy 0, policy_version 58170 (0.0008) +[2023-10-08 18:04:48,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 118685696. Throughput: 0: 1724.1, 1: 1744.1. Samples: 29674128. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:04:48,803][19739] Avg episode reward: [(0, '774.660'), (1, '1077.870')] +[2023-10-08 18:04:51,273][21194] Updated weights for policy 1, policy_version 57730 (0.0009) +[2023-10-08 18:04:51,638][21194] Updated weights for policy 1, policy_version 57740 (0.0009) +[2023-10-08 18:04:52,012][21194] Updated weights for policy 1, policy_version 57750 (0.0009) +[2023-10-08 18:04:52,378][21194] Updated weights for policy 1, policy_version 57760 (0.0008) +[2023-10-08 18:04:52,538][21195] Updated weights for policy 0, policy_version 58180 (0.0009) +[2023-10-08 18:04:52,914][21195] Updated weights for policy 0, policy_version 58190 (0.0010) +[2023-10-08 18:04:53,285][21195] Updated weights for policy 0, policy_version 58200 (0.0007) +[2023-10-08 18:04:53,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 118751232. Throughput: 0: 1756.6, 1: 1723.7. Samples: 29689848. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:04:53,804][19739] Avg episode reward: [(0, '775.550'), (1, '1078.710')] +[2023-10-08 18:04:56,297][21194] Updated weights for policy 1, policy_version 57770 (0.0009) +[2023-10-08 18:04:56,674][21194] Updated weights for policy 1, policy_version 57780 (0.0009) +[2023-10-08 18:04:57,036][21194] Updated weights for policy 1, policy_version 57790 (0.0009) +[2023-10-08 18:04:57,119][21195] Updated weights for policy 0, policy_version 58210 (0.0007) +[2023-10-08 18:04:57,488][21195] Updated weights for policy 0, policy_version 58220 (0.0008) +[2023-10-08 18:04:57,859][21195] Updated weights for policy 0, policy_version 58230 (0.0008) +[2023-10-08 18:04:58,223][21195] Updated weights for policy 0, policy_version 58240 (0.0007) +[2023-10-08 18:04:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 118816768. Throughput: 0: 1736.8, 1: 1712.6. Samples: 29710020. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:04:58,803][19739] Avg episode reward: [(0, '775.550'), (1, '1078.710')] +[2023-10-08 18:05:00,790][21194] Updated weights for policy 1, policy_version 57800 (0.0009) +[2023-10-08 18:05:01,163][21194] Updated weights for policy 1, policy_version 57810 (0.0008) +[2023-10-08 18:05:01,532][21194] Updated weights for policy 1, policy_version 57820 (0.0008) +[2023-10-08 18:05:02,077][21195] Updated weights for policy 0, policy_version 58250 (0.0010) +[2023-10-08 18:05:02,445][21195] Updated weights for policy 0, policy_version 58260 (0.0009) +[2023-10-08 18:05:02,809][21195] Updated weights for policy 0, policy_version 58270 (0.0008) +[2023-10-08 18:05:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 118882304. Throughput: 0: 1725.9, 1: 1730.5. Samples: 29725952. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:05:03,803][19739] Avg episode reward: [(0, '775.760'), (1, '1078.710')] +[2023-10-08 18:05:05,507][21194] Updated weights for policy 1, policy_version 57830 (0.0008) +[2023-10-08 18:05:05,877][21194] Updated weights for policy 1, policy_version 57840 (0.0009) +[2023-10-08 18:05:06,245][21194] Updated weights for policy 1, policy_version 57850 (0.0008) +[2023-10-08 18:05:06,464][21195] Updated weights for policy 0, policy_version 58280 (0.0008) +[2023-10-08 18:05:06,838][21195] Updated weights for policy 0, policy_version 58290 (0.0008) +[2023-10-08 18:05:07,203][21195] Updated weights for policy 0, policy_version 58300 (0.0008) +[2023-10-08 18:05:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 118947840. Throughput: 0: 1747.2, 1: 1716.0. Samples: 29741566. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 18:05:08,803][19739] Avg episode reward: [(0, '775.760'), (1, '1078.710')] +[2023-10-08 18:05:10,305][21194] Updated weights for policy 1, policy_version 57860 (0.0008) +[2023-10-08 18:05:10,682][21194] Updated weights for policy 1, policy_version 57870 (0.0010) +[2023-10-08 18:05:11,040][21194] Updated weights for policy 1, policy_version 57880 (0.0009) +[2023-10-08 18:05:11,287][21195] Updated weights for policy 0, policy_version 58310 (0.0009) +[2023-10-08 18:05:11,669][21195] Updated weights for policy 0, policy_version 58320 (0.0007) +[2023-10-08 18:05:12,027][21195] Updated weights for policy 0, policy_version 58330 (0.0008) +[2023-10-08 18:05:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 119013376. Throughput: 0: 1734.8, 1: 1730.1. Samples: 29762324. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:13,803][19739] Avg episode reward: [(0, '775.870'), (1, '1078.850')] +[2023-10-08 18:05:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000057888_59277312.pth... +[2023-10-08 18:05:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000058336_59736064.pth... +[2023-10-08 18:05:13,853][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000056288_57638912.pth +[2023-10-08 18:05:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000056704_58064896.pth +[2023-10-08 18:05:15,032][21194] Updated weights for policy 1, policy_version 57890 (0.0007) +[2023-10-08 18:05:15,391][21194] Updated weights for policy 1, policy_version 57900 (0.0007) +[2023-10-08 18:05:15,755][21194] Updated weights for policy 1, policy_version 57910 (0.0009) +[2023-10-08 18:05:15,922][21195] Updated weights for policy 0, policy_version 58340 (0.0007) +[2023-10-08 18:05:16,118][21194] Updated weights for policy 1, policy_version 57920 (0.0008) +[2023-10-08 18:05:16,288][21195] Updated weights for policy 0, policy_version 58350 (0.0009) +[2023-10-08 18:05:16,663][21195] Updated weights for policy 0, policy_version 58360 (0.0010) +[2023-10-08 18:05:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 119078912. Throughput: 0: 1736.6, 1: 1716.4. Samples: 29777686. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:18,803][19739] Avg episode reward: [(0, '775.870'), (1, '1078.850')] +[2023-10-08 18:05:19,828][21194] Updated weights for policy 1, policy_version 57930 (0.0008) +[2023-10-08 18:05:20,198][21194] Updated weights for policy 1, policy_version 57940 (0.0009) +[2023-10-08 18:05:20,557][21194] Updated weights for policy 1, policy_version 57950 (0.0011) +[2023-10-08 18:05:20,733][21195] Updated weights for policy 0, policy_version 58370 (0.0009) +[2023-10-08 18:05:21,097][21195] Updated weights for policy 0, policy_version 58380 (0.0008) +[2023-10-08 18:05:21,465][21195] Updated weights for policy 0, policy_version 58390 (0.0009) +[2023-10-08 18:05:21,828][21195] Updated weights for policy 0, policy_version 58400 (0.0008) +[2023-10-08 18:05:23,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 119144448. Throughput: 0: 1726.8, 1: 1711.3. Samples: 29793058. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:23,803][19739] Avg episode reward: [(0, '775.870'), (1, '1078.850')] +[2023-10-08 18:05:24,724][21194] Updated weights for policy 1, policy_version 57960 (0.0010) +[2023-10-08 18:05:25,086][21194] Updated weights for policy 1, policy_version 57970 (0.0009) +[2023-10-08 18:05:25,449][21194] Updated weights for policy 1, policy_version 57980 (0.0009) +[2023-10-08 18:05:25,514][21195] Updated weights for policy 0, policy_version 58410 (0.0009) +[2023-10-08 18:05:25,878][21195] Updated weights for policy 0, policy_version 58420 (0.0008) +[2023-10-08 18:05:26,240][21195] Updated weights for policy 0, policy_version 58430 (0.0007) +[2023-10-08 18:05:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 119209984. Throughput: 0: 1729.5, 1: 1736.0. Samples: 29814544. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:28,803][19739] Avg episode reward: [(0, '776.170'), (1, '1078.850')] +[2023-10-08 18:05:29,474][21194] Updated weights for policy 1, policy_version 57990 (0.0008) +[2023-10-08 18:05:29,835][21194] Updated weights for policy 1, policy_version 58000 (0.0007) +[2023-10-08 18:05:30,198][21194] Updated weights for policy 1, policy_version 58010 (0.0008) +[2023-10-08 18:05:30,217][21195] Updated weights for policy 0, policy_version 58440 (0.0008) +[2023-10-08 18:05:30,578][21195] Updated weights for policy 0, policy_version 58450 (0.0008) +[2023-10-08 18:05:30,946][21195] Updated weights for policy 0, policy_version 58460 (0.0008) +[2023-10-08 18:05:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 119275520. Throughput: 0: 1765.5, 1: 1702.5. Samples: 29830190. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:33,803][19739] Avg episode reward: [(0, '776.170'), (1, '1078.850')] +[2023-10-08 18:05:34,201][21194] Updated weights for policy 1, policy_version 58020 (0.0007) +[2023-10-08 18:05:34,566][21194] Updated weights for policy 1, policy_version 58030 (0.0008) +[2023-10-08 18:05:34,753][21195] Updated weights for policy 0, policy_version 58470 (0.0008) +[2023-10-08 18:05:34,930][21194] Updated weights for policy 1, policy_version 58040 (0.0008) +[2023-10-08 18:05:35,119][21195] Updated weights for policy 0, policy_version 58480 (0.0009) +[2023-10-08 18:05:35,486][21195] Updated weights for policy 0, policy_version 58490 (0.0009) +[2023-10-08 18:05:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 119341056. Throughput: 0: 1736.7, 1: 1728.5. Samples: 29845780. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:38,803][19739] Avg episode reward: [(0, '761.610'), (1, '1078.850')] +[2023-10-08 18:05:38,907][21194] Updated weights for policy 1, policy_version 58050 (0.0009) +[2023-10-08 18:05:39,281][21194] Updated weights for policy 1, policy_version 58060 (0.0009) +[2023-10-08 18:05:39,494][21195] Updated weights for policy 0, policy_version 58500 (0.0010) +[2023-10-08 18:05:39,638][21194] Updated weights for policy 1, policy_version 58070 (0.0009) +[2023-10-08 18:05:39,869][21195] Updated weights for policy 0, policy_version 58510 (0.0008) +[2023-10-08 18:05:40,007][21194] Updated weights for policy 1, policy_version 58080 (0.0009) +[2023-10-08 18:05:40,227][21195] Updated weights for policy 0, policy_version 58520 (0.0009) +[2023-10-08 18:05:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 119406592. Throughput: 0: 1753.0, 1: 1739.8. Samples: 29867196. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:43,803][19739] Avg episode reward: [(0, '761.610'), (1, '1078.850')] +[2023-10-08 18:05:44,016][21194] Updated weights for policy 1, policy_version 58090 (0.0008) +[2023-10-08 18:05:44,127][21195] Updated weights for policy 0, policy_version 58530 (0.0007) +[2023-10-08 18:05:44,378][21194] Updated weights for policy 1, policy_version 58100 (0.0009) +[2023-10-08 18:05:44,501][21195] Updated weights for policy 0, policy_version 58540 (0.0008) +[2023-10-08 18:05:44,744][21194] Updated weights for policy 1, policy_version 58110 (0.0008) +[2023-10-08 18:05:44,869][21195] Updated weights for policy 0, policy_version 58550 (0.0009) +[2023-10-08 18:05:45,226][21195] Updated weights for policy 0, policy_version 58560 (0.0008) +[2023-10-08 18:05:48,531][21194] Updated weights for policy 1, policy_version 58120 (0.0008) +[2023-10-08 18:05:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 119472128. Throughput: 0: 1761.9, 1: 1717.2. Samples: 29882510. Policy #0 lag: (min: 7.0, avg: 7.6, max: 23.0) +[2023-10-08 18:05:48,803][19739] Avg episode reward: [(0, '761.610'), (1, '1078.720')] +[2023-10-08 18:05:48,898][21194] Updated weights for policy 1, policy_version 58130 (0.0010) +[2023-10-08 18:05:49,159][21195] Updated weights for policy 0, policy_version 58570 (0.0007) +[2023-10-08 18:05:49,263][21194] Updated weights for policy 1, policy_version 58140 (0.0009) +[2023-10-08 18:05:49,533][21195] Updated weights for policy 0, policy_version 58580 (0.0009) +[2023-10-08 18:05:49,893][21195] Updated weights for policy 0, policy_version 58590 (0.0011) +[2023-10-08 18:05:53,211][21194] Updated weights for policy 1, policy_version 58150 (0.0008) +[2023-10-08 18:05:53,587][21194] Updated weights for policy 1, policy_version 58160 (0.0010) +[2023-10-08 18:05:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 119537664. Throughput: 0: 1737.6, 1: 1734.6. Samples: 29897818. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:05:53,803][19739] Avg episode reward: [(0, '761.610'), (1, '1078.720')] +[2023-10-08 18:05:53,854][21195] Updated weights for policy 0, policy_version 58600 (0.0011) +[2023-10-08 18:05:53,951][21194] Updated weights for policy 1, policy_version 58170 (0.0007) +[2023-10-08 18:05:54,226][21195] Updated weights for policy 0, policy_version 58610 (0.0007) +[2023-10-08 18:05:54,582][21195] Updated weights for policy 0, policy_version 58620 (0.0008) +[2023-10-08 18:05:57,874][21194] Updated weights for policy 1, policy_version 58180 (0.0009) +[2023-10-08 18:05:58,244][21194] Updated weights for policy 1, policy_version 58190 (0.0010) +[2023-10-08 18:05:58,577][21195] Updated weights for policy 0, policy_version 58630 (0.0008) +[2023-10-08 18:05:58,609][21194] Updated weights for policy 1, policy_version 58200 (0.0007) +[2023-10-08 18:05:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 119603200. Throughput: 0: 1756.4, 1: 1721.5. Samples: 29918830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:05:58,803][19739] Avg episode reward: [(0, '761.610'), (1, '1078.720')] +[2023-10-08 18:05:58,957][21195] Updated weights for policy 0, policy_version 58640 (0.0007) +[2023-10-08 18:05:59,318][21195] Updated weights for policy 0, policy_version 58650 (0.0007) +[2023-10-08 18:06:02,613][21194] Updated weights for policy 1, policy_version 58210 (0.0008) +[2023-10-08 18:06:02,977][21194] Updated weights for policy 1, policy_version 58220 (0.0007) +[2023-10-08 18:06:03,094][21195] Updated weights for policy 0, policy_version 58660 (0.0008) +[2023-10-08 18:06:03,335][21194] Updated weights for policy 1, policy_version 58230 (0.0008) +[2023-10-08 18:06:03,469][21195] Updated weights for policy 0, policy_version 58670 (0.0009) +[2023-10-08 18:06:03,700][21194] Updated weights for policy 1, policy_version 58240 (0.0007) +[2023-10-08 18:06:03,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 119701504. Throughput: 0: 1739.3, 1: 1725.6. Samples: 29933610. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:03,803][19739] Avg episode reward: [(0, '761.050'), (1, '1078.720')] +[2023-10-08 18:06:03,834][21195] Updated weights for policy 0, policy_version 58680 (0.0008) +[2023-10-08 18:06:07,589][21194] Updated weights for policy 1, policy_version 58250 (0.0008) +[2023-10-08 18:06:07,773][21195] Updated weights for policy 0, policy_version 58690 (0.0009) +[2023-10-08 18:06:07,954][21194] Updated weights for policy 1, policy_version 58260 (0.0008) +[2023-10-08 18:06:08,148][21195] Updated weights for policy 0, policy_version 58700 (0.0008) +[2023-10-08 18:06:08,329][21194] Updated weights for policy 1, policy_version 58270 (0.0008) +[2023-10-08 18:06:08,507][21195] Updated weights for policy 0, policy_version 58710 (0.0009) +[2023-10-08 18:06:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 119767040. Throughput: 0: 1760.5, 1: 1729.4. Samples: 29950102. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:08,803][19739] Avg episode reward: [(0, '730.960'), (1, '1078.700')] +[2023-10-08 18:06:08,879][21195] Updated weights for policy 0, policy_version 58720 (0.0008) +[2023-10-08 18:06:12,088][21194] Updated weights for policy 1, policy_version 58280 (0.0007) +[2023-10-08 18:06:12,457][21194] Updated weights for policy 1, policy_version 58290 (0.0007) +[2023-10-08 18:06:12,744][21195] Updated weights for policy 0, policy_version 58730 (0.0007) +[2023-10-08 18:06:12,819][21194] Updated weights for policy 1, policy_version 58300 (0.0008) +[2023-10-08 18:06:13,112][21195] Updated weights for policy 0, policy_version 58740 (0.0009) +[2023-10-08 18:06:13,487][21195] Updated weights for policy 0, policy_version 58750 (0.0008) +[2023-10-08 18:06:13,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 119865344. Throughput: 0: 1748.5, 1: 1705.0. Samples: 29969954. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:13,803][19739] Avg episode reward: [(0, '730.960'), (1, '1063.610')] +[2023-10-08 18:06:16,774][21194] Updated weights for policy 1, policy_version 58310 (0.0007) +[2023-10-08 18:06:17,136][21194] Updated weights for policy 1, policy_version 58320 (0.0008) +[2023-10-08 18:06:17,365][21195] Updated weights for policy 0, policy_version 58760 (0.0009) +[2023-10-08 18:06:17,508][21194] Updated weights for policy 1, policy_version 58330 (0.0010) +[2023-10-08 18:06:17,737][21195] Updated weights for policy 0, policy_version 58770 (0.0007) +[2023-10-08 18:06:18,110][21195] Updated weights for policy 0, policy_version 58780 (0.0009) +[2023-10-08 18:06:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 119930880. Throughput: 0: 1720.3, 1: 1737.9. Samples: 29985806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:18,803][19739] Avg episode reward: [(0, '730.960'), (1, '1063.610')] +[2023-10-08 18:06:21,631][21194] Updated weights for policy 1, policy_version 58340 (0.0008) +[2023-10-08 18:06:21,995][21194] Updated weights for policy 1, policy_version 58350 (0.0010) +[2023-10-08 18:06:22,050][21195] Updated weights for policy 0, policy_version 58790 (0.0008) +[2023-10-08 18:06:22,359][21194] Updated weights for policy 1, policy_version 58360 (0.0008) +[2023-10-08 18:06:22,424][21195] Updated weights for policy 0, policy_version 58800 (0.0007) +[2023-10-08 18:06:22,790][21195] Updated weights for policy 0, policy_version 58810 (0.0009) +[2023-10-08 18:06:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 119996416. Throughput: 0: 1745.2, 1: 1719.1. Samples: 30001676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:23,804][19739] Avg episode reward: [(0, '730.960'), (1, '1063.600')] +[2023-10-08 18:06:26,290][21194] Updated weights for policy 1, policy_version 58370 (0.0007) +[2023-10-08 18:06:26,659][21195] Updated weights for policy 0, policy_version 58820 (0.0008) +[2023-10-08 18:06:26,661][21194] Updated weights for policy 1, policy_version 58380 (0.0007) +[2023-10-08 18:06:27,024][21194] Updated weights for policy 1, policy_version 58390 (0.0007) +[2023-10-08 18:06:27,025][21195] Updated weights for policy 0, policy_version 58830 (0.0010) +[2023-10-08 18:06:27,387][21195] Updated weights for policy 0, policy_version 58840 (0.0007) +[2023-10-08 18:06:27,390][21194] Updated weights for policy 1, policy_version 58400 (0.0008) +[2023-10-08 18:06:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 120061952. Throughput: 0: 1716.6, 1: 1701.8. Samples: 30021026. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:28,803][19739] Avg episode reward: [(0, '730.960'), (1, '1060.620')] +[2023-10-08 18:06:31,168][21195] Updated weights for policy 0, policy_version 58850 (0.0008) +[2023-10-08 18:06:31,435][21194] Updated weights for policy 1, policy_version 58410 (0.0010) +[2023-10-08 18:06:31,542][21195] Updated weights for policy 0, policy_version 58860 (0.0009) +[2023-10-08 18:06:31,798][21194] Updated weights for policy 1, policy_version 58420 (0.0009) +[2023-10-08 18:06:31,923][21195] Updated weights for policy 0, policy_version 58870 (0.0007) +[2023-10-08 18:06:32,166][21194] Updated weights for policy 1, policy_version 58430 (0.0008) +[2023-10-08 18:06:32,288][21195] Updated weights for policy 0, policy_version 58880 (0.0007) +[2023-10-08 18:06:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 120127488. Throughput: 0: 1716.8, 1: 1730.2. Samples: 30037624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:33,803][19739] Avg episode reward: [(0, '730.960'), (1, '1046.060')] +[2023-10-08 18:06:36,078][21194] Updated weights for policy 1, policy_version 58440 (0.0008) +[2023-10-08 18:06:36,276][21195] Updated weights for policy 0, policy_version 58890 (0.0007) +[2023-10-08 18:06:36,445][21194] Updated weights for policy 1, policy_version 58450 (0.0008) +[2023-10-08 18:06:36,643][21195] Updated weights for policy 0, policy_version 58900 (0.0009) +[2023-10-08 18:06:36,808][21194] Updated weights for policy 1, policy_version 58460 (0.0008) +[2023-10-08 18:06:37,019][21195] Updated weights for policy 0, policy_version 58910 (0.0008) +[2023-10-08 18:06:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 120193024. Throughput: 0: 1725.6, 1: 1696.9. Samples: 30051830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:38,803][19739] Avg episode reward: [(0, '730.960'), (1, '1000.580')] +[2023-10-08 18:06:40,811][21194] Updated weights for policy 1, policy_version 58470 (0.0010) +[2023-10-08 18:06:40,961][21195] Updated weights for policy 0, policy_version 58920 (0.0009) +[2023-10-08 18:06:41,189][21194] Updated weights for policy 1, policy_version 58480 (0.0007) +[2023-10-08 18:06:41,318][21195] Updated weights for policy 0, policy_version 58930 (0.0007) +[2023-10-08 18:06:41,554][21194] Updated weights for policy 1, policy_version 58490 (0.0007) +[2023-10-08 18:06:41,684][21195] Updated weights for policy 0, policy_version 58940 (0.0008) +[2023-10-08 18:06:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 120258560. Throughput: 0: 1711.1, 1: 1708.6. Samples: 30072714. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:43,803][19739] Avg episode reward: [(0, '730.960'), (1, '955.890')] +[2023-10-08 18:06:45,623][21194] Updated weights for policy 1, policy_version 58500 (0.0009) +[2023-10-08 18:06:45,908][21195] Updated weights for policy 0, policy_version 58950 (0.0008) +[2023-10-08 18:06:45,992][21194] Updated weights for policy 1, policy_version 58510 (0.0008) +[2023-10-08 18:06:46,281][21195] Updated weights for policy 0, policy_version 58960 (0.0007) +[2023-10-08 18:06:46,361][21194] Updated weights for policy 1, policy_version 58520 (0.0008) +[2023-10-08 18:06:46,652][21195] Updated weights for policy 0, policy_version 58970 (0.0008) +[2023-10-08 18:06:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 120324096. Throughput: 0: 1722.5, 1: 1715.5. Samples: 30088322. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:48,803][19739] Avg episode reward: [(0, '731.090'), (1, '954.050')] +[2023-10-08 18:06:50,279][21194] Updated weights for policy 1, policy_version 58530 (0.0008) +[2023-10-08 18:06:50,603][21195] Updated weights for policy 0, policy_version 58980 (0.0008) +[2023-10-08 18:06:50,652][21194] Updated weights for policy 1, policy_version 58540 (0.0008) +[2023-10-08 18:06:50,965][21195] Updated weights for policy 0, policy_version 58990 (0.0008) +[2023-10-08 18:06:51,011][21194] Updated weights for policy 1, policy_version 58550 (0.0009) +[2023-10-08 18:06:51,333][21195] Updated weights for policy 0, policy_version 59000 (0.0008) +[2023-10-08 18:06:51,375][21194] Updated weights for policy 1, policy_version 58560 (0.0009) +[2023-10-08 18:06:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 120389632. Throughput: 0: 1699.2, 1: 1695.3. Samples: 30102858. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:53,804][19739] Avg episode reward: [(0, '731.360'), (1, '923.740')] +[2023-10-08 18:06:55,338][21195] Updated weights for policy 0, policy_version 59010 (0.0010) +[2023-10-08 18:06:55,416][21194] Updated weights for policy 1, policy_version 58570 (0.0010) +[2023-10-08 18:06:55,712][21195] Updated weights for policy 0, policy_version 59020 (0.0009) +[2023-10-08 18:06:55,777][21194] Updated weights for policy 1, policy_version 58580 (0.0009) +[2023-10-08 18:06:56,073][21195] Updated weights for policy 0, policy_version 59030 (0.0007) +[2023-10-08 18:06:56,147][21194] Updated weights for policy 1, policy_version 58590 (0.0009) +[2023-10-08 18:06:56,441][21195] Updated weights for policy 0, policy_version 59040 (0.0007) +[2023-10-08 18:06:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 120455168. Throughput: 0: 1711.3, 1: 1719.2. Samples: 30124330. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:06:58,803][19739] Avg episode reward: [(0, '731.360'), (1, '923.740')] +[2023-10-08 18:07:00,142][21194] Updated weights for policy 1, policy_version 58600 (0.0008) +[2023-10-08 18:07:00,326][21195] Updated weights for policy 0, policy_version 59050 (0.0008) +[2023-10-08 18:07:00,508][21194] Updated weights for policy 1, policy_version 58610 (0.0008) +[2023-10-08 18:07:00,707][21195] Updated weights for policy 0, policy_version 59060 (0.0008) +[2023-10-08 18:07:00,871][21194] Updated weights for policy 1, policy_version 58620 (0.0007) +[2023-10-08 18:07:01,069][21195] Updated weights for policy 0, policy_version 59070 (0.0008) +[2023-10-08 18:07:03,803][19739] Fps is (10 sec: 13107.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 120520704. Throughput: 0: 1733.8, 1: 1688.4. Samples: 30139804. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:07:03,803][19739] Avg episode reward: [(0, '731.360'), (1, '923.740')] +[2023-10-08 18:07:04,861][21194] Updated weights for policy 1, policy_version 58630 (0.0007) +[2023-10-08 18:07:04,965][21195] Updated weights for policy 0, policy_version 59080 (0.0008) +[2023-10-08 18:07:05,219][21194] Updated weights for policy 1, policy_version 58640 (0.0007) +[2023-10-08 18:07:05,333][21195] Updated weights for policy 0, policy_version 59090 (0.0009) +[2023-10-08 18:07:05,579][21194] Updated weights for policy 1, policy_version 58650 (0.0009) +[2023-10-08 18:07:05,703][21195] Updated weights for policy 0, policy_version 59100 (0.0007) +[2023-10-08 18:07:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 120586240. Throughput: 0: 1709.1, 1: 1703.8. Samples: 30155256. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:08,803][19739] Avg episode reward: [(0, '731.360'), (1, '923.740')] +[2023-10-08 18:07:09,465][21194] Updated weights for policy 1, policy_version 58660 (0.0008) +[2023-10-08 18:07:09,529][21195] Updated weights for policy 0, policy_version 59110 (0.0008) +[2023-10-08 18:07:09,833][21194] Updated weights for policy 1, policy_version 58670 (0.0007) +[2023-10-08 18:07:09,900][21195] Updated weights for policy 0, policy_version 59120 (0.0009) +[2023-10-08 18:07:10,196][21194] Updated weights for policy 1, policy_version 58680 (0.0008) +[2023-10-08 18:07:10,264][21195] Updated weights for policy 0, policy_version 59130 (0.0010) +[2023-10-08 18:07:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 120651776. Throughput: 0: 1741.0, 1: 1721.4. Samples: 30176832. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:13,803][19739] Avg episode reward: [(0, '731.360'), (1, '912.750')] +[2023-10-08 18:07:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000059136_60555264.pth... +[2023-10-08 18:07:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000058688_60096512.pth... +[2023-10-08 18:07:13,842][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000057536_58916864.pth +[2023-10-08 18:07:13,843][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000057088_58458112.pth +[2023-10-08 18:07:14,160][21195] Updated weights for policy 0, policy_version 59140 (0.0010) +[2023-10-08 18:07:14,234][21194] Updated weights for policy 1, policy_version 58690 (0.0007) +[2023-10-08 18:07:14,527][21195] Updated weights for policy 0, policy_version 59150 (0.0008) +[2023-10-08 18:07:14,603][21194] Updated weights for policy 1, policy_version 58700 (0.0008) +[2023-10-08 18:07:14,896][21195] Updated weights for policy 0, policy_version 59160 (0.0007) +[2023-10-08 18:07:14,967][21194] Updated weights for policy 1, policy_version 58710 (0.0007) +[2023-10-08 18:07:15,334][21194] Updated weights for policy 1, policy_version 58720 (0.0009) +[2023-10-08 18:07:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 120717312. Throughput: 0: 1734.9, 1: 1693.5. Samples: 30191902. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:18,803][19739] Avg episode reward: [(0, '731.360'), (1, '912.750')] +[2023-10-08 18:07:18,931][21195] Updated weights for policy 0, policy_version 59170 (0.0007) +[2023-10-08 18:07:19,297][21195] Updated weights for policy 0, policy_version 59180 (0.0007) +[2023-10-08 18:07:19,458][21194] Updated weights for policy 1, policy_version 58730 (0.0007) +[2023-10-08 18:07:19,664][21195] Updated weights for policy 0, policy_version 59190 (0.0009) +[2023-10-08 18:07:19,823][21194] Updated weights for policy 1, policy_version 58740 (0.0007) +[2023-10-08 18:07:20,030][21195] Updated weights for policy 0, policy_version 59200 (0.0009) +[2023-10-08 18:07:20,190][21194] Updated weights for policy 1, policy_version 58750 (0.0008) +[2023-10-08 18:07:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 120782848. Throughput: 0: 1728.8, 1: 1723.6. Samples: 30207186. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:23,803][19739] Avg episode reward: [(0, '731.360'), (1, '897.640')] +[2023-10-08 18:07:24,051][21195] Updated weights for policy 0, policy_version 59210 (0.0007) +[2023-10-08 18:07:24,080][21194] Updated weights for policy 1, policy_version 58760 (0.0007) +[2023-10-08 18:07:24,425][21195] Updated weights for policy 0, policy_version 59220 (0.0007) +[2023-10-08 18:07:24,445][21194] Updated weights for policy 1, policy_version 58770 (0.0008) +[2023-10-08 18:07:24,791][21195] Updated weights for policy 0, policy_version 59230 (0.0007) +[2023-10-08 18:07:24,813][21194] Updated weights for policy 1, policy_version 58780 (0.0007) +[2023-10-08 18:07:28,582][21195] Updated weights for policy 0, policy_version 59240 (0.0008) +[2023-10-08 18:07:28,609][21194] Updated weights for policy 1, policy_version 58790 (0.0008) +[2023-10-08 18:07:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 120848384. Throughput: 0: 1740.4, 1: 1728.8. Samples: 30228832. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:28,803][19739] Avg episode reward: [(0, '731.360'), (1, '912.720')] +[2023-10-08 18:07:28,959][21195] Updated weights for policy 0, policy_version 59250 (0.0009) +[2023-10-08 18:07:28,980][21194] Updated weights for policy 1, policy_version 58800 (0.0008) +[2023-10-08 18:07:29,319][21195] Updated weights for policy 0, policy_version 59260 (0.0007) +[2023-10-08 18:07:29,352][21194] Updated weights for policy 1, policy_version 58810 (0.0008) +[2023-10-08 18:07:33,300][21194] Updated weights for policy 1, policy_version 58820 (0.0007) +[2023-10-08 18:07:33,393][21195] Updated weights for policy 0, policy_version 59270 (0.0008) +[2023-10-08 18:07:33,662][21194] Updated weights for policy 1, policy_version 58830 (0.0008) +[2023-10-08 18:07:33,776][21195] Updated weights for policy 0, policy_version 59280 (0.0008) +[2023-10-08 18:07:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 120913920. Throughput: 0: 1729.7, 1: 1715.7. Samples: 30243368. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:33,803][19739] Avg episode reward: [(0, '731.360'), (1, '898.070')] +[2023-10-08 18:07:34,031][21194] Updated weights for policy 1, policy_version 58840 (0.0007) +[2023-10-08 18:07:34,144][21195] Updated weights for policy 0, policy_version 59290 (0.0007) +[2023-10-08 18:07:38,044][21194] Updated weights for policy 1, policy_version 58850 (0.0007) +[2023-10-08 18:07:38,115][21195] Updated weights for policy 0, policy_version 59300 (0.0008) +[2023-10-08 18:07:38,408][21194] Updated weights for policy 1, policy_version 58860 (0.0009) +[2023-10-08 18:07:38,492][21195] Updated weights for policy 0, policy_version 59310 (0.0008) +[2023-10-08 18:07:38,777][21194] Updated weights for policy 1, policy_version 58870 (0.0008) +[2023-10-08 18:07:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 120979456. Throughput: 0: 1741.7, 1: 1737.2. Samples: 30259408. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:38,803][19739] Avg episode reward: [(0, '731.360'), (1, '898.070')] +[2023-10-08 18:07:38,857][21195] Updated weights for policy 0, policy_version 59320 (0.0008) +[2023-10-08 18:07:39,138][21194] Updated weights for policy 1, policy_version 58880 (0.0008) +[2023-10-08 18:07:42,754][21195] Updated weights for policy 0, policy_version 59330 (0.0008) +[2023-10-08 18:07:43,029][21194] Updated weights for policy 1, policy_version 58890 (0.0007) +[2023-10-08 18:07:43,117][21195] Updated weights for policy 0, policy_version 59340 (0.0007) +[2023-10-08 18:07:43,396][21194] Updated weights for policy 1, policy_version 58900 (0.0008) +[2023-10-08 18:07:43,491][21195] Updated weights for policy 0, policy_version 59350 (0.0007) +[2023-10-08 18:07:43,754][21194] Updated weights for policy 1, policy_version 58910 (0.0008) +[2023-10-08 18:07:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 121044992. Throughput: 0: 1736.7, 1: 1734.0. Samples: 30280514. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:07:43,804][19739] Avg episode reward: [(0, '731.960'), (1, '898.070')] +[2023-10-08 18:07:43,865][21195] Updated weights for policy 0, policy_version 59360 (0.0008) +[2023-10-08 18:07:47,725][21194] Updated weights for policy 1, policy_version 58920 (0.0008) +[2023-10-08 18:07:47,896][21195] Updated weights for policy 0, policy_version 59370 (0.0007) +[2023-10-08 18:07:48,094][21194] Updated weights for policy 1, policy_version 58930 (0.0009) +[2023-10-08 18:07:48,266][21195] Updated weights for policy 0, policy_version 59380 (0.0007) +[2023-10-08 18:07:48,454][21194] Updated weights for policy 1, policy_version 58940 (0.0009) +[2023-10-08 18:07:48,638][21195] Updated weights for policy 0, policy_version 59390 (0.0008) +[2023-10-08 18:07:48,803][19739] Fps is (10 sec: 19660.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 121176064. Throughput: 0: 1707.9, 1: 1741.5. Samples: 30295028. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:07:48,803][19739] Avg episode reward: [(0, '731.960'), (1, '898.070')] +[2023-10-08 18:07:52,376][21194] Updated weights for policy 1, policy_version 58950 (0.0008) +[2023-10-08 18:07:52,483][21195] Updated weights for policy 0, policy_version 59400 (0.0008) +[2023-10-08 18:07:52,734][21194] Updated weights for policy 1, policy_version 58960 (0.0008) +[2023-10-08 18:07:52,844][21195] Updated weights for policy 0, policy_version 59410 (0.0009) +[2023-10-08 18:07:53,100][21194] Updated weights for policy 1, policy_version 58970 (0.0008) +[2023-10-08 18:07:53,210][21195] Updated weights for policy 0, policy_version 59420 (0.0007) +[2023-10-08 18:07:53,802][19739] Fps is (10 sec: 19661.5, 60 sec: 14199.6, 300 sec: 13884.7). Total num frames: 121241600. Throughput: 0: 1736.9, 1: 1739.5. Samples: 30311694. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:07:53,803][19739] Avg episode reward: [(0, '731.960'), (1, '898.070')] +[2023-10-08 18:07:57,133][21195] Updated weights for policy 0, policy_version 59430 (0.0007) +[2023-10-08 18:07:57,134][21194] Updated weights for policy 1, policy_version 58980 (0.0007) +[2023-10-08 18:07:57,497][21195] Updated weights for policy 0, policy_version 59440 (0.0008) +[2023-10-08 18:07:57,511][21194] Updated weights for policy 1, policy_version 58990 (0.0007) +[2023-10-08 18:07:57,864][21195] Updated weights for policy 0, policy_version 59450 (0.0008) +[2023-10-08 18:07:57,878][21194] Updated weights for policy 1, policy_version 59000 (0.0007) +[2023-10-08 18:07:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 121307136. Throughput: 0: 1711.9, 1: 1711.1. Samples: 30330868. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:07:58,803][19739] Avg episode reward: [(0, '731.960'), (1, '898.070')] +[2023-10-08 18:08:01,776][21194] Updated weights for policy 1, policy_version 59010 (0.0010) +[2023-10-08 18:08:01,782][21195] Updated weights for policy 0, policy_version 59460 (0.0009) +[2023-10-08 18:08:02,145][21194] Updated weights for policy 1, policy_version 59020 (0.0008) +[2023-10-08 18:08:02,155][21195] Updated weights for policy 0, policy_version 59470 (0.0009) +[2023-10-08 18:08:02,498][21194] Updated weights for policy 1, policy_version 59030 (0.0007) +[2023-10-08 18:08:02,530][21195] Updated weights for policy 0, policy_version 59480 (0.0008) +[2023-10-08 18:08:02,857][21194] Updated weights for policy 1, policy_version 59040 (0.0009) +[2023-10-08 18:08:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 121372672. Throughput: 0: 1713.7, 1: 1735.0. Samples: 30347096. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:08:03,803][19739] Avg episode reward: [(0, '731.960'), (1, '898.070')] +[2023-10-08 18:08:06,351][21195] Updated weights for policy 0, policy_version 59490 (0.0009) +[2023-10-08 18:08:06,718][21195] Updated weights for policy 0, policy_version 59500 (0.0008) +[2023-10-08 18:08:06,909][21194] Updated weights for policy 1, policy_version 59050 (0.0008) +[2023-10-08 18:08:07,082][21195] Updated weights for policy 0, policy_version 59510 (0.0007) +[2023-10-08 18:08:07,277][21194] Updated weights for policy 1, policy_version 59060 (0.0009) +[2023-10-08 18:08:07,453][21195] Updated weights for policy 0, policy_version 59520 (0.0007) +[2023-10-08 18:08:07,644][21194] Updated weights for policy 1, policy_version 59070 (0.0010) +[2023-10-08 18:08:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 121438208. Throughput: 0: 1730.3, 1: 1723.2. Samples: 30362592. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:08:08,803][19739] Avg episode reward: [(0, '747.290'), (1, '898.070')] +[2023-10-08 18:08:11,311][21195] Updated weights for policy 0, policy_version 59530 (0.0007) +[2023-10-08 18:08:11,630][21194] Updated weights for policy 1, policy_version 59080 (0.0008) +[2023-10-08 18:08:11,676][21195] Updated weights for policy 0, policy_version 59540 (0.0008) +[2023-10-08 18:08:12,001][21194] Updated weights for policy 1, policy_version 59090 (0.0009) +[2023-10-08 18:08:12,046][21195] Updated weights for policy 0, policy_version 59550 (0.0008) +[2023-10-08 18:08:12,369][21194] Updated weights for policy 1, policy_version 59100 (0.0008) +[2023-10-08 18:08:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 121503744. Throughput: 0: 1711.5, 1: 1700.0. Samples: 30382346. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:08:13,803][19739] Avg episode reward: [(0, '747.290'), (1, '898.020')] +[2023-10-08 18:08:16,014][21195] Updated weights for policy 0, policy_version 59560 (0.0008) +[2023-10-08 18:08:16,356][21194] Updated weights for policy 1, policy_version 59110 (0.0009) +[2023-10-08 18:08:16,383][21195] Updated weights for policy 0, policy_version 59570 (0.0008) +[2023-10-08 18:08:16,728][21194] Updated weights for policy 1, policy_version 59120 (0.0008) +[2023-10-08 18:08:16,748][21195] Updated weights for policy 0, policy_version 59580 (0.0008) +[2023-10-08 18:08:17,099][21194] Updated weights for policy 1, policy_version 59130 (0.0007) +[2023-10-08 18:08:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 121569280. Throughput: 0: 1727.5, 1: 1730.2. Samples: 30398964. Policy #0 lag: (min: 5.0, avg: 7.4, max: 37.0) +[2023-10-08 18:08:18,803][19739] Avg episode reward: [(0, '766.750'), (1, '898.020')] +[2023-10-08 18:08:20,653][21195] Updated weights for policy 0, policy_version 59590 (0.0008) +[2023-10-08 18:08:21,018][21195] Updated weights for policy 0, policy_version 59600 (0.0007) +[2023-10-08 18:08:21,105][21194] Updated weights for policy 1, policy_version 59140 (0.0009) +[2023-10-08 18:08:21,394][21195] Updated weights for policy 0, policy_version 59610 (0.0009) +[2023-10-08 18:08:21,471][21194] Updated weights for policy 1, policy_version 59150 (0.0009) +[2023-10-08 18:08:21,834][21194] Updated weights for policy 1, policy_version 59160 (0.0010) +[2023-10-08 18:08:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 121634816. Throughput: 0: 1719.7, 1: 1697.5. Samples: 30413180. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:23,803][19739] Avg episode reward: [(0, '766.750'), (1, '896.820')] +[2023-10-08 18:08:25,227][21195] Updated weights for policy 0, policy_version 59620 (0.0009) +[2023-10-08 18:08:25,618][21195] Updated weights for policy 0, policy_version 59630 (0.0010) +[2023-10-08 18:08:25,874][21194] Updated weights for policy 1, policy_version 59170 (0.0010) +[2023-10-08 18:08:25,979][21195] Updated weights for policy 0, policy_version 59640 (0.0010) +[2023-10-08 18:08:26,245][21194] Updated weights for policy 1, policy_version 59180 (0.0007) +[2023-10-08 18:08:26,605][21194] Updated weights for policy 1, policy_version 59190 (0.0007) +[2023-10-08 18:08:26,961][21194] Updated weights for policy 1, policy_version 59200 (0.0007) +[2023-10-08 18:08:28,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 121700352. Throughput: 0: 1724.6, 1: 1698.3. Samples: 30434542. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:28,804][19739] Avg episode reward: [(0, '780.860'), (1, '896.820')] +[2023-10-08 18:08:30,005][21195] Updated weights for policy 0, policy_version 59650 (0.0009) +[2023-10-08 18:08:30,372][21195] Updated weights for policy 0, policy_version 59660 (0.0010) +[2023-10-08 18:08:30,740][21195] Updated weights for policy 0, policy_version 59670 (0.0010) +[2023-10-08 18:08:30,983][21194] Updated weights for policy 1, policy_version 59210 (0.0007) +[2023-10-08 18:08:31,108][21195] Updated weights for policy 0, policy_version 59680 (0.0007) +[2023-10-08 18:08:31,359][21194] Updated weights for policy 1, policy_version 59220 (0.0008) +[2023-10-08 18:08:31,731][21194] Updated weights for policy 1, policy_version 59230 (0.0010) +[2023-10-08 18:08:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 121765888. Throughput: 0: 1746.9, 1: 1709.6. Samples: 30450572. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:33,803][19739] Avg episode reward: [(0, '780.860'), (1, '896.820')] +[2023-10-08 18:08:35,152][21195] Updated weights for policy 0, policy_version 59690 (0.0008) +[2023-10-08 18:08:35,522][21195] Updated weights for policy 0, policy_version 59700 (0.0009) +[2023-10-08 18:08:35,692][21194] Updated weights for policy 1, policy_version 59240 (0.0007) +[2023-10-08 18:08:35,884][21195] Updated weights for policy 0, policy_version 59710 (0.0008) +[2023-10-08 18:08:36,057][21194] Updated weights for policy 1, policy_version 59250 (0.0007) +[2023-10-08 18:08:36,422][21194] Updated weights for policy 1, policy_version 59260 (0.0008) +[2023-10-08 18:08:38,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 121831424. Throughput: 0: 1715.4, 1: 1690.8. Samples: 30464972. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:38,803][19739] Avg episode reward: [(0, '780.860'), (1, '896.820')] +[2023-10-08 18:08:39,756][21195] Updated weights for policy 0, policy_version 59720 (0.0008) +[2023-10-08 18:08:40,123][21195] Updated weights for policy 0, policy_version 59730 (0.0010) +[2023-10-08 18:08:40,493][21194] Updated weights for policy 1, policy_version 59270 (0.0008) +[2023-10-08 18:08:40,495][21195] Updated weights for policy 0, policy_version 59740 (0.0008) +[2023-10-08 18:08:40,858][21194] Updated weights for policy 1, policy_version 59280 (0.0008) +[2023-10-08 18:08:41,219][21194] Updated weights for policy 1, policy_version 59290 (0.0008) +[2023-10-08 18:08:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 121896960. Throughput: 0: 1743.0, 1: 1713.7. Samples: 30486420. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:43,803][19739] Avg episode reward: [(0, '781.560'), (1, '896.820')] +[2023-10-08 18:08:44,276][21195] Updated weights for policy 0, policy_version 59750 (0.0011) +[2023-10-08 18:08:44,651][21195] Updated weights for policy 0, policy_version 59760 (0.0009) +[2023-10-08 18:08:45,022][21195] Updated weights for policy 0, policy_version 59770 (0.0008) +[2023-10-08 18:08:45,114][21194] Updated weights for policy 1, policy_version 59300 (0.0009) +[2023-10-08 18:08:45,472][21194] Updated weights for policy 1, policy_version 59310 (0.0008) +[2023-10-08 18:08:45,835][21194] Updated weights for policy 1, policy_version 59320 (0.0011) +[2023-10-08 18:08:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 121962496. Throughput: 0: 1740.6, 1: 1695.7. Samples: 30501728. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:48,803][19739] Avg episode reward: [(0, '781.750'), (1, '896.820')] +[2023-10-08 18:08:49,069][21195] Updated weights for policy 0, policy_version 59780 (0.0008) +[2023-10-08 18:08:49,442][21195] Updated weights for policy 0, policy_version 59790 (0.0010) +[2023-10-08 18:08:49,805][21195] Updated weights for policy 0, policy_version 59800 (0.0010) +[2023-10-08 18:08:49,868][21194] Updated weights for policy 1, policy_version 59330 (0.0011) +[2023-10-08 18:08:50,245][21194] Updated weights for policy 1, policy_version 59340 (0.0008) +[2023-10-08 18:08:50,606][21194] Updated weights for policy 1, policy_version 59350 (0.0008) +[2023-10-08 18:08:50,972][21194] Updated weights for policy 1, policy_version 59360 (0.0007) +[2023-10-08 18:08:53,712][21195] Updated weights for policy 0, policy_version 59810 (0.0007) +[2023-10-08 18:08:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 122028032. Throughput: 0: 1724.9, 1: 1700.9. Samples: 30516752. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:53,803][19739] Avg episode reward: [(0, '782.640'), (1, '896.820')] +[2023-10-08 18:08:54,084][21195] Updated weights for policy 0, policy_version 59820 (0.0008) +[2023-10-08 18:08:54,452][21195] Updated weights for policy 0, policy_version 59830 (0.0007) +[2023-10-08 18:08:54,786][21194] Updated weights for policy 1, policy_version 59370 (0.0009) +[2023-10-08 18:08:54,813][21195] Updated weights for policy 0, policy_version 59840 (0.0009) +[2023-10-08 18:08:55,150][21194] Updated weights for policy 1, policy_version 59380 (0.0009) +[2023-10-08 18:08:55,515][21194] Updated weights for policy 1, policy_version 59390 (0.0011) +[2023-10-08 18:08:58,617][21195] Updated weights for policy 0, policy_version 59850 (0.0007) +[2023-10-08 18:08:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 122093568. Throughput: 0: 1744.5, 1: 1724.4. Samples: 30538446. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:08:58,803][19739] Avg episode reward: [(0, '798.200'), (1, '896.820')] +[2023-10-08 18:08:58,977][21195] Updated weights for policy 0, policy_version 59860 (0.0010) +[2023-10-08 18:08:59,352][21195] Updated weights for policy 0, policy_version 59870 (0.0008) +[2023-10-08 18:08:59,498][21194] Updated weights for policy 1, policy_version 59400 (0.0010) +[2023-10-08 18:08:59,857][21194] Updated weights for policy 1, policy_version 59410 (0.0009) +[2023-10-08 18:09:00,233][21194] Updated weights for policy 1, policy_version 59420 (0.0008) +[2023-10-08 18:09:03,273][21195] Updated weights for policy 0, policy_version 59880 (0.0007) +[2023-10-08 18:09:03,636][21195] Updated weights for policy 0, policy_version 59890 (0.0008) +[2023-10-08 18:09:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 122159104. Throughput: 0: 1724.9, 1: 1693.7. Samples: 30552800. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:09:03,803][19739] Avg episode reward: [(0, '798.200'), (1, '896.820')] +[2023-10-08 18:09:04,010][21195] Updated weights for policy 0, policy_version 59900 (0.0008) +[2023-10-08 18:09:04,142][21194] Updated weights for policy 1, policy_version 59430 (0.0010) +[2023-10-08 18:09:04,528][21194] Updated weights for policy 1, policy_version 59440 (0.0010) +[2023-10-08 18:09:04,905][21194] Updated weights for policy 1, policy_version 59450 (0.0009) +[2023-10-08 18:09:07,732][21195] Updated weights for policy 0, policy_version 59910 (0.0008) +[2023-10-08 18:09:08,106][21195] Updated weights for policy 0, policy_version 59920 (0.0007) +[2023-10-08 18:09:08,476][21195] Updated weights for policy 0, policy_version 59930 (0.0007) +[2023-10-08 18:09:08,786][21194] Updated weights for policy 1, policy_version 59460 (0.0009) +[2023-10-08 18:09:08,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 122257408. Throughput: 0: 1742.3, 1: 1719.8. Samples: 30568972. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:08,803][19739] Avg episode reward: [(0, '798.200'), (1, '897.690')] +[2023-10-08 18:09:09,146][21194] Updated weights for policy 1, policy_version 59470 (0.0007) +[2023-10-08 18:09:09,509][21194] Updated weights for policy 1, policy_version 59480 (0.0008) +[2023-10-08 18:09:12,467][21195] Updated weights for policy 0, policy_version 59940 (0.0007) +[2023-10-08 18:09:12,865][21195] Updated weights for policy 0, policy_version 59950 (0.0008) +[2023-10-08 18:09:13,236][21195] Updated weights for policy 0, policy_version 59960 (0.0009) +[2023-10-08 18:09:13,571][21194] Updated weights for policy 1, policy_version 59490 (0.0009) +[2023-10-08 18:09:13,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 122322944. Throughput: 0: 1727.0, 1: 1725.5. Samples: 30589906. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:13,804][19739] Avg episode reward: [(0, '813.670'), (1, '897.690')] +[2023-10-08 18:09:13,815][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000059968_61407232.pth... +[2023-10-08 18:09:13,847][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000058336_59736064.pth +[2023-10-08 18:09:13,851][20740] Saving new best policy, reward=813.670! +[2023-10-08 18:09:13,937][21194] Updated weights for policy 1, policy_version 59500 (0.0008) +[2023-10-08 18:09:14,305][21194] Updated weights for policy 1, policy_version 59510 (0.0008) +[2023-10-08 18:09:14,662][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000059520_60948480.pth... +[2023-10-08 18:09:14,663][21194] Updated weights for policy 1, policy_version 59520 (0.0008) +[2023-10-08 18:09:14,701][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000057888_59277312.pth +[2023-10-08 18:09:17,254][21195] Updated weights for policy 0, policy_version 59970 (0.0008) +[2023-10-08 18:09:17,620][21195] Updated weights for policy 0, policy_version 59980 (0.0007) +[2023-10-08 18:09:17,985][21195] Updated weights for policy 0, policy_version 59990 (0.0008) +[2023-10-08 18:09:18,350][21195] Updated weights for policy 0, policy_version 60000 (0.0008) +[2023-10-08 18:09:18,739][21194] Updated weights for policy 1, policy_version 59530 (0.0009) +[2023-10-08 18:09:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 122388480. Throughput: 0: 1711.5, 1: 1706.0. Samples: 30604360. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:18,803][19739] Avg episode reward: [(0, '813.670'), (1, '897.690')] +[2023-10-08 18:09:19,105][21194] Updated weights for policy 1, policy_version 59540 (0.0009) +[2023-10-08 18:09:19,476][21194] Updated weights for policy 1, policy_version 59550 (0.0009) +[2023-10-08 18:09:22,420][21195] Updated weights for policy 0, policy_version 60010 (0.0007) +[2023-10-08 18:09:22,795][21195] Updated weights for policy 0, policy_version 60020 (0.0007) +[2023-10-08 18:09:23,158][21195] Updated weights for policy 0, policy_version 60030 (0.0007) +[2023-10-08 18:09:23,516][21194] Updated weights for policy 1, policy_version 59560 (0.0008) +[2023-10-08 18:09:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 122454016. Throughput: 0: 1739.7, 1: 1723.7. Samples: 30620828. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:23,803][19739] Avg episode reward: [(0, '828.980'), (1, '897.690')] +[2023-10-08 18:09:23,804][20740] Saving new best policy, reward=828.980! +[2023-10-08 18:09:23,880][21194] Updated weights for policy 1, policy_version 59570 (0.0008) +[2023-10-08 18:09:24,252][21194] Updated weights for policy 1, policy_version 59580 (0.0007) +[2023-10-08 18:09:27,255][21195] Updated weights for policy 0, policy_version 60040 (0.0009) +[2023-10-08 18:09:27,625][21195] Updated weights for policy 0, policy_version 60050 (0.0008) +[2023-10-08 18:09:28,001][21195] Updated weights for policy 0, policy_version 60060 (0.0010) +[2023-10-08 18:09:28,268][21194] Updated weights for policy 1, policy_version 59590 (0.0010) +[2023-10-08 18:09:28,631][21194] Updated weights for policy 1, policy_version 59600 (0.0009) +[2023-10-08 18:09:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 122519552. Throughput: 0: 1712.6, 1: 1729.4. Samples: 30641312. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:28,803][19739] Avg episode reward: [(0, '828.980'), (1, '898.440')] +[2023-10-08 18:09:29,006][21194] Updated weights for policy 1, policy_version 59610 (0.0009) +[2023-10-08 18:09:31,902][21195] Updated weights for policy 0, policy_version 60070 (0.0008) +[2023-10-08 18:09:32,266][21195] Updated weights for policy 0, policy_version 60080 (0.0008) +[2023-10-08 18:09:32,630][21195] Updated weights for policy 0, policy_version 60090 (0.0007) +[2023-10-08 18:09:32,852][21194] Updated weights for policy 1, policy_version 59620 (0.0009) +[2023-10-08 18:09:33,215][21194] Updated weights for policy 1, policy_version 59630 (0.0010) +[2023-10-08 18:09:33,585][21194] Updated weights for policy 1, policy_version 59640 (0.0009) +[2023-10-08 18:09:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 122585088. Throughput: 0: 1718.5, 1: 1720.8. Samples: 30656496. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:33,804][19739] Avg episode reward: [(0, '828.730'), (1, '898.780')] +[2023-10-08 18:09:36,290][21195] Updated weights for policy 0, policy_version 60100 (0.0008) +[2023-10-08 18:09:36,651][21195] Updated weights for policy 0, policy_version 60110 (0.0010) +[2023-10-08 18:09:37,021][21195] Updated weights for policy 0, policy_version 60120 (0.0010) +[2023-10-08 18:09:37,524][21194] Updated weights for policy 1, policy_version 59650 (0.0009) +[2023-10-08 18:09:37,892][21194] Updated weights for policy 1, policy_version 59660 (0.0010) +[2023-10-08 18:09:38,260][21194] Updated weights for policy 1, policy_version 59670 (0.0010) +[2023-10-08 18:09:38,626][21194] Updated weights for policy 1, policy_version 59680 (0.0009) +[2023-10-08 18:09:38,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 122683392. Throughput: 0: 1735.2, 1: 1732.8. Samples: 30672812. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:38,804][19739] Avg episode reward: [(0, '828.730'), (1, '898.780')] +[2023-10-08 18:09:40,871][21195] Updated weights for policy 0, policy_version 60130 (0.0009) +[2023-10-08 18:09:41,238][21195] Updated weights for policy 0, policy_version 60140 (0.0008) +[2023-10-08 18:09:41,612][21195] Updated weights for policy 0, policy_version 60150 (0.0009) +[2023-10-08 18:09:41,985][21195] Updated weights for policy 0, policy_version 60160 (0.0009) +[2023-10-08 18:09:42,516][21194] Updated weights for policy 1, policy_version 59690 (0.0011) +[2023-10-08 18:09:42,880][21194] Updated weights for policy 1, policy_version 59700 (0.0010) +[2023-10-08 18:09:43,244][21194] Updated weights for policy 1, policy_version 59710 (0.0007) +[2023-10-08 18:09:43,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 122748928. Throughput: 0: 1723.9, 1: 1707.1. Samples: 30692842. Policy #0 lag: (min: 31.0, avg: 31.8, max: 50.0) +[2023-10-08 18:09:43,803][19739] Avg episode reward: [(0, '828.730'), (1, '898.780')] +[2023-10-08 18:09:45,786][21195] Updated weights for policy 0, policy_version 60170 (0.0007) +[2023-10-08 18:09:46,144][21195] Updated weights for policy 0, policy_version 60180 (0.0010) +[2023-10-08 18:09:46,517][21195] Updated weights for policy 0, policy_version 60190 (0.0008) +[2023-10-08 18:09:47,162][21194] Updated weights for policy 1, policy_version 59720 (0.0009) +[2023-10-08 18:09:47,526][21194] Updated weights for policy 1, policy_version 59730 (0.0009) +[2023-10-08 18:09:47,893][21194] Updated weights for policy 1, policy_version 59740 (0.0008) +[2023-10-08 18:09:48,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 122814464. Throughput: 0: 1749.8, 1: 1727.9. Samples: 30709296. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:09:48,803][19739] Avg episode reward: [(0, '828.730'), (1, '898.780')] +[2023-10-08 18:09:50,472][21195] Updated weights for policy 0, policy_version 60200 (0.0010) +[2023-10-08 18:09:50,842][21195] Updated weights for policy 0, policy_version 60210 (0.0008) +[2023-10-08 18:09:51,209][21195] Updated weights for policy 0, policy_version 60220 (0.0008) +[2023-10-08 18:09:51,870][21194] Updated weights for policy 1, policy_version 59750 (0.0011) +[2023-10-08 18:09:52,258][21194] Updated weights for policy 1, policy_version 59760 (0.0010) +[2023-10-08 18:09:52,620][21194] Updated weights for policy 1, policy_version 59770 (0.0009) +[2023-10-08 18:09:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 122880000. Throughput: 0: 1728.8, 1: 1721.2. Samples: 30724222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:09:53,803][19739] Avg episode reward: [(0, '828.730'), (1, '898.780')] +[2023-10-08 18:09:55,091][21195] Updated weights for policy 0, policy_version 60230 (0.0007) +[2023-10-08 18:09:55,460][21195] Updated weights for policy 0, policy_version 60240 (0.0008) +[2023-10-08 18:09:55,822][21195] Updated weights for policy 0, policy_version 60250 (0.0010) +[2023-10-08 18:09:56,549][21194] Updated weights for policy 1, policy_version 59780 (0.0008) +[2023-10-08 18:09:56,915][21194] Updated weights for policy 1, policy_version 59790 (0.0010) +[2023-10-08 18:09:57,284][21194] Updated weights for policy 1, policy_version 59800 (0.0008) +[2023-10-08 18:09:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 122945536. Throughput: 0: 1742.1, 1: 1699.6. Samples: 30744780. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:09:58,803][19739] Avg episode reward: [(0, '828.730'), (1, '898.780')] +[2023-10-08 18:09:59,717][21195] Updated weights for policy 0, policy_version 60260 (0.0007) +[2023-10-08 18:10:00,087][21195] Updated weights for policy 0, policy_version 60270 (0.0008) +[2023-10-08 18:10:00,455][21195] Updated weights for policy 0, policy_version 60280 (0.0010) +[2023-10-08 18:10:01,297][21194] Updated weights for policy 1, policy_version 59810 (0.0008) +[2023-10-08 18:10:01,661][21194] Updated weights for policy 1, policy_version 59820 (0.0009) +[2023-10-08 18:10:02,029][21194] Updated weights for policy 1, policy_version 59830 (0.0010) +[2023-10-08 18:10:02,398][21194] Updated weights for policy 1, policy_version 59840 (0.0010) +[2023-10-08 18:10:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 123011072. Throughput: 0: 1771.3, 1: 1730.8. Samples: 30761956. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:03,803][19739] Avg episode reward: [(0, '815.170'), (1, '899.140')] +[2023-10-08 18:10:04,257][21195] Updated weights for policy 0, policy_version 60290 (0.0009) +[2023-10-08 18:10:04,623][21195] Updated weights for policy 0, policy_version 60300 (0.0010) +[2023-10-08 18:10:04,992][21195] Updated weights for policy 0, policy_version 60310 (0.0008) +[2023-10-08 18:10:05,354][21195] Updated weights for policy 0, policy_version 60320 (0.0010) +[2023-10-08 18:10:06,334][21194] Updated weights for policy 1, policy_version 59850 (0.0010) +[2023-10-08 18:10:06,694][21194] Updated weights for policy 1, policy_version 59860 (0.0010) +[2023-10-08 18:10:07,066][21194] Updated weights for policy 1, policy_version 59870 (0.0009) +[2023-10-08 18:10:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 123076608. Throughput: 0: 1740.0, 1: 1706.4. Samples: 30775916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:08,803][19739] Avg episode reward: [(0, '830.420'), (1, '899.140')] +[2023-10-08 18:10:09,170][21195] Updated weights for policy 0, policy_version 60330 (0.0008) +[2023-10-08 18:10:09,545][21195] Updated weights for policy 0, policy_version 60340 (0.0008) +[2023-10-08 18:10:09,911][21195] Updated weights for policy 0, policy_version 60350 (0.0007) +[2023-10-08 18:10:09,980][20740] Saving new best policy, reward=830.420! +[2023-10-08 18:10:11,212][21194] Updated weights for policy 1, policy_version 59880 (0.0009) +[2023-10-08 18:10:11,578][21194] Updated weights for policy 1, policy_version 59890 (0.0008) +[2023-10-08 18:10:11,949][21194] Updated weights for policy 1, policy_version 59900 (0.0009) +[2023-10-08 18:10:13,753][21195] Updated weights for policy 0, policy_version 60360 (0.0007) +[2023-10-08 18:10:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 123142144. Throughput: 0: 1769.3, 1: 1696.7. Samples: 30797284. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:13,803][19739] Avg episode reward: [(0, '830.580'), (1, '899.140')] +[2023-10-08 18:10:14,122][21195] Updated weights for policy 0, policy_version 60370 (0.0007) +[2023-10-08 18:10:14,490][21195] Updated weights for policy 0, policy_version 60380 (0.0009) +[2023-10-08 18:10:14,631][20740] Saving new best policy, reward=830.580! +[2023-10-08 18:10:15,951][21194] Updated weights for policy 1, policy_version 59910 (0.0008) +[2023-10-08 18:10:16,314][21194] Updated weights for policy 1, policy_version 59920 (0.0007) +[2023-10-08 18:10:16,679][21194] Updated weights for policy 1, policy_version 59930 (0.0007) +[2023-10-08 18:10:18,335][21195] Updated weights for policy 0, policy_version 60390 (0.0011) +[2023-10-08 18:10:18,702][21195] Updated weights for policy 0, policy_version 60400 (0.0010) +[2023-10-08 18:10:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 123207680. Throughput: 0: 1755.0, 1: 1720.6. Samples: 30812896. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:18,803][19739] Avg episode reward: [(0, '830.580'), (1, '914.210')] +[2023-10-08 18:10:19,068][21195] Updated weights for policy 0, policy_version 60410 (0.0011) +[2023-10-08 18:10:20,514][21194] Updated weights for policy 1, policy_version 59940 (0.0009) +[2023-10-08 18:10:20,881][21194] Updated weights for policy 1, policy_version 59950 (0.0009) +[2023-10-08 18:10:21,256][21194] Updated weights for policy 1, policy_version 59960 (0.0009) +[2023-10-08 18:10:22,953][21195] Updated weights for policy 0, policy_version 60420 (0.0009) +[2023-10-08 18:10:23,315][21195] Updated weights for policy 0, policy_version 60430 (0.0008) +[2023-10-08 18:10:23,694][21195] Updated weights for policy 0, policy_version 60440 (0.0007) +[2023-10-08 18:10:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 123273216. Throughput: 0: 1754.4, 1: 1696.9. Samples: 30828122. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:23,803][19739] Avg episode reward: [(0, '830.580'), (1, '914.170')] +[2023-10-08 18:10:25,154][21194] Updated weights for policy 1, policy_version 59970 (0.0008) +[2023-10-08 18:10:25,529][21194] Updated weights for policy 1, policy_version 59980 (0.0009) +[2023-10-08 18:10:25,893][21194] Updated weights for policy 1, policy_version 59990 (0.0011) +[2023-10-08 18:10:26,257][21194] Updated weights for policy 1, policy_version 60000 (0.0010) +[2023-10-08 18:10:27,774][21195] Updated weights for policy 0, policy_version 60450 (0.0008) +[2023-10-08 18:10:28,144][21195] Updated weights for policy 0, policy_version 60460 (0.0008) +[2023-10-08 18:10:28,511][21195] Updated weights for policy 0, policy_version 60470 (0.0010) +[2023-10-08 18:10:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 123338752. Throughput: 0: 1759.6, 1: 1721.7. Samples: 30849504. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:28,803][19739] Avg episode reward: [(0, '831.410'), (1, '899.010')] +[2023-10-08 18:10:28,871][20740] Saving new best policy, reward=831.410! +[2023-10-08 18:10:28,873][21195] Updated weights for policy 0, policy_version 60480 (0.0008) +[2023-10-08 18:10:30,326][21194] Updated weights for policy 1, policy_version 60010 (0.0008) +[2023-10-08 18:10:30,684][21194] Updated weights for policy 1, policy_version 60020 (0.0008) +[2023-10-08 18:10:31,049][21194] Updated weights for policy 1, policy_version 60030 (0.0008) +[2023-10-08 18:10:32,735][21195] Updated weights for policy 0, policy_version 60490 (0.0009) +[2023-10-08 18:10:33,102][21195] Updated weights for policy 0, policy_version 60500 (0.0008) +[2023-10-08 18:10:33,468][21195] Updated weights for policy 0, policy_version 60510 (0.0009) +[2023-10-08 18:10:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 123437056. Throughput: 0: 1727.5, 1: 1704.6. Samples: 30863738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:33,803][19739] Avg episode reward: [(0, '831.410'), (1, '879.740')] +[2023-10-08 18:10:35,052][21194] Updated weights for policy 1, policy_version 60040 (0.0008) +[2023-10-08 18:10:35,413][21194] Updated weights for policy 1, policy_version 60050 (0.0010) +[2023-10-08 18:10:35,776][21194] Updated weights for policy 1, policy_version 60060 (0.0009) +[2023-10-08 18:10:37,404][21195] Updated weights for policy 0, policy_version 60520 (0.0009) +[2023-10-08 18:10:37,774][21195] Updated weights for policy 0, policy_version 60530 (0.0009) +[2023-10-08 18:10:38,147][21195] Updated weights for policy 0, policy_version 60540 (0.0008) +[2023-10-08 18:10:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 123502592. Throughput: 0: 1763.3, 1: 1709.9. Samples: 30880518. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:38,803][19739] Avg episode reward: [(0, '831.410'), (1, '879.740')] +[2023-10-08 18:10:39,754][21194] Updated weights for policy 1, policy_version 60070 (0.0008) +[2023-10-08 18:10:40,140][21194] Updated weights for policy 1, policy_version 60080 (0.0007) +[2023-10-08 18:10:40,511][21194] Updated weights for policy 1, policy_version 60090 (0.0008) +[2023-10-08 18:10:42,208][21195] Updated weights for policy 0, policy_version 60550 (0.0007) +[2023-10-08 18:10:42,568][21195] Updated weights for policy 0, policy_version 60560 (0.0007) +[2023-10-08 18:10:42,942][21195] Updated weights for policy 0, policy_version 60570 (0.0007) +[2023-10-08 18:10:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 123568128. Throughput: 0: 1736.1, 1: 1727.7. Samples: 30900650. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:43,804][19739] Avg episode reward: [(0, '831.410'), (1, '893.690')] +[2023-10-08 18:10:44,240][21194] Updated weights for policy 1, policy_version 60100 (0.0009) +[2023-10-08 18:10:44,606][21194] Updated weights for policy 1, policy_version 60110 (0.0009) +[2023-10-08 18:10:44,970][21194] Updated weights for policy 1, policy_version 60120 (0.0008) +[2023-10-08 18:10:46,838][21195] Updated weights for policy 0, policy_version 60580 (0.0008) +[2023-10-08 18:10:47,233][21195] Updated weights for policy 0, policy_version 60590 (0.0007) +[2023-10-08 18:10:47,597][21195] Updated weights for policy 0, policy_version 60600 (0.0007) +[2023-10-08 18:10:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 123633664. Throughput: 0: 1715.6, 1: 1694.3. Samples: 30915404. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:48,804][19739] Avg episode reward: [(0, '831.410'), (1, '877.840')] +[2023-10-08 18:10:48,994][21194] Updated weights for policy 1, policy_version 60130 (0.0008) +[2023-10-08 18:10:49,363][21194] Updated weights for policy 1, policy_version 60140 (0.0008) +[2023-10-08 18:10:49,732][21194] Updated weights for policy 1, policy_version 60150 (0.0008) +[2023-10-08 18:10:50,095][21194] Updated weights for policy 1, policy_version 60160 (0.0008) +[2023-10-08 18:10:51,438][21195] Updated weights for policy 0, policy_version 60610 (0.0008) +[2023-10-08 18:10:51,801][21195] Updated weights for policy 0, policy_version 60620 (0.0007) +[2023-10-08 18:10:52,165][21195] Updated weights for policy 0, policy_version 60630 (0.0008) +[2023-10-08 18:10:52,541][21195] Updated weights for policy 0, policy_version 60640 (0.0007) +[2023-10-08 18:10:53,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 123699200. Throughput: 0: 1740.8, 1: 1723.6. Samples: 30931812. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:53,803][19739] Avg episode reward: [(0, '831.410'), (1, '877.840')] +[2023-10-08 18:10:54,091][21194] Updated weights for policy 1, policy_version 60170 (0.0007) +[2023-10-08 18:10:54,454][21194] Updated weights for policy 1, policy_version 60180 (0.0007) +[2023-10-08 18:10:54,815][21194] Updated weights for policy 1, policy_version 60190 (0.0008) +[2023-10-08 18:10:56,443][21195] Updated weights for policy 0, policy_version 60650 (0.0008) +[2023-10-08 18:10:56,801][21195] Updated weights for policy 0, policy_version 60660 (0.0008) +[2023-10-08 18:10:57,164][21195] Updated weights for policy 0, policy_version 60670 (0.0008) +[2023-10-08 18:10:58,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 123764736. Throughput: 0: 1716.2, 1: 1731.8. Samples: 30952444. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:10:58,803][19739] Avg episode reward: [(0, '831.810'), (1, '877.840')] +[2023-10-08 18:10:58,810][20740] Saving new best policy, reward=831.810! +[2023-10-08 18:10:58,983][21194] Updated weights for policy 1, policy_version 60200 (0.0009) +[2023-10-08 18:10:59,352][21194] Updated weights for policy 1, policy_version 60210 (0.0008) +[2023-10-08 18:10:59,723][21194] Updated weights for policy 1, policy_version 60220 (0.0008) +[2023-10-08 18:11:01,121][21195] Updated weights for policy 0, policy_version 60680 (0.0008) +[2023-10-08 18:11:01,498][21195] Updated weights for policy 0, policy_version 60690 (0.0010) +[2023-10-08 18:11:01,858][21195] Updated weights for policy 0, policy_version 60700 (0.0009) +[2023-10-08 18:11:03,558][21194] Updated weights for policy 1, policy_version 60230 (0.0009) +[2023-10-08 18:11:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 123830272. Throughput: 0: 1727.9, 1: 1711.5. Samples: 30967672. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:11:03,804][19739] Avg episode reward: [(0, '842.830'), (1, '878.400')] +[2023-10-08 18:11:03,805][20740] Saving new best policy, reward=842.830! +[2023-10-08 18:11:03,914][21194] Updated weights for policy 1, policy_version 60240 (0.0011) +[2023-10-08 18:11:04,283][21194] Updated weights for policy 1, policy_version 60250 (0.0010) +[2023-10-08 18:11:05,769][21195] Updated weights for policy 0, policy_version 60710 (0.0009) +[2023-10-08 18:11:06,131][21195] Updated weights for policy 0, policy_version 60720 (0.0008) +[2023-10-08 18:11:06,504][21195] Updated weights for policy 0, policy_version 60730 (0.0008) +[2023-10-08 18:11:08,289][21194] Updated weights for policy 1, policy_version 60260 (0.0010) +[2023-10-08 18:11:08,650][21194] Updated weights for policy 1, policy_version 60270 (0.0008) +[2023-10-08 18:11:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 123895808. Throughput: 0: 1712.0, 1: 1730.4. Samples: 30983030. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:11:08,803][19739] Avg episode reward: [(0, '842.830'), (1, '878.400')] +[2023-10-08 18:11:09,015][21194] Updated weights for policy 1, policy_version 60280 (0.0008) +[2023-10-08 18:11:10,431][21195] Updated weights for policy 0, policy_version 60740 (0.0009) +[2023-10-08 18:11:10,799][21195] Updated weights for policy 0, policy_version 60750 (0.0008) +[2023-10-08 18:11:11,168][21195] Updated weights for policy 0, policy_version 60760 (0.0009) +[2023-10-08 18:11:12,883][21194] Updated weights for policy 1, policy_version 60290 (0.0007) +[2023-10-08 18:11:13,248][21194] Updated weights for policy 1, policy_version 60300 (0.0009) +[2023-10-08 18:11:13,610][21194] Updated weights for policy 1, policy_version 60310 (0.0007) +[2023-10-08 18:11:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 123961344. Throughput: 0: 1717.4, 1: 1723.6. Samples: 31004350. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:13,803][19739] Avg episode reward: [(0, '842.830'), (1, '892.830')] +[2023-10-08 18:11:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000060768_62226432.pth... +[2023-10-08 18:11:13,844][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000059136_60555264.pth +[2023-10-08 18:11:13,970][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000060320_61767680.pth... +[2023-10-08 18:11:13,973][21194] Updated weights for policy 1, policy_version 60320 (0.0008) +[2023-10-08 18:11:14,008][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000058688_60096512.pth +[2023-10-08 18:11:15,031][21195] Updated weights for policy 0, policy_version 60770 (0.0007) +[2023-10-08 18:11:15,398][21195] Updated weights for policy 0, policy_version 60780 (0.0007) +[2023-10-08 18:11:15,763][21195] Updated weights for policy 0, policy_version 60790 (0.0012) +[2023-10-08 18:11:16,142][21195] Updated weights for policy 0, policy_version 60800 (0.0011) +[2023-10-08 18:11:17,921][21194] Updated weights for policy 1, policy_version 60330 (0.0010) +[2023-10-08 18:11:18,290][21194] Updated weights for policy 1, policy_version 60340 (0.0011) +[2023-10-08 18:11:18,657][21194] Updated weights for policy 1, policy_version 60350 (0.0010) +[2023-10-08 18:11:18,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 124059648. Throughput: 0: 1748.1, 1: 1729.9. Samples: 31020248. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:18,804][19739] Avg episode reward: [(0, '842.830'), (1, '847.390')] +[2023-10-08 18:11:20,145][21195] Updated weights for policy 0, policy_version 60810 (0.0008) +[2023-10-08 18:11:20,508][21195] Updated weights for policy 0, policy_version 60820 (0.0007) +[2023-10-08 18:11:20,874][21195] Updated weights for policy 0, policy_version 60830 (0.0008) +[2023-10-08 18:11:22,493][21194] Updated weights for policy 1, policy_version 60360 (0.0009) +[2023-10-08 18:11:22,851][21194] Updated weights for policy 1, policy_version 60370 (0.0007) +[2023-10-08 18:11:23,221][21194] Updated weights for policy 1, policy_version 60380 (0.0007) +[2023-10-08 18:11:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 124125184. Throughput: 0: 1711.3, 1: 1740.2. Samples: 31035838. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:23,803][19739] Avg episode reward: [(0, '842.830'), (1, '848.470')] +[2023-10-08 18:11:24,841][21195] Updated weights for policy 0, policy_version 60840 (0.0010) +[2023-10-08 18:11:25,206][21195] Updated weights for policy 0, policy_version 60850 (0.0009) +[2023-10-08 18:11:25,563][21195] Updated weights for policy 0, policy_version 60860 (0.0008) +[2023-10-08 18:11:27,065][21194] Updated weights for policy 1, policy_version 60390 (0.0010) +[2023-10-08 18:11:27,448][21194] Updated weights for policy 1, policy_version 60400 (0.0008) +[2023-10-08 18:11:27,816][21194] Updated weights for policy 1, policy_version 60410 (0.0008) +[2023-10-08 18:11:28,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 124190720. Throughput: 0: 1742.4, 1: 1716.2. Samples: 31056284. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:28,803][19739] Avg episode reward: [(0, '842.830'), (1, '848.290')] +[2023-10-08 18:11:29,474][21195] Updated weights for policy 0, policy_version 60870 (0.0007) +[2023-10-08 18:11:29,838][21195] Updated weights for policy 0, policy_version 60880 (0.0009) +[2023-10-08 18:11:30,208][21195] Updated weights for policy 0, policy_version 60890 (0.0009) +[2023-10-08 18:11:31,582][21194] Updated weights for policy 1, policy_version 60420 (0.0010) +[2023-10-08 18:11:31,939][21194] Updated weights for policy 1, policy_version 60430 (0.0010) +[2023-10-08 18:11:32,298][21194] Updated weights for policy 1, policy_version 60440 (0.0009) +[2023-10-08 18:11:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 124256256. Throughput: 0: 1753.2, 1: 1750.8. Samples: 31073086. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:33,803][19739] Avg episode reward: [(0, '837.930'), (1, '848.290')] +[2023-10-08 18:11:34,150][21195] Updated weights for policy 0, policy_version 60900 (0.0008) +[2023-10-08 18:11:34,527][21195] Updated weights for policy 0, policy_version 60910 (0.0010) +[2023-10-08 18:11:34,894][21195] Updated weights for policy 0, policy_version 60920 (0.0010) +[2023-10-08 18:11:36,294][21194] Updated weights for policy 1, policy_version 60450 (0.0009) +[2023-10-08 18:11:36,653][21194] Updated weights for policy 1, policy_version 60460 (0.0008) +[2023-10-08 18:11:37,021][21194] Updated weights for policy 1, policy_version 60470 (0.0009) +[2023-10-08 18:11:37,381][21194] Updated weights for policy 1, policy_version 60480 (0.0008) +[2023-10-08 18:11:38,652][21195] Updated weights for policy 0, policy_version 60930 (0.0009) +[2023-10-08 18:11:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 124321792. Throughput: 0: 1732.1, 1: 1734.4. Samples: 31087804. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:38,803][19739] Avg episode reward: [(0, '837.930'), (1, '848.490')] +[2023-10-08 18:11:39,019][21195] Updated weights for policy 0, policy_version 60940 (0.0010) +[2023-10-08 18:11:39,384][21195] Updated weights for policy 0, policy_version 60950 (0.0007) +[2023-10-08 18:11:39,744][21195] Updated weights for policy 0, policy_version 60960 (0.0009) +[2023-10-08 18:11:41,341][21194] Updated weights for policy 1, policy_version 60490 (0.0009) +[2023-10-08 18:11:41,703][21194] Updated weights for policy 1, policy_version 60500 (0.0008) +[2023-10-08 18:11:42,074][21194] Updated weights for policy 1, policy_version 60510 (0.0010) +[2023-10-08 18:11:43,738][21195] Updated weights for policy 0, policy_version 60970 (0.0010) +[2023-10-08 18:11:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 124387328. Throughput: 0: 1750.5, 1: 1724.5. Samples: 31108818. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:43,804][19739] Avg episode reward: [(0, '837.930'), (1, '837.810')] +[2023-10-08 18:11:44,105][21195] Updated weights for policy 0, policy_version 60980 (0.0009) +[2023-10-08 18:11:44,478][21195] Updated weights for policy 0, policy_version 60990 (0.0007) +[2023-10-08 18:11:45,942][21194] Updated weights for policy 1, policy_version 60520 (0.0008) +[2023-10-08 18:11:46,304][21194] Updated weights for policy 1, policy_version 60530 (0.0007) +[2023-10-08 18:11:46,672][21194] Updated weights for policy 1, policy_version 60540 (0.0007) +[2023-10-08 18:11:48,243][21195] Updated weights for policy 0, policy_version 61000 (0.0009) +[2023-10-08 18:11:48,612][21195] Updated weights for policy 0, policy_version 61010 (0.0009) +[2023-10-08 18:11:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 124452864. Throughput: 0: 1735.7, 1: 1746.7. Samples: 31124378. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:48,803][19739] Avg episode reward: [(0, '852.490'), (1, '822.980')] +[2023-10-08 18:11:48,982][21195] Updated weights for policy 0, policy_version 61020 (0.0008) +[2023-10-08 18:11:49,128][20740] Saving new best policy, reward=852.490! +[2023-10-08 18:11:50,571][21194] Updated weights for policy 1, policy_version 60550 (0.0008) +[2023-10-08 18:11:50,944][21194] Updated weights for policy 1, policy_version 60560 (0.0008) +[2023-10-08 18:11:51,306][21194] Updated weights for policy 1, policy_version 60570 (0.0008) +[2023-10-08 18:11:52,928][21195] Updated weights for policy 0, policy_version 61030 (0.0010) +[2023-10-08 18:11:53,306][21195] Updated weights for policy 0, policy_version 61040 (0.0008) +[2023-10-08 18:11:53,675][21195] Updated weights for policy 0, policy_version 61050 (0.0008) +[2023-10-08 18:11:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 124518400. Throughput: 0: 1754.7, 1: 1726.7. Samples: 31139694. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 18:11:53,804][19739] Avg episode reward: [(0, '852.490'), (1, '822.980')] +[2023-10-08 18:11:55,350][21194] Updated weights for policy 1, policy_version 60580 (0.0008) +[2023-10-08 18:11:55,719][21194] Updated weights for policy 1, policy_version 60590 (0.0008) +[2023-10-08 18:11:56,086][21194] Updated weights for policy 1, policy_version 60600 (0.0008) +[2023-10-08 18:11:57,614][21195] Updated weights for policy 0, policy_version 61060 (0.0008) +[2023-10-08 18:11:57,971][21195] Updated weights for policy 0, policy_version 61070 (0.0007) +[2023-10-08 18:11:58,355][21195] Updated weights for policy 0, policy_version 61080 (0.0009) +[2023-10-08 18:11:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 124616704. Throughput: 0: 1749.0, 1: 1724.2. Samples: 31160642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:11:58,804][19739] Avg episode reward: [(0, '852.490'), (1, '822.980')] +[2023-10-08 18:12:00,084][21194] Updated weights for policy 1, policy_version 60610 (0.0008) +[2023-10-08 18:12:00,446][21194] Updated weights for policy 1, policy_version 60620 (0.0008) +[2023-10-08 18:12:00,818][21194] Updated weights for policy 1, policy_version 60630 (0.0009) +[2023-10-08 18:12:01,182][21194] Updated weights for policy 1, policy_version 60640 (0.0010) +[2023-10-08 18:12:02,251][21195] Updated weights for policy 0, policy_version 61090 (0.0007) +[2023-10-08 18:12:02,631][21195] Updated weights for policy 0, policy_version 61100 (0.0008) +[2023-10-08 18:12:02,995][21195] Updated weights for policy 0, policy_version 61110 (0.0008) +[2023-10-08 18:12:03,366][21195] Updated weights for policy 0, policy_version 61120 (0.0009) +[2023-10-08 18:12:03,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 124682240. Throughput: 0: 1721.2, 1: 1721.3. Samples: 31175156. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:03,803][19739] Avg episode reward: [(0, '852.490'), (1, '822.980')] +[2023-10-08 18:12:05,038][21194] Updated weights for policy 1, policy_version 60650 (0.0007) +[2023-10-08 18:12:05,403][21194] Updated weights for policy 1, policy_version 60660 (0.0008) +[2023-10-08 18:12:05,764][21194] Updated weights for policy 1, policy_version 60670 (0.0010) +[2023-10-08 18:12:07,292][21195] Updated weights for policy 0, policy_version 61130 (0.0008) +[2023-10-08 18:12:07,670][21195] Updated weights for policy 0, policy_version 61140 (0.0009) +[2023-10-08 18:12:08,027][21195] Updated weights for policy 0, policy_version 61150 (0.0008) +[2023-10-08 18:12:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 124747776. Throughput: 0: 1752.3, 1: 1713.7. Samples: 31191806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:08,803][19739] Avg episode reward: [(0, '852.490'), (1, '822.980')] +[2023-10-08 18:12:09,899][21194] Updated weights for policy 1, policy_version 60680 (0.0008) +[2023-10-08 18:12:10,274][21194] Updated weights for policy 1, policy_version 60690 (0.0011) +[2023-10-08 18:12:10,637][21194] Updated weights for policy 1, policy_version 60700 (0.0011) +[2023-10-08 18:12:11,984][21195] Updated weights for policy 0, policy_version 61160 (0.0007) +[2023-10-08 18:12:12,357][21195] Updated weights for policy 0, policy_version 61170 (0.0008) +[2023-10-08 18:12:12,722][21195] Updated weights for policy 0, policy_version 61180 (0.0008) +[2023-10-08 18:12:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 124813312. Throughput: 0: 1721.1, 1: 1736.5. Samples: 31211878. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:13,804][19739] Avg episode reward: [(0, '867.980'), (1, '822.980')] +[2023-10-08 18:12:13,817][20740] Saving new best policy, reward=867.980! +[2023-10-08 18:12:14,719][21194] Updated weights for policy 1, policy_version 60710 (0.0009) +[2023-10-08 18:12:15,105][21194] Updated weights for policy 1, policy_version 60720 (0.0007) +[2023-10-08 18:12:15,464][21194] Updated weights for policy 1, policy_version 60730 (0.0009) +[2023-10-08 18:12:16,751][21195] Updated weights for policy 0, policy_version 61190 (0.0008) +[2023-10-08 18:12:17,118][21195] Updated weights for policy 0, policy_version 61200 (0.0011) +[2023-10-08 18:12:17,491][21195] Updated weights for policy 0, policy_version 61210 (0.0009) +[2023-10-08 18:12:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 124878848. Throughput: 0: 1719.0, 1: 1698.1. Samples: 31226856. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:18,803][19739] Avg episode reward: [(0, '867.980'), (1, '837.280')] +[2023-10-08 18:12:19,497][21194] Updated weights for policy 1, policy_version 60740 (0.0010) +[2023-10-08 18:12:19,856][21194] Updated weights for policy 1, policy_version 60750 (0.0007) +[2023-10-08 18:12:20,224][21194] Updated weights for policy 1, policy_version 60760 (0.0009) +[2023-10-08 18:12:21,523][21195] Updated weights for policy 0, policy_version 61220 (0.0009) +[2023-10-08 18:12:21,909][21195] Updated weights for policy 0, policy_version 61230 (0.0009) +[2023-10-08 18:12:22,286][21195] Updated weights for policy 0, policy_version 61240 (0.0011) +[2023-10-08 18:12:23,802][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 124944384. Throughput: 0: 1733.3, 1: 1712.7. Samples: 31242874. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:23,803][19739] Avg episode reward: [(0, '867.980'), (1, '822.520')] +[2023-10-08 18:12:24,179][21194] Updated weights for policy 1, policy_version 60770 (0.0008) +[2023-10-08 18:12:24,534][21194] Updated weights for policy 1, policy_version 60780 (0.0009) +[2023-10-08 18:12:24,902][21194] Updated weights for policy 1, policy_version 60790 (0.0007) +[2023-10-08 18:12:25,268][21194] Updated weights for policy 1, policy_version 60800 (0.0008) +[2023-10-08 18:12:26,157][21195] Updated weights for policy 0, policy_version 61250 (0.0010) +[2023-10-08 18:12:26,529][21195] Updated weights for policy 0, policy_version 61260 (0.0010) +[2023-10-08 18:12:26,913][21195] Updated weights for policy 0, policy_version 61270 (0.0010) +[2023-10-08 18:12:27,286][21195] Updated weights for policy 0, policy_version 61280 (0.0009) +[2023-10-08 18:12:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 125009920. Throughput: 0: 1712.3, 1: 1722.0. Samples: 31263360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:28,803][19739] Avg episode reward: [(0, '883.290'), (1, '822.520')] +[2023-10-08 18:12:28,811][20740] Saving new best policy, reward=883.290! +[2023-10-08 18:12:29,300][21194] Updated weights for policy 1, policy_version 60810 (0.0009) +[2023-10-08 18:12:29,657][21194] Updated weights for policy 1, policy_version 60820 (0.0009) +[2023-10-08 18:12:30,024][21194] Updated weights for policy 1, policy_version 60830 (0.0009) +[2023-10-08 18:12:31,107][21195] Updated weights for policy 0, policy_version 61290 (0.0008) +[2023-10-08 18:12:31,482][21195] Updated weights for policy 0, policy_version 61300 (0.0008) +[2023-10-08 18:12:31,847][21195] Updated weights for policy 0, policy_version 61310 (0.0008) +[2023-10-08 18:12:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 125075456. Throughput: 0: 1732.3, 1: 1696.4. Samples: 31278668. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:12:33,804][19739] Avg episode reward: [(0, '883.290'), (1, '822.520')] +[2023-10-08 18:12:33,959][21194] Updated weights for policy 1, policy_version 60840 (0.0009) +[2023-10-08 18:12:34,339][21194] Updated weights for policy 1, policy_version 60850 (0.0008) +[2023-10-08 18:12:34,712][21194] Updated weights for policy 1, policy_version 60860 (0.0007) +[2023-10-08 18:12:35,711][21195] Updated weights for policy 0, policy_version 61320 (0.0009) +[2023-10-08 18:12:36,071][21195] Updated weights for policy 0, policy_version 61330 (0.0008) +[2023-10-08 18:12:36,436][21195] Updated weights for policy 0, policy_version 61340 (0.0007) +[2023-10-08 18:12:38,651][21194] Updated weights for policy 1, policy_version 60870 (0.0007) +[2023-10-08 18:12:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 125140992. Throughput: 0: 1714.5, 1: 1721.1. Samples: 31294298. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:12:38,803][19739] Avg episode reward: [(0, '887.200'), (1, '822.590')] +[2023-10-08 18:12:38,804][20740] Saving new best policy, reward=887.200! +[2023-10-08 18:12:39,019][21194] Updated weights for policy 1, policy_version 60880 (0.0008) +[2023-10-08 18:12:39,384][21194] Updated weights for policy 1, policy_version 60890 (0.0010) +[2023-10-08 18:12:40,482][21195] Updated weights for policy 0, policy_version 61350 (0.0008) +[2023-10-08 18:12:40,859][21195] Updated weights for policy 0, policy_version 61360 (0.0007) +[2023-10-08 18:12:41,231][21195] Updated weights for policy 0, policy_version 61370 (0.0007) +[2023-10-08 18:12:43,288][21194] Updated weights for policy 1, policy_version 60900 (0.0009) +[2023-10-08 18:12:43,653][21194] Updated weights for policy 1, policy_version 60910 (0.0009) +[2023-10-08 18:12:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 125206528. Throughput: 0: 1715.6, 1: 1726.8. Samples: 31315550. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:12:43,803][19739] Avg episode reward: [(0, '887.200'), (1, '807.730')] +[2023-10-08 18:12:44,019][21194] Updated weights for policy 1, policy_version 60920 (0.0007) +[2023-10-08 18:12:44,977][21195] Updated weights for policy 0, policy_version 61380 (0.0008) +[2023-10-08 18:12:45,363][21195] Updated weights for policy 0, policy_version 61390 (0.0009) +[2023-10-08 18:12:45,723][21195] Updated weights for policy 0, policy_version 61400 (0.0009) +[2023-10-08 18:12:47,822][21194] Updated weights for policy 1, policy_version 60930 (0.0008) +[2023-10-08 18:12:48,189][21194] Updated weights for policy 1, policy_version 60940 (0.0008) +[2023-10-08 18:12:48,550][21194] Updated weights for policy 1, policy_version 60950 (0.0007) +[2023-10-08 18:12:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 125272064. Throughput: 0: 1746.6, 1: 1723.6. Samples: 31331314. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:12:48,803][19739] Avg episode reward: [(0, '887.200'), (1, '807.730')] +[2023-10-08 18:12:48,914][21194] Updated weights for policy 1, policy_version 60960 (0.0007) +[2023-10-08 18:12:49,659][21195] Updated weights for policy 0, policy_version 61410 (0.0010) +[2023-10-08 18:12:50,032][21195] Updated weights for policy 0, policy_version 61420 (0.0008) +[2023-10-08 18:12:50,405][21195] Updated weights for policy 0, policy_version 61430 (0.0009) +[2023-10-08 18:12:50,774][21195] Updated weights for policy 0, policy_version 61440 (0.0008) +[2023-10-08 18:12:52,847][21194] Updated weights for policy 1, policy_version 60970 (0.0008) +[2023-10-08 18:12:53,222][21194] Updated weights for policy 1, policy_version 60980 (0.0007) +[2023-10-08 18:12:53,588][21194] Updated weights for policy 1, policy_version 60990 (0.0009) +[2023-10-08 18:12:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 125370368. Throughput: 0: 1713.8, 1: 1724.9. Samples: 31346550. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:12:53,803][19739] Avg episode reward: [(0, '902.630'), (1, '807.730')] +[2023-10-08 18:12:53,804][20740] Saving new best policy, reward=902.630! +[2023-10-08 18:12:54,771][21195] Updated weights for policy 0, policy_version 61450 (0.0009) +[2023-10-08 18:12:55,150][21195] Updated weights for policy 0, policy_version 61460 (0.0007) +[2023-10-08 18:12:55,511][21195] Updated weights for policy 0, policy_version 61470 (0.0010) +[2023-10-08 18:12:57,463][21194] Updated weights for policy 1, policy_version 61000 (0.0009) +[2023-10-08 18:12:57,824][21194] Updated weights for policy 1, policy_version 61010 (0.0009) +[2023-10-08 18:12:58,184][21194] Updated weights for policy 1, policy_version 61020 (0.0010) +[2023-10-08 18:12:58,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 125435904. Throughput: 0: 1740.1, 1: 1711.2. Samples: 31367186. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:12:58,803][19739] Avg episode reward: [(0, '933.490'), (1, '807.730')] +[2023-10-08 18:12:58,812][20740] Saving new best policy, reward=933.490! +[2023-10-08 18:12:59,568][21195] Updated weights for policy 0, policy_version 61480 (0.0010) +[2023-10-08 18:12:59,928][21195] Updated weights for policy 0, policy_version 61490 (0.0010) +[2023-10-08 18:13:00,297][21195] Updated weights for policy 0, policy_version 61500 (0.0010) +[2023-10-08 18:13:02,158][21194] Updated weights for policy 1, policy_version 61030 (0.0009) +[2023-10-08 18:13:02,534][21194] Updated weights for policy 1, policy_version 61040 (0.0011) +[2023-10-08 18:13:02,900][21194] Updated weights for policy 1, policy_version 61050 (0.0008) +[2023-10-08 18:13:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 125501440. Throughput: 0: 1738.1, 1: 1743.2. Samples: 31383514. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:13:03,804][19739] Avg episode reward: [(0, '933.490'), (1, '807.730')] +[2023-10-08 18:13:04,282][21195] Updated weights for policy 0, policy_version 61510 (0.0009) +[2023-10-08 18:13:04,646][21195] Updated weights for policy 0, policy_version 61520 (0.0008) +[2023-10-08 18:13:05,015][21195] Updated weights for policy 0, policy_version 61530 (0.0008) +[2023-10-08 18:13:06,928][21194] Updated weights for policy 1, policy_version 61060 (0.0009) +[2023-10-08 18:13:07,309][21194] Updated weights for policy 1, policy_version 61070 (0.0010) +[2023-10-08 18:13:07,676][21194] Updated weights for policy 1, policy_version 61080 (0.0008) +[2023-10-08 18:13:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 125566976. Throughput: 0: 1718.8, 1: 1734.4. Samples: 31398266. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:13:08,803][19739] Avg episode reward: [(0, '934.430'), (1, '807.730')] +[2023-10-08 18:13:08,886][21195] Updated weights for policy 0, policy_version 61540 (0.0009) +[2023-10-08 18:13:09,263][21195] Updated weights for policy 0, policy_version 61550 (0.0009) +[2023-10-08 18:13:09,627][21195] Updated weights for policy 0, policy_version 61560 (0.0010) +[2023-10-08 18:13:09,921][20740] Saving new best policy, reward=934.430! +[2023-10-08 18:13:11,842][21194] Updated weights for policy 1, policy_version 61090 (0.0009) +[2023-10-08 18:13:12,198][21194] Updated weights for policy 1, policy_version 61100 (0.0009) +[2023-10-08 18:13:12,566][21194] Updated weights for policy 1, policy_version 61110 (0.0009) +[2023-10-08 18:13:12,922][21194] Updated weights for policy 1, policy_version 61120 (0.0009) +[2023-10-08 18:13:13,555][21195] Updated weights for policy 0, policy_version 61570 (0.0009) +[2023-10-08 18:13:13,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 125632512. Throughput: 0: 1736.0, 1: 1707.4. Samples: 31418310. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:13:13,803][19739] Avg episode reward: [(0, '934.430'), (1, '807.730')] +[2023-10-08 18:13:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000061120_62586880.pth... +[2023-10-08 18:13:13,845][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000059520_60948480.pth +[2023-10-08 18:13:13,937][21195] Updated weights for policy 0, policy_version 61580 (0.0009) +[2023-10-08 18:13:14,301][21195] Updated weights for policy 0, policy_version 61590 (0.0008) +[2023-10-08 18:13:14,666][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000061600_63078400.pth... +[2023-10-08 18:13:14,669][21195] Updated weights for policy 0, policy_version 61600 (0.0008) +[2023-10-08 18:13:14,695][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000059968_61407232.pth +[2023-10-08 18:13:16,912][21194] Updated weights for policy 1, policy_version 61130 (0.0007) +[2023-10-08 18:13:17,273][21194] Updated weights for policy 1, policy_version 61140 (0.0010) +[2023-10-08 18:13:17,647][21194] Updated weights for policy 1, policy_version 61150 (0.0008) +[2023-10-08 18:13:18,536][21195] Updated weights for policy 0, policy_version 61610 (0.0008) +[2023-10-08 18:13:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 125698048. Throughput: 0: 1721.3, 1: 1739.6. Samples: 31434408. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 18:13:18,803][19739] Avg episode reward: [(0, '934.880'), (1, '807.260')] +[2023-10-08 18:13:18,906][21195] Updated weights for policy 0, policy_version 61620 (0.0008) +[2023-10-08 18:13:19,262][21195] Updated weights for policy 0, policy_version 61630 (0.0008) +[2023-10-08 18:13:19,334][20740] Saving new best policy, reward=934.880! +[2023-10-08 18:13:21,755][21194] Updated weights for policy 1, policy_version 61160 (0.0009) +[2023-10-08 18:13:22,133][21194] Updated weights for policy 1, policy_version 61170 (0.0010) +[2023-10-08 18:13:22,503][21194] Updated weights for policy 1, policy_version 61180 (0.0008) +[2023-10-08 18:13:23,252][21195] Updated weights for policy 0, policy_version 61640 (0.0008) +[2023-10-08 18:13:23,627][21195] Updated weights for policy 0, policy_version 61650 (0.0009) +[2023-10-08 18:13:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 125763584. Throughput: 0: 1731.5, 1: 1722.2. Samples: 31449716. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:23,803][19739] Avg episode reward: [(0, '950.090'), (1, '798.490')] +[2023-10-08 18:13:23,994][21195] Updated weights for policy 0, policy_version 61660 (0.0009) +[2023-10-08 18:13:24,134][20740] Saving new best policy, reward=950.090! +[2023-10-08 18:13:26,139][21194] Updated weights for policy 1, policy_version 61190 (0.0008) +[2023-10-08 18:13:26,509][21194] Updated weights for policy 1, policy_version 61200 (0.0007) +[2023-10-08 18:13:26,874][21194] Updated weights for policy 1, policy_version 61210 (0.0007) +[2023-10-08 18:13:27,877][21195] Updated weights for policy 0, policy_version 61670 (0.0008) +[2023-10-08 18:13:28,240][21195] Updated weights for policy 0, policy_version 61680 (0.0010) +[2023-10-08 18:13:28,609][21195] Updated weights for policy 0, policy_version 61690 (0.0008) +[2023-10-08 18:13:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 125829120. Throughput: 0: 1735.8, 1: 1710.8. Samples: 31470648. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:28,803][19739] Avg episode reward: [(0, '965.640'), (1, '798.490')] +[2023-10-08 18:13:28,823][20740] Saving new best policy, reward=965.640! +[2023-10-08 18:13:30,907][21194] Updated weights for policy 1, policy_version 61220 (0.0007) +[2023-10-08 18:13:31,271][21194] Updated weights for policy 1, policy_version 61230 (0.0008) +[2023-10-08 18:13:31,633][21194] Updated weights for policy 1, policy_version 61240 (0.0008) +[2023-10-08 18:13:32,607][21195] Updated weights for policy 0, policy_version 61700 (0.0008) +[2023-10-08 18:13:32,971][21195] Updated weights for policy 0, policy_version 61710 (0.0008) +[2023-10-08 18:13:33,341][21195] Updated weights for policy 0, policy_version 61720 (0.0008) +[2023-10-08 18:13:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 125927424. Throughput: 0: 1704.5, 1: 1732.9. Samples: 31485996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:33,804][19739] Avg episode reward: [(0, '965.640'), (1, '797.640')] +[2023-10-08 18:13:35,527][21194] Updated weights for policy 1, policy_version 61250 (0.0008) +[2023-10-08 18:13:35,890][21194] Updated weights for policy 1, policy_version 61260 (0.0007) +[2023-10-08 18:13:36,253][21194] Updated weights for policy 1, policy_version 61270 (0.0008) +[2023-10-08 18:13:36,617][21194] Updated weights for policy 1, policy_version 61280 (0.0007) +[2023-10-08 18:13:37,247][21195] Updated weights for policy 0, policy_version 61730 (0.0007) +[2023-10-08 18:13:37,612][21195] Updated weights for policy 0, policy_version 61740 (0.0007) +[2023-10-08 18:13:37,986][21195] Updated weights for policy 0, policy_version 61750 (0.0008) +[2023-10-08 18:13:38,352][21195] Updated weights for policy 0, policy_version 61760 (0.0008) +[2023-10-08 18:13:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 125992960. Throughput: 0: 1738.6, 1: 1709.2. Samples: 31501704. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:38,803][19739] Avg episode reward: [(0, '965.640'), (1, '783.540')] +[2023-10-08 18:13:40,544][21194] Updated weights for policy 1, policy_version 61290 (0.0008) +[2023-10-08 18:13:40,910][21194] Updated weights for policy 1, policy_version 61300 (0.0008) +[2023-10-08 18:13:41,274][21194] Updated weights for policy 1, policy_version 61310 (0.0008) +[2023-10-08 18:13:42,302][21195] Updated weights for policy 0, policy_version 61770 (0.0008) +[2023-10-08 18:13:42,680][21195] Updated weights for policy 0, policy_version 61780 (0.0008) +[2023-10-08 18:13:43,058][21195] Updated weights for policy 0, policy_version 61790 (0.0009) +[2023-10-08 18:13:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 126058496. Throughput: 0: 1716.9, 1: 1730.1. Samples: 31522302. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:43,803][19739] Avg episode reward: [(0, '979.780'), (1, '783.540')] +[2023-10-08 18:13:43,814][20740] Saving new best policy, reward=979.780! +[2023-10-08 18:13:45,153][21194] Updated weights for policy 1, policy_version 61320 (0.0008) +[2023-10-08 18:13:45,522][21194] Updated weights for policy 1, policy_version 61330 (0.0010) +[2023-10-08 18:13:45,887][21194] Updated weights for policy 1, policy_version 61340 (0.0009) +[2023-10-08 18:13:46,963][21195] Updated weights for policy 0, policy_version 61800 (0.0008) +[2023-10-08 18:13:47,327][21195] Updated weights for policy 0, policy_version 61810 (0.0007) +[2023-10-08 18:13:47,691][21195] Updated weights for policy 0, policy_version 61820 (0.0008) +[2023-10-08 18:13:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 126124032. Throughput: 0: 1709.7, 1: 1707.1. Samples: 31537270. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:48,803][19739] Avg episode reward: [(0, '979.780'), (1, '783.540')] +[2023-10-08 18:13:49,840][21194] Updated weights for policy 1, policy_version 61350 (0.0007) +[2023-10-08 18:13:50,211][21194] Updated weights for policy 1, policy_version 61360 (0.0008) +[2023-10-08 18:13:50,566][21194] Updated weights for policy 1, policy_version 61370 (0.0008) +[2023-10-08 18:13:51,526][21195] Updated weights for policy 0, policy_version 61830 (0.0012) +[2023-10-08 18:13:51,898][21195] Updated weights for policy 0, policy_version 61840 (0.0010) +[2023-10-08 18:13:52,262][21195] Updated weights for policy 0, policy_version 61850 (0.0007) +[2023-10-08 18:13:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 126189568. Throughput: 0: 1730.4, 1: 1714.6. Samples: 31553292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:53,803][19739] Avg episode reward: [(0, '979.780'), (1, '783.540')] +[2023-10-08 18:13:54,517][21194] Updated weights for policy 1, policy_version 61380 (0.0010) +[2023-10-08 18:13:54,876][21194] Updated weights for policy 1, policy_version 61390 (0.0011) +[2023-10-08 18:13:55,235][21194] Updated weights for policy 1, policy_version 61400 (0.0010) +[2023-10-08 18:13:56,241][21195] Updated weights for policy 0, policy_version 61860 (0.0007) +[2023-10-08 18:13:56,643][21195] Updated weights for policy 0, policy_version 61870 (0.0007) +[2023-10-08 18:13:57,009][21195] Updated weights for policy 0, policy_version 61880 (0.0007) +[2023-10-08 18:13:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 126255104. Throughput: 0: 1714.8, 1: 1741.3. Samples: 31573836. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:13:58,803][19739] Avg episode reward: [(0, '979.780'), (1, '783.540')] +[2023-10-08 18:13:59,267][21194] Updated weights for policy 1, policy_version 61410 (0.0010) +[2023-10-08 18:13:59,634][21194] Updated weights for policy 1, policy_version 61420 (0.0009) +[2023-10-08 18:13:59,998][21194] Updated weights for policy 1, policy_version 61430 (0.0009) +[2023-10-08 18:14:00,360][21194] Updated weights for policy 1, policy_version 61440 (0.0009) +[2023-10-08 18:14:00,949][21195] Updated weights for policy 0, policy_version 61890 (0.0008) +[2023-10-08 18:14:01,327][21195] Updated weights for policy 0, policy_version 61900 (0.0007) +[2023-10-08 18:14:01,699][21195] Updated weights for policy 0, policy_version 61910 (0.0007) +[2023-10-08 18:14:02,074][21195] Updated weights for policy 0, policy_version 61920 (0.0010) +[2023-10-08 18:14:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 126320640. Throughput: 0: 1733.8, 1: 1710.8. Samples: 31589414. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:03,803][19739] Avg episode reward: [(0, '979.780'), (1, '783.540')] +[2023-10-08 18:14:04,291][21194] Updated weights for policy 1, policy_version 61450 (0.0008) +[2023-10-08 18:14:04,656][21194] Updated weights for policy 1, policy_version 61460 (0.0007) +[2023-10-08 18:14:05,029][21194] Updated weights for policy 1, policy_version 61470 (0.0008) +[2023-10-08 18:14:05,786][21195] Updated weights for policy 0, policy_version 61930 (0.0008) +[2023-10-08 18:14:06,149][21195] Updated weights for policy 0, policy_version 61940 (0.0007) +[2023-10-08 18:14:06,524][21195] Updated weights for policy 0, policy_version 61950 (0.0007) +[2023-10-08 18:14:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 126386176. Throughput: 0: 1726.8, 1: 1726.5. Samples: 31605112. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:08,803][19739] Avg episode reward: [(0, '979.780'), (1, '778.910')] +[2023-10-08 18:14:08,857][21194] Updated weights for policy 1, policy_version 61480 (0.0010) +[2023-10-08 18:14:09,220][21194] Updated weights for policy 1, policy_version 61490 (0.0011) +[2023-10-08 18:14:09,582][21194] Updated weights for policy 1, policy_version 61500 (0.0008) +[2023-10-08 18:14:10,514][21195] Updated weights for policy 0, policy_version 61960 (0.0009) +[2023-10-08 18:14:10,877][21195] Updated weights for policy 0, policy_version 61970 (0.0008) +[2023-10-08 18:14:11,244][21195] Updated weights for policy 0, policy_version 61980 (0.0009) +[2023-10-08 18:14:13,444][21194] Updated weights for policy 1, policy_version 61510 (0.0009) +[2023-10-08 18:14:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 126451712. Throughput: 0: 1723.3, 1: 1737.0. Samples: 31626364. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:13,803][19739] Avg episode reward: [(0, '994.810'), (1, '778.910')] +[2023-10-08 18:14:13,809][21194] Updated weights for policy 1, policy_version 61520 (0.0009) +[2023-10-08 18:14:13,809][20740] Saving new best policy, reward=994.810! +[2023-10-08 18:14:14,179][21194] Updated weights for policy 1, policy_version 61530 (0.0008) +[2023-10-08 18:14:15,328][21195] Updated weights for policy 0, policy_version 61990 (0.0009) +[2023-10-08 18:14:15,696][21195] Updated weights for policy 0, policy_version 62000 (0.0009) +[2023-10-08 18:14:16,075][21195] Updated weights for policy 0, policy_version 62010 (0.0008) +[2023-10-08 18:14:18,066][21194] Updated weights for policy 1, policy_version 61540 (0.0009) +[2023-10-08 18:14:18,433][21194] Updated weights for policy 1, policy_version 61550 (0.0007) +[2023-10-08 18:14:18,798][21194] Updated weights for policy 1, policy_version 61560 (0.0009) +[2023-10-08 18:14:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 126517248. Throughput: 0: 1749.9, 1: 1714.3. Samples: 31641884. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:18,803][19739] Avg episode reward: [(0, '994.380'), (1, '794.100')] +[2023-10-08 18:14:19,905][21195] Updated weights for policy 0, policy_version 62020 (0.0008) +[2023-10-08 18:14:20,272][21195] Updated weights for policy 0, policy_version 62030 (0.0009) +[2023-10-08 18:14:20,637][21195] Updated weights for policy 0, policy_version 62040 (0.0009) +[2023-10-08 18:14:22,798][21194] Updated weights for policy 1, policy_version 61570 (0.0010) +[2023-10-08 18:14:23,166][21194] Updated weights for policy 1, policy_version 61580 (0.0009) +[2023-10-08 18:14:23,528][21194] Updated weights for policy 1, policy_version 61590 (0.0011) +[2023-10-08 18:14:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 126582784. Throughput: 0: 1717.0, 1: 1738.4. Samples: 31657198. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:23,803][19739] Avg episode reward: [(0, '964.240'), (1, '790.890')] +[2023-10-08 18:14:23,897][21194] Updated weights for policy 1, policy_version 61600 (0.0011) +[2023-10-08 18:14:24,662][21195] Updated weights for policy 0, policy_version 62050 (0.0008) +[2023-10-08 18:14:25,024][21195] Updated weights for policy 0, policy_version 62060 (0.0007) +[2023-10-08 18:14:25,398][21195] Updated weights for policy 0, policy_version 62070 (0.0008) +[2023-10-08 18:14:25,768][21195] Updated weights for policy 0, policy_version 62080 (0.0007) +[2023-10-08 18:14:27,856][21194] Updated weights for policy 1, policy_version 61610 (0.0007) +[2023-10-08 18:14:28,227][21194] Updated weights for policy 1, policy_version 61620 (0.0009) +[2023-10-08 18:14:28,594][21194] Updated weights for policy 1, policy_version 61630 (0.0007) +[2023-10-08 18:14:28,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 126681088. Throughput: 0: 1739.9, 1: 1721.0. Samples: 31678042. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:28,803][19739] Avg episode reward: [(0, '964.240'), (1, '790.890')] +[2023-10-08 18:14:29,573][21195] Updated weights for policy 0, policy_version 62090 (0.0010) +[2023-10-08 18:14:29,945][21195] Updated weights for policy 0, policy_version 62100 (0.0007) +[2023-10-08 18:14:30,304][21195] Updated weights for policy 0, policy_version 62110 (0.0008) +[2023-10-08 18:14:32,625][21194] Updated weights for policy 1, policy_version 61640 (0.0008) +[2023-10-08 18:14:32,983][21194] Updated weights for policy 1, policy_version 61650 (0.0008) +[2023-10-08 18:14:33,351][21194] Updated weights for policy 1, policy_version 61660 (0.0009) +[2023-10-08 18:14:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 126746624. Throughput: 0: 1748.9, 1: 1730.9. Samples: 31693862. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:33,803][19739] Avg episode reward: [(0, '949.950'), (1, '775.560')] +[2023-10-08 18:14:34,250][21195] Updated weights for policy 0, policy_version 62120 (0.0008) +[2023-10-08 18:14:34,618][21195] Updated weights for policy 0, policy_version 62130 (0.0007) +[2023-10-08 18:14:34,995][21195] Updated weights for policy 0, policy_version 62140 (0.0008) +[2023-10-08 18:14:37,527][21194] Updated weights for policy 1, policy_version 61670 (0.0008) +[2023-10-08 18:14:37,907][21194] Updated weights for policy 1, policy_version 61680 (0.0008) +[2023-10-08 18:14:38,279][21194] Updated weights for policy 1, policy_version 61690 (0.0008) +[2023-10-08 18:14:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 126812160. Throughput: 0: 1731.6, 1: 1732.3. Samples: 31709168. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:38,803][19739] Avg episode reward: [(0, '949.950'), (1, '774.880')] +[2023-10-08 18:14:38,852][21195] Updated weights for policy 0, policy_version 62150 (0.0008) +[2023-10-08 18:14:39,223][21195] Updated weights for policy 0, policy_version 62160 (0.0008) +[2023-10-08 18:14:39,586][21195] Updated weights for policy 0, policy_version 62170 (0.0009) +[2023-10-08 18:14:42,193][21194] Updated weights for policy 1, policy_version 61700 (0.0007) +[2023-10-08 18:14:42,552][21194] Updated weights for policy 1, policy_version 61710 (0.0007) +[2023-10-08 18:14:42,929][21194] Updated weights for policy 1, policy_version 61720 (0.0008) +[2023-10-08 18:14:43,388][21195] Updated weights for policy 0, policy_version 62180 (0.0008) +[2023-10-08 18:14:43,773][21195] Updated weights for policy 0, policy_version 62190 (0.0008) +[2023-10-08 18:14:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 126877696. Throughput: 0: 1756.4, 1: 1708.4. Samples: 31729748. Policy #0 lag: (min: 17.0, avg: 21.7, max: 49.0) +[2023-10-08 18:14:43,803][19739] Avg episode reward: [(0, '941.240'), (1, '774.880')] +[2023-10-08 18:14:44,143][21195] Updated weights for policy 0, policy_version 62200 (0.0011) +[2023-10-08 18:14:46,869][21194] Updated weights for policy 1, policy_version 61730 (0.0008) +[2023-10-08 18:14:47,234][21194] Updated weights for policy 1, policy_version 61740 (0.0009) +[2023-10-08 18:14:47,608][21194] Updated weights for policy 1, policy_version 61750 (0.0008) +[2023-10-08 18:14:47,969][21194] Updated weights for policy 1, policy_version 61760 (0.0009) +[2023-10-08 18:14:48,175][21195] Updated weights for policy 0, policy_version 62210 (0.0010) +[2023-10-08 18:14:48,543][21195] Updated weights for policy 0, policy_version 62220 (0.0007) +[2023-10-08 18:14:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 126943232. Throughput: 0: 1728.3, 1: 1733.9. Samples: 31745210. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:14:48,803][19739] Avg episode reward: [(0, '941.240'), (1, '774.880')] +[2023-10-08 18:14:48,905][21195] Updated weights for policy 0, policy_version 62230 (0.0007) +[2023-10-08 18:14:49,272][21195] Updated weights for policy 0, policy_version 62240 (0.0008) +[2023-10-08 18:14:51,853][21194] Updated weights for policy 1, policy_version 61770 (0.0009) +[2023-10-08 18:14:52,224][21194] Updated weights for policy 1, policy_version 61780 (0.0009) +[2023-10-08 18:14:52,592][21194] Updated weights for policy 1, policy_version 61790 (0.0009) +[2023-10-08 18:14:53,082][21195] Updated weights for policy 0, policy_version 62250 (0.0007) +[2023-10-08 18:14:53,448][21195] Updated weights for policy 0, policy_version 62260 (0.0007) +[2023-10-08 18:14:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 127008768. Throughput: 0: 1742.4, 1: 1719.5. Samples: 31760898. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:14:53,804][19739] Avg episode reward: [(0, '941.240'), (1, '729.180')] +[2023-10-08 18:14:53,806][21195] Updated weights for policy 0, policy_version 62270 (0.0007) +[2023-10-08 18:14:56,451][21194] Updated weights for policy 1, policy_version 61800 (0.0007) +[2023-10-08 18:14:56,824][21194] Updated weights for policy 1, policy_version 61810 (0.0007) +[2023-10-08 18:14:57,193][21194] Updated weights for policy 1, policy_version 61820 (0.0008) +[2023-10-08 18:14:57,722][21195] Updated weights for policy 0, policy_version 62280 (0.0008) +[2023-10-08 18:14:58,088][21195] Updated weights for policy 0, policy_version 62290 (0.0010) +[2023-10-08 18:14:58,459][21195] Updated weights for policy 0, policy_version 62300 (0.0010) +[2023-10-08 18:14:58,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 127107072. Throughput: 0: 1741.2, 1: 1709.2. Samples: 31781634. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:14:58,804][19739] Avg episode reward: [(0, '941.240'), (1, '729.180')] +[2023-10-08 18:15:01,411][21194] Updated weights for policy 1, policy_version 61830 (0.0009) +[2023-10-08 18:15:01,776][21194] Updated weights for policy 1, policy_version 61840 (0.0008) +[2023-10-08 18:15:02,134][21194] Updated weights for policy 1, policy_version 61850 (0.0007) +[2023-10-08 18:15:02,573][21195] Updated weights for policy 0, policy_version 62310 (0.0008) +[2023-10-08 18:15:02,946][21195] Updated weights for policy 0, policy_version 62320 (0.0008) +[2023-10-08 18:15:03,316][21195] Updated weights for policy 0, policy_version 62330 (0.0007) +[2023-10-08 18:15:03,802][19739] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 127172608. Throughput: 0: 1716.5, 1: 1733.1. Samples: 31797116. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:15:03,803][19739] Avg episode reward: [(0, '941.240'), (1, '750.240')] +[2023-10-08 18:15:06,055][21194] Updated weights for policy 1, policy_version 61860 (0.0007) +[2023-10-08 18:15:06,415][21194] Updated weights for policy 1, policy_version 61870 (0.0008) +[2023-10-08 18:15:06,775][21194] Updated weights for policy 1, policy_version 61880 (0.0010) +[2023-10-08 18:15:07,203][21195] Updated weights for policy 0, policy_version 62340 (0.0009) +[2023-10-08 18:15:07,577][21195] Updated weights for policy 0, policy_version 62350 (0.0009) +[2023-10-08 18:15:07,946][21195] Updated weights for policy 0, policy_version 62360 (0.0008) +[2023-10-08 18:15:08,802][19739] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 127238144. Throughput: 0: 1745.9, 1: 1706.0. Samples: 31812532. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:15:08,803][19739] Avg episode reward: [(0, '941.240'), (1, '750.240')] +[2023-10-08 18:15:10,462][21194] Updated weights for policy 1, policy_version 61890 (0.0010) +[2023-10-08 18:15:10,831][21194] Updated weights for policy 1, policy_version 61900 (0.0008) +[2023-10-08 18:15:11,192][21194] Updated weights for policy 1, policy_version 61910 (0.0008) +[2023-10-08 18:15:11,564][21194] Updated weights for policy 1, policy_version 61920 (0.0007) +[2023-10-08 18:15:11,796][21195] Updated weights for policy 0, policy_version 62370 (0.0009) +[2023-10-08 18:15:12,165][21195] Updated weights for policy 0, policy_version 62380 (0.0011) +[2023-10-08 18:15:12,524][21195] Updated weights for policy 0, policy_version 62390 (0.0011) +[2023-10-08 18:15:12,889][21195] Updated weights for policy 0, policy_version 62400 (0.0010) +[2023-10-08 18:15:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 127303680. Throughput: 0: 1717.2, 1: 1720.8. Samples: 31832750. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:15:13,804][19739] Avg episode reward: [(0, '942.140'), (1, '738.270')] +[2023-10-08 18:15:13,817][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000061920_63406080.pth... +[2023-10-08 18:15:13,817][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000062400_63897600.pth... +[2023-10-08 18:15:13,847][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000060320_61767680.pth +[2023-10-08 18:15:13,860][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000060768_62226432.pth +[2023-10-08 18:15:15,325][21194] Updated weights for policy 1, policy_version 61930 (0.0008) +[2023-10-08 18:15:15,691][21194] Updated weights for policy 1, policy_version 61940 (0.0008) +[2023-10-08 18:15:16,053][21194] Updated weights for policy 1, policy_version 61950 (0.0008) +[2023-10-08 18:15:16,886][21195] Updated weights for policy 0, policy_version 62410 (0.0009) +[2023-10-08 18:15:17,258][21195] Updated weights for policy 0, policy_version 62420 (0.0007) +[2023-10-08 18:15:17,627][21195] Updated weights for policy 0, policy_version 62430 (0.0007) +[2023-10-08 18:15:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 127369216. Throughput: 0: 1717.9, 1: 1715.7. Samples: 31848372. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:15:18,803][19739] Avg episode reward: [(0, '942.140'), (1, '727.770')] +[2023-10-08 18:15:19,898][21194] Updated weights for policy 1, policy_version 61960 (0.0009) +[2023-10-08 18:15:20,266][21194] Updated weights for policy 1, policy_version 61970 (0.0007) +[2023-10-08 18:15:20,626][21194] Updated weights for policy 1, policy_version 61980 (0.0008) +[2023-10-08 18:15:21,506][21195] Updated weights for policy 0, policy_version 62440 (0.0007) +[2023-10-08 18:15:21,871][21195] Updated weights for policy 0, policy_version 62450 (0.0009) +[2023-10-08 18:15:22,239][21195] Updated weights for policy 0, policy_version 62460 (0.0009) +[2023-10-08 18:15:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 127434752. Throughput: 0: 1737.6, 1: 1717.4. Samples: 31864644. Policy #0 lag: (min: 21.0, avg: 23.6, max: 53.0) +[2023-10-08 18:15:23,803][19739] Avg episode reward: [(0, '942.140'), (1, '727.770')] +[2023-10-08 18:15:24,749][21194] Updated weights for policy 1, policy_version 61990 (0.0008) +[2023-10-08 18:15:25,130][21194] Updated weights for policy 1, policy_version 62000 (0.0008) +[2023-10-08 18:15:25,497][21194] Updated weights for policy 1, policy_version 62010 (0.0008) +[2023-10-08 18:15:25,869][21195] Updated weights for policy 0, policy_version 62470 (0.0008) +[2023-10-08 18:15:26,245][21195] Updated weights for policy 0, policy_version 62480 (0.0009) +[2023-10-08 18:15:26,613][21195] Updated weights for policy 0, policy_version 62490 (0.0008) +[2023-10-08 18:15:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 127500288. Throughput: 0: 1722.3, 1: 1737.4. Samples: 31885432. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:28,803][19739] Avg episode reward: [(0, '942.140'), (1, '742.280')] +[2023-10-08 18:15:29,465][21194] Updated weights for policy 1, policy_version 62020 (0.0008) +[2023-10-08 18:15:29,842][21194] Updated weights for policy 1, policy_version 62030 (0.0008) +[2023-10-08 18:15:30,203][21194] Updated weights for policy 1, policy_version 62040 (0.0007) +[2023-10-08 18:15:30,697][21195] Updated weights for policy 0, policy_version 62500 (0.0008) +[2023-10-08 18:15:31,091][21195] Updated weights for policy 0, policy_version 62510 (0.0008) +[2023-10-08 18:15:31,457][21195] Updated weights for policy 0, policy_version 62520 (0.0007) +[2023-10-08 18:15:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 127565824. Throughput: 0: 1740.8, 1: 1712.8. Samples: 31900622. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:33,804][19739] Avg episode reward: [(0, '942.140'), (1, '728.570')] +[2023-10-08 18:15:34,169][21194] Updated weights for policy 1, policy_version 62050 (0.0009) +[2023-10-08 18:15:34,540][21194] Updated weights for policy 1, policy_version 62060 (0.0008) +[2023-10-08 18:15:34,895][21194] Updated weights for policy 1, policy_version 62070 (0.0010) +[2023-10-08 18:15:35,263][21194] Updated weights for policy 1, policy_version 62080 (0.0011) +[2023-10-08 18:15:35,519][21195] Updated weights for policy 0, policy_version 62530 (0.0008) +[2023-10-08 18:15:35,881][21195] Updated weights for policy 0, policy_version 62540 (0.0010) +[2023-10-08 18:15:36,250][21195] Updated weights for policy 0, policy_version 62550 (0.0010) +[2023-10-08 18:15:36,623][21195] Updated weights for policy 0, policy_version 62560 (0.0007) +[2023-10-08 18:15:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 127631360. Throughput: 0: 1721.5, 1: 1722.3. Samples: 31915870. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:38,803][19739] Avg episode reward: [(0, '942.140'), (1, '713.760')] +[2023-10-08 18:15:39,480][21194] Updated weights for policy 1, policy_version 62090 (0.0007) +[2023-10-08 18:15:39,842][21194] Updated weights for policy 1, policy_version 62100 (0.0007) +[2023-10-08 18:15:40,207][21194] Updated weights for policy 1, policy_version 62110 (0.0008) +[2023-10-08 18:15:40,538][21195] Updated weights for policy 0, policy_version 62570 (0.0009) +[2023-10-08 18:15:40,901][21195] Updated weights for policy 0, policy_version 62580 (0.0008) +[2023-10-08 18:15:41,269][21195] Updated weights for policy 0, policy_version 62590 (0.0010) +[2023-10-08 18:15:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 127696896. Throughput: 0: 1726.6, 1: 1730.9. Samples: 31937222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:43,803][19739] Avg episode reward: [(0, '942.140'), (1, '668.740')] +[2023-10-08 18:15:44,249][21194] Updated weights for policy 1, policy_version 62120 (0.0008) +[2023-10-08 18:15:44,621][21194] Updated weights for policy 1, policy_version 62130 (0.0008) +[2023-10-08 18:15:44,984][21194] Updated weights for policy 1, policy_version 62140 (0.0009) +[2023-10-08 18:15:45,066][21195] Updated weights for policy 0, policy_version 62600 (0.0009) +[2023-10-08 18:15:45,439][21195] Updated weights for policy 0, policy_version 62610 (0.0008) +[2023-10-08 18:15:45,810][21195] Updated weights for policy 0, policy_version 62620 (0.0009) +[2023-10-08 18:15:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 127762432. Throughput: 0: 1751.6, 1: 1705.7. Samples: 31952698. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:48,803][19739] Avg episode reward: [(0, '942.140'), (1, '683.570')] +[2023-10-08 18:15:48,912][21194] Updated weights for policy 1, policy_version 62150 (0.0008) +[2023-10-08 18:15:49,276][21194] Updated weights for policy 1, policy_version 62160 (0.0008) +[2023-10-08 18:15:49,644][21194] Updated weights for policy 1, policy_version 62170 (0.0008) +[2023-10-08 18:15:49,829][21195] Updated weights for policy 0, policy_version 62630 (0.0008) +[2023-10-08 18:15:50,207][21195] Updated weights for policy 0, policy_version 62640 (0.0009) +[2023-10-08 18:15:50,577][21195] Updated weights for policy 0, policy_version 62650 (0.0010) +[2023-10-08 18:15:53,401][21194] Updated weights for policy 1, policy_version 62180 (0.0008) +[2023-10-08 18:15:53,771][21194] Updated weights for policy 1, policy_version 62190 (0.0008) +[2023-10-08 18:15:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 127827968. Throughput: 0: 1723.3, 1: 1735.8. Samples: 31968192. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:53,803][19739] Avg episode reward: [(0, '942.140'), (1, '668.560')] +[2023-10-08 18:15:54,140][21194] Updated weights for policy 1, policy_version 62200 (0.0011) +[2023-10-08 18:15:54,587][21195] Updated weights for policy 0, policy_version 62660 (0.0009) +[2023-10-08 18:15:54,956][21195] Updated weights for policy 0, policy_version 62670 (0.0007) +[2023-10-08 18:15:55,322][21195] Updated weights for policy 0, policy_version 62680 (0.0008) +[2023-10-08 18:15:57,752][21194] Updated weights for policy 1, policy_version 62210 (0.0009) +[2023-10-08 18:15:58,124][21194] Updated weights for policy 1, policy_version 62220 (0.0008) +[2023-10-08 18:15:58,504][21194] Updated weights for policy 1, policy_version 62230 (0.0009) +[2023-10-08 18:15:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 127893504. Throughput: 0: 1750.0, 1: 1733.9. Samples: 31989524. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:15:58,803][19739] Avg episode reward: [(0, '943.120'), (1, '626.610')] +[2023-10-08 18:15:58,867][21194] Updated weights for policy 1, policy_version 62240 (0.0009) +[2023-10-08 18:15:59,095][21195] Updated weights for policy 0, policy_version 62690 (0.0009) +[2023-10-08 18:15:59,464][21195] Updated weights for policy 0, policy_version 62700 (0.0009) +[2023-10-08 18:15:59,825][21195] Updated weights for policy 0, policy_version 62710 (0.0008) +[2023-10-08 18:16:00,203][21195] Updated weights for policy 0, policy_version 62720 (0.0007) +[2023-10-08 18:16:02,903][21194] Updated weights for policy 1, policy_version 62250 (0.0008) +[2023-10-08 18:16:03,273][21194] Updated weights for policy 1, policy_version 62260 (0.0007) +[2023-10-08 18:16:03,648][21194] Updated weights for policy 1, policy_version 62270 (0.0007) +[2023-10-08 18:16:03,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 127991808. Throughput: 0: 1753.0, 1: 1735.1. Samples: 32005336. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:16:03,804][19739] Avg episode reward: [(0, '943.120'), (1, '626.610')] +[2023-10-08 18:16:04,075][21195] Updated weights for policy 0, policy_version 62730 (0.0009) +[2023-10-08 18:16:04,444][21195] Updated weights for policy 0, policy_version 62740 (0.0007) +[2023-10-08 18:16:04,798][21195] Updated weights for policy 0, policy_version 62750 (0.0010) +[2023-10-08 18:16:07,583][21194] Updated weights for policy 1, policy_version 62280 (0.0008) +[2023-10-08 18:16:07,951][21194] Updated weights for policy 1, policy_version 62290 (0.0007) +[2023-10-08 18:16:08,311][21194] Updated weights for policy 1, policy_version 62300 (0.0009) +[2023-10-08 18:16:08,770][21195] Updated weights for policy 0, policy_version 62760 (0.0011) +[2023-10-08 18:16:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 128057344. Throughput: 0: 1732.2, 1: 1734.8. Samples: 32020662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:16:08,803][19739] Avg episode reward: [(0, '955.720'), (1, '626.610')] +[2023-10-08 18:16:09,137][21195] Updated weights for policy 0, policy_version 62770 (0.0010) +[2023-10-08 18:16:09,509][21195] Updated weights for policy 0, policy_version 62780 (0.0007) +[2023-10-08 18:16:12,331][21194] Updated weights for policy 1, policy_version 62310 (0.0008) +[2023-10-08 18:16:12,709][21194] Updated weights for policy 1, policy_version 62320 (0.0009) +[2023-10-08 18:16:13,080][21194] Updated weights for policy 1, policy_version 62330 (0.0008) +[2023-10-08 18:16:13,437][21195] Updated weights for policy 0, policy_version 62790 (0.0008) +[2023-10-08 18:16:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 128122880. Throughput: 0: 1742.1, 1: 1716.5. Samples: 32041072. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:13,804][19739] Avg episode reward: [(0, '955.720'), (1, '626.610')] +[2023-10-08 18:16:13,805][21195] Updated weights for policy 0, policy_version 62800 (0.0007) +[2023-10-08 18:16:14,167][21195] Updated weights for policy 0, policy_version 62810 (0.0008) +[2023-10-08 18:16:17,126][21194] Updated weights for policy 1, policy_version 62340 (0.0008) +[2023-10-08 18:16:17,496][21194] Updated weights for policy 1, policy_version 62350 (0.0009) +[2023-10-08 18:16:17,864][21194] Updated weights for policy 1, policy_version 62360 (0.0008) +[2023-10-08 18:16:18,101][21195] Updated weights for policy 0, policy_version 62820 (0.0008) +[2023-10-08 18:16:18,495][21195] Updated weights for policy 0, policy_version 62830 (0.0010) +[2023-10-08 18:16:18,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 128188416. Throughput: 0: 1726.5, 1: 1738.3. Samples: 32056538. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:18,804][19739] Avg episode reward: [(0, '956.640'), (1, '626.610')] +[2023-10-08 18:16:18,860][21195] Updated weights for policy 0, policy_version 62840 (0.0007) +[2023-10-08 18:16:21,730][21194] Updated weights for policy 1, policy_version 62370 (0.0008) +[2023-10-08 18:16:22,097][21194] Updated weights for policy 1, policy_version 62380 (0.0009) +[2023-10-08 18:16:22,455][21194] Updated weights for policy 1, policy_version 62390 (0.0008) +[2023-10-08 18:16:22,744][21195] Updated weights for policy 0, policy_version 62850 (0.0008) +[2023-10-08 18:16:22,828][21194] Updated weights for policy 1, policy_version 62400 (0.0007) +[2023-10-08 18:16:23,119][21195] Updated weights for policy 0, policy_version 62860 (0.0009) +[2023-10-08 18:16:23,481][21195] Updated weights for policy 0, policy_version 62870 (0.0009) +[2023-10-08 18:16:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 128253952. Throughput: 0: 1742.7, 1: 1736.0. Samples: 32072408. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:23,804][19739] Avg episode reward: [(0, '956.780'), (1, '626.610')] +[2023-10-08 18:16:23,857][21195] Updated weights for policy 0, policy_version 62880 (0.0010) +[2023-10-08 18:16:26,744][21194] Updated weights for policy 1, policy_version 62410 (0.0008) +[2023-10-08 18:16:27,113][21194] Updated weights for policy 1, policy_version 62420 (0.0008) +[2023-10-08 18:16:27,475][21194] Updated weights for policy 1, policy_version 62430 (0.0008) +[2023-10-08 18:16:27,730][21195] Updated weights for policy 0, policy_version 62890 (0.0007) +[2023-10-08 18:16:28,103][21195] Updated weights for policy 0, policy_version 62900 (0.0009) +[2023-10-08 18:16:28,465][21195] Updated weights for policy 0, policy_version 62910 (0.0010) +[2023-10-08 18:16:28,803][19739] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 128352256. Throughput: 0: 1734.4, 1: 1718.0. Samples: 32092580. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:28,803][19739] Avg episode reward: [(0, '956.780'), (1, '626.610')] +[2023-10-08 18:16:31,396][21194] Updated weights for policy 1, policy_version 62440 (0.0007) +[2023-10-08 18:16:31,763][21194] Updated weights for policy 1, policy_version 62450 (0.0008) +[2023-10-08 18:16:32,128][21194] Updated weights for policy 1, policy_version 62460 (0.0010) +[2023-10-08 18:16:32,425][21195] Updated weights for policy 0, policy_version 62920 (0.0008) +[2023-10-08 18:16:32,794][21195] Updated weights for policy 0, policy_version 62930 (0.0009) +[2023-10-08 18:16:33,174][21195] Updated weights for policy 0, policy_version 62940 (0.0007) +[2023-10-08 18:16:33,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 128417792. Throughput: 0: 1714.6, 1: 1748.5. Samples: 32108540. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:33,803][19739] Avg episode reward: [(0, '956.780'), (1, '641.540')] +[2023-10-08 18:16:36,078][21194] Updated weights for policy 1, policy_version 62470 (0.0008) +[2023-10-08 18:16:36,435][21194] Updated weights for policy 1, policy_version 62480 (0.0010) +[2023-10-08 18:16:36,813][21194] Updated weights for policy 1, policy_version 62490 (0.0007) +[2023-10-08 18:16:37,200][21195] Updated weights for policy 0, policy_version 62950 (0.0007) +[2023-10-08 18:16:37,573][21195] Updated weights for policy 0, policy_version 62960 (0.0008) +[2023-10-08 18:16:37,940][21195] Updated weights for policy 0, policy_version 62970 (0.0011) +[2023-10-08 18:16:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 128483328. Throughput: 0: 1740.3, 1: 1717.2. Samples: 32123778. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:38,803][19739] Avg episode reward: [(0, '959.580'), (1, '641.540')] +[2023-10-08 18:16:40,546][21194] Updated weights for policy 1, policy_version 62500 (0.0008) +[2023-10-08 18:16:40,912][21194] Updated weights for policy 1, policy_version 62510 (0.0009) +[2023-10-08 18:16:41,276][21194] Updated weights for policy 1, policy_version 62520 (0.0008) +[2023-10-08 18:16:41,906][21195] Updated weights for policy 0, policy_version 62980 (0.0010) +[2023-10-08 18:16:42,272][21195] Updated weights for policy 0, policy_version 62990 (0.0010) +[2023-10-08 18:16:42,639][21195] Updated weights for policy 0, policy_version 63000 (0.0008) +[2023-10-08 18:16:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 128548864. Throughput: 0: 1714.6, 1: 1723.6. Samples: 32144244. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:43,803][19739] Avg episode reward: [(0, '959.580'), (1, '641.540')] +[2023-10-08 18:16:45,195][21194] Updated weights for policy 1, policy_version 62530 (0.0008) +[2023-10-08 18:16:45,559][21194] Updated weights for policy 1, policy_version 62540 (0.0010) +[2023-10-08 18:16:45,928][21194] Updated weights for policy 1, policy_version 62550 (0.0009) +[2023-10-08 18:16:46,299][21194] Updated weights for policy 1, policy_version 62560 (0.0007) +[2023-10-08 18:16:46,431][21195] Updated weights for policy 0, policy_version 63010 (0.0009) +[2023-10-08 18:16:46,809][21195] Updated weights for policy 0, policy_version 63020 (0.0007) +[2023-10-08 18:16:47,178][21195] Updated weights for policy 0, policy_version 63030 (0.0010) +[2023-10-08 18:16:47,544][21195] Updated weights for policy 0, policy_version 63040 (0.0010) +[2023-10-08 18:16:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 128614400. Throughput: 0: 1707.2, 1: 1721.9. Samples: 32159644. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 18:16:48,803][19739] Avg episode reward: [(0, '974.900'), (1, '641.540')] +[2023-10-08 18:16:50,279][21194] Updated weights for policy 1, policy_version 62570 (0.0010) +[2023-10-08 18:16:50,639][21194] Updated weights for policy 1, policy_version 62580 (0.0011) +[2023-10-08 18:16:51,006][21194] Updated weights for policy 1, policy_version 62590 (0.0010) +[2023-10-08 18:16:51,421][21195] Updated weights for policy 0, policy_version 63050 (0.0011) +[2023-10-08 18:16:51,791][21195] Updated weights for policy 0, policy_version 63060 (0.0011) +[2023-10-08 18:16:52,162][21195] Updated weights for policy 0, policy_version 63070 (0.0010) +[2023-10-08 18:16:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 128679936. Throughput: 0: 1722.0, 1: 1712.6. Samples: 32175216. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:16:53,804][19739] Avg episode reward: [(0, '974.900'), (1, '641.920')] +[2023-10-08 18:16:55,003][21194] Updated weights for policy 1, policy_version 62600 (0.0010) +[2023-10-08 18:16:55,374][21194] Updated weights for policy 1, policy_version 62610 (0.0010) +[2023-10-08 18:16:55,738][21194] Updated weights for policy 1, policy_version 62620 (0.0007) +[2023-10-08 18:16:56,190][21195] Updated weights for policy 0, policy_version 63080 (0.0010) +[2023-10-08 18:16:56,551][21195] Updated weights for policy 0, policy_version 63090 (0.0010) +[2023-10-08 18:16:56,921][21195] Updated weights for policy 0, policy_version 63100 (0.0009) +[2023-10-08 18:16:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 128745472. Throughput: 0: 1710.0, 1: 1738.3. Samples: 32196242. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:16:58,803][19739] Avg episode reward: [(0, '974.900'), (1, '641.920')] +[2023-10-08 18:16:59,732][21194] Updated weights for policy 1, policy_version 62630 (0.0009) +[2023-10-08 18:17:00,097][21194] Updated weights for policy 1, policy_version 62640 (0.0010) +[2023-10-08 18:17:00,466][21194] Updated weights for policy 1, policy_version 62650 (0.0008) +[2023-10-08 18:17:00,858][21195] Updated weights for policy 0, policy_version 63110 (0.0009) +[2023-10-08 18:17:01,236][21195] Updated weights for policy 0, policy_version 63120 (0.0008) +[2023-10-08 18:17:01,606][21195] Updated weights for policy 0, policy_version 63130 (0.0008) +[2023-10-08 18:17:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 128811008. Throughput: 0: 1729.4, 1: 1716.0. Samples: 32211578. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:03,804][19739] Avg episode reward: [(0, '960.520'), (1, '641.920')] +[2023-10-08 18:17:04,379][21194] Updated weights for policy 1, policy_version 62660 (0.0009) +[2023-10-08 18:17:04,755][21194] Updated weights for policy 1, policy_version 62670 (0.0008) +[2023-10-08 18:17:05,118][21194] Updated weights for policy 1, policy_version 62680 (0.0008) +[2023-10-08 18:17:05,523][21195] Updated weights for policy 0, policy_version 63140 (0.0008) +[2023-10-08 18:17:05,888][21195] Updated weights for policy 0, policy_version 63150 (0.0008) +[2023-10-08 18:17:06,252][21195] Updated weights for policy 0, policy_version 63160 (0.0009) +[2023-10-08 18:17:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 128876544. Throughput: 0: 1715.0, 1: 1722.1. Samples: 32227078. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:08,804][19739] Avg episode reward: [(0, '961.670'), (1, '641.920')] +[2023-10-08 18:17:09,033][21194] Updated weights for policy 1, policy_version 62690 (0.0010) +[2023-10-08 18:17:09,406][21194] Updated weights for policy 1, policy_version 62700 (0.0011) +[2023-10-08 18:17:09,767][21194] Updated weights for policy 1, policy_version 62710 (0.0009) +[2023-10-08 18:17:10,115][21195] Updated weights for policy 0, policy_version 63170 (0.0007) +[2023-10-08 18:17:10,130][21194] Updated weights for policy 1, policy_version 62720 (0.0009) +[2023-10-08 18:17:10,471][21195] Updated weights for policy 0, policy_version 63180 (0.0008) +[2023-10-08 18:17:10,834][21195] Updated weights for policy 0, policy_version 63190 (0.0009) +[2023-10-08 18:17:11,202][21195] Updated weights for policy 0, policy_version 63200 (0.0009) +[2023-10-08 18:17:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 128942080. Throughput: 0: 1720.6, 1: 1742.4. Samples: 32248414. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:13,803][19739] Avg episode reward: [(0, '970.870'), (1, '641.920')] +[2023-10-08 18:17:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000063200_64716800.pth... +[2023-10-08 18:17:13,842][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000061600_63078400.pth +[2023-10-08 18:17:14,086][21194] Updated weights for policy 1, policy_version 62730 (0.0008) +[2023-10-08 18:17:14,447][21194] Updated weights for policy 1, policy_version 62740 (0.0007) +[2023-10-08 18:17:14,822][21194] Updated weights for policy 1, policy_version 62750 (0.0008) +[2023-10-08 18:17:14,890][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000062752_64258048.pth... +[2023-10-08 18:17:14,919][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000061120_62586880.pth +[2023-10-08 18:17:15,252][21195] Updated weights for policy 0, policy_version 63210 (0.0010) +[2023-10-08 18:17:15,621][21195] Updated weights for policy 0, policy_version 63220 (0.0010) +[2023-10-08 18:17:15,989][21195] Updated weights for policy 0, policy_version 63230 (0.0008) +[2023-10-08 18:17:18,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 129007616. Throughput: 0: 1744.8, 1: 1710.1. Samples: 32264012. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:18,803][19739] Avg episode reward: [(0, '984.720'), (1, '641.920')] +[2023-10-08 18:17:19,087][21194] Updated weights for policy 1, policy_version 62760 (0.0010) +[2023-10-08 18:17:19,453][21194] Updated weights for policy 1, policy_version 62770 (0.0012) +[2023-10-08 18:17:19,818][21194] Updated weights for policy 1, policy_version 62780 (0.0008) +[2023-10-08 18:17:19,832][21195] Updated weights for policy 0, policy_version 63240 (0.0007) +[2023-10-08 18:17:20,194][21195] Updated weights for policy 0, policy_version 63250 (0.0008) +[2023-10-08 18:17:20,568][21195] Updated weights for policy 0, policy_version 63260 (0.0009) +[2023-10-08 18:17:23,643][21194] Updated weights for policy 1, policy_version 62790 (0.0007) +[2023-10-08 18:17:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 129073152. Throughput: 0: 1720.5, 1: 1731.5. Samples: 32279118. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:23,803][19739] Avg episode reward: [(0, '968.870'), (1, '641.920')] +[2023-10-08 18:17:24,007][21194] Updated weights for policy 1, policy_version 62800 (0.0008) +[2023-10-08 18:17:24,369][21194] Updated weights for policy 1, policy_version 62810 (0.0007) +[2023-10-08 18:17:24,476][21195] Updated weights for policy 0, policy_version 63270 (0.0008) +[2023-10-08 18:17:24,840][21195] Updated weights for policy 0, policy_version 63280 (0.0009) +[2023-10-08 18:17:25,206][21195] Updated weights for policy 0, policy_version 63290 (0.0008) +[2023-10-08 18:17:28,296][21194] Updated weights for policy 1, policy_version 62820 (0.0008) +[2023-10-08 18:17:28,652][21194] Updated weights for policy 1, policy_version 62830 (0.0009) +[2023-10-08 18:17:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 129138688. Throughput: 0: 1748.6, 1: 1729.9. Samples: 32300776. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:28,803][19739] Avg episode reward: [(0, '968.870'), (1, '657.170')] +[2023-10-08 18:17:28,981][21195] Updated weights for policy 0, policy_version 63300 (0.0009) +[2023-10-08 18:17:29,019][21194] Updated weights for policy 1, policy_version 62840 (0.0009) +[2023-10-08 18:17:29,357][21195] Updated weights for policy 0, policy_version 63310 (0.0007) +[2023-10-08 18:17:29,713][21195] Updated weights for policy 0, policy_version 63320 (0.0007) +[2023-10-08 18:17:33,055][21194] Updated weights for policy 1, policy_version 62850 (0.0007) +[2023-10-08 18:17:33,422][21194] Updated weights for policy 1, policy_version 62860 (0.0007) +[2023-10-08 18:17:33,561][21195] Updated weights for policy 0, policy_version 63330 (0.0009) +[2023-10-08 18:17:33,796][21194] Updated weights for policy 1, policy_version 62870 (0.0008) +[2023-10-08 18:17:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 129204224. Throughput: 0: 1754.3, 1: 1721.4. Samples: 32316050. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 18:17:33,803][19739] Avg episode reward: [(0, '969.310'), (1, '657.170')] +[2023-10-08 18:17:33,929][21195] Updated weights for policy 0, policy_version 63340 (0.0008) +[2023-10-08 18:17:34,159][21194] Updated weights for policy 1, policy_version 62880 (0.0009) +[2023-10-08 18:17:34,287][21195] Updated weights for policy 0, policy_version 63350 (0.0008) +[2023-10-08 18:17:34,665][21195] Updated weights for policy 0, policy_version 63360 (0.0011) +[2023-10-08 18:17:38,084][21194] Updated weights for policy 1, policy_version 62890 (0.0010) +[2023-10-08 18:17:38,450][21194] Updated weights for policy 1, policy_version 62900 (0.0008) +[2023-10-08 18:17:38,649][21195] Updated weights for policy 0, policy_version 63370 (0.0007) +[2023-10-08 18:17:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 129269760. Throughput: 0: 1746.0, 1: 1731.6. Samples: 32331704. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:17:38,803][19739] Avg episode reward: [(0, '969.960'), (1, '657.170')] +[2023-10-08 18:17:38,819][21194] Updated weights for policy 1, policy_version 62910 (0.0007) +[2023-10-08 18:17:39,010][21195] Updated weights for policy 0, policy_version 63380 (0.0009) +[2023-10-08 18:17:39,378][21195] Updated weights for policy 0, policy_version 63390 (0.0007) +[2023-10-08 18:17:42,713][21194] Updated weights for policy 1, policy_version 62920 (0.0008) +[2023-10-08 18:17:43,081][21194] Updated weights for policy 1, policy_version 62930 (0.0009) +[2023-10-08 18:17:43,333][21195] Updated weights for policy 0, policy_version 63400 (0.0007) +[2023-10-08 18:17:43,460][21194] Updated weights for policy 1, policy_version 62940 (0.0010) +[2023-10-08 18:17:43,707][21195] Updated weights for policy 0, policy_version 63410 (0.0007) +[2023-10-08 18:17:43,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 129368064. Throughput: 0: 1756.7, 1: 1714.6. Samples: 32352452. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:17:43,803][19739] Avg episode reward: [(0, '969.960'), (1, '657.170')] +[2023-10-08 18:17:44,079][21195] Updated weights for policy 0, policy_version 63420 (0.0009) +[2023-10-08 18:17:47,618][21194] Updated weights for policy 1, policy_version 62950 (0.0009) +[2023-10-08 18:17:47,922][21195] Updated weights for policy 0, policy_version 63430 (0.0007) +[2023-10-08 18:17:47,983][21194] Updated weights for policy 1, policy_version 62960 (0.0008) +[2023-10-08 18:17:48,286][21195] Updated weights for policy 0, policy_version 63440 (0.0009) +[2023-10-08 18:17:48,350][21194] Updated weights for policy 1, policy_version 62970 (0.0008) +[2023-10-08 18:17:48,666][21195] Updated weights for policy 0, policy_version 63450 (0.0010) +[2023-10-08 18:17:48,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 129433600. Throughput: 0: 1733.2, 1: 1727.1. Samples: 32367292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:17:48,803][19739] Avg episode reward: [(0, '984.430'), (1, '672.470')] +[2023-10-08 18:17:52,321][21194] Updated weights for policy 1, policy_version 62980 (0.0008) +[2023-10-08 18:17:52,662][21195] Updated weights for policy 0, policy_version 63460 (0.0009) +[2023-10-08 18:17:52,684][21194] Updated weights for policy 1, policy_version 62990 (0.0007) +[2023-10-08 18:17:53,049][21194] Updated weights for policy 1, policy_version 63000 (0.0007) +[2023-10-08 18:17:53,058][21195] Updated weights for policy 0, policy_version 63470 (0.0009) +[2023-10-08 18:17:53,421][21195] Updated weights for policy 0, policy_version 63480 (0.0007) +[2023-10-08 18:17:53,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 129531904. Throughput: 0: 1757.0, 1: 1721.0. Samples: 32383588. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:17:53,803][19739] Avg episode reward: [(0, '984.430'), (1, '672.470')] +[2023-10-08 18:17:56,956][21194] Updated weights for policy 1, policy_version 63010 (0.0007) +[2023-10-08 18:17:57,301][21195] Updated weights for policy 0, policy_version 63490 (0.0007) +[2023-10-08 18:17:57,323][21194] Updated weights for policy 1, policy_version 63020 (0.0008) +[2023-10-08 18:17:57,664][21195] Updated weights for policy 0, policy_version 63500 (0.0007) +[2023-10-08 18:17:57,689][21194] Updated weights for policy 1, policy_version 63030 (0.0008) +[2023-10-08 18:17:58,041][21195] Updated weights for policy 0, policy_version 63510 (0.0008) +[2023-10-08 18:17:58,057][21194] Updated weights for policy 1, policy_version 63040 (0.0008) +[2023-10-08 18:17:58,406][21195] Updated weights for policy 0, policy_version 63520 (0.0009) +[2023-10-08 18:17:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 129597440. Throughput: 0: 1742.8, 1: 1692.8. Samples: 32403018. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:17:58,803][19739] Avg episode reward: [(0, '984.430'), (1, '672.470')] +[2023-10-08 18:18:02,093][21194] Updated weights for policy 1, policy_version 63050 (0.0010) +[2023-10-08 18:18:02,319][21195] Updated weights for policy 0, policy_version 63530 (0.0009) +[2023-10-08 18:18:02,457][21194] Updated weights for policy 1, policy_version 63060 (0.0009) +[2023-10-08 18:18:02,691][21195] Updated weights for policy 0, policy_version 63540 (0.0009) +[2023-10-08 18:18:02,827][21194] Updated weights for policy 1, policy_version 63070 (0.0008) +[2023-10-08 18:18:03,051][21195] Updated weights for policy 0, policy_version 63550 (0.0009) +[2023-10-08 18:18:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 129662976. Throughput: 0: 1719.2, 1: 1724.7. Samples: 32418988. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:18:03,803][19739] Avg episode reward: [(0, '984.430'), (1, '672.470')] +[2023-10-08 18:18:06,710][21194] Updated weights for policy 1, policy_version 63080 (0.0008) +[2023-10-08 18:18:06,991][21195] Updated weights for policy 0, policy_version 63560 (0.0010) +[2023-10-08 18:18:07,071][21194] Updated weights for policy 1, policy_version 63090 (0.0008) +[2023-10-08 18:18:07,358][21195] Updated weights for policy 0, policy_version 63570 (0.0010) +[2023-10-08 18:18:07,441][21194] Updated weights for policy 1, policy_version 63100 (0.0008) +[2023-10-08 18:18:07,722][21195] Updated weights for policy 0, policy_version 63580 (0.0008) +[2023-10-08 18:18:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 129728512. Throughput: 0: 1747.0, 1: 1720.4. Samples: 32435150. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:18:08,803][19739] Avg episode reward: [(0, '984.430'), (1, '672.470')] +[2023-10-08 18:18:11,370][21194] Updated weights for policy 1, policy_version 63110 (0.0009) +[2023-10-08 18:18:11,660][21195] Updated weights for policy 0, policy_version 63590 (0.0008) +[2023-10-08 18:18:11,739][21194] Updated weights for policy 1, policy_version 63120 (0.0008) +[2023-10-08 18:18:12,025][21195] Updated weights for policy 0, policy_version 63600 (0.0009) +[2023-10-08 18:18:12,101][21194] Updated weights for policy 1, policy_version 63130 (0.0008) +[2023-10-08 18:18:12,397][21195] Updated weights for policy 0, policy_version 63610 (0.0008) +[2023-10-08 18:18:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 129794048. Throughput: 0: 1717.5, 1: 1697.4. Samples: 32454446. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:18:13,803][19739] Avg episode reward: [(0, '984.430'), (1, '672.470')] +[2023-10-08 18:18:15,994][21194] Updated weights for policy 1, policy_version 63140 (0.0009) +[2023-10-08 18:18:16,311][21195] Updated weights for policy 0, policy_version 63620 (0.0009) +[2023-10-08 18:18:16,357][21194] Updated weights for policy 1, policy_version 63150 (0.0009) +[2023-10-08 18:18:16,694][21195] Updated weights for policy 0, policy_version 63630 (0.0008) +[2023-10-08 18:18:16,719][21194] Updated weights for policy 1, policy_version 63160 (0.0009) +[2023-10-08 18:18:17,061][21195] Updated weights for policy 0, policy_version 63640 (0.0008) +[2023-10-08 18:18:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 129859584. Throughput: 0: 1717.2, 1: 1723.6. Samples: 32470886. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:18,803][19739] Avg episode reward: [(0, '985.280'), (1, '672.470')] +[2023-10-08 18:18:20,570][21194] Updated weights for policy 1, policy_version 63170 (0.0009) +[2023-10-08 18:18:20,938][21194] Updated weights for policy 1, policy_version 63180 (0.0010) +[2023-10-08 18:18:21,026][21195] Updated weights for policy 0, policy_version 63650 (0.0008) +[2023-10-08 18:18:21,306][21194] Updated weights for policy 1, policy_version 63190 (0.0008) +[2023-10-08 18:18:21,405][21195] Updated weights for policy 0, policy_version 63660 (0.0007) +[2023-10-08 18:18:21,661][21194] Updated weights for policy 1, policy_version 63200 (0.0008) +[2023-10-08 18:18:21,763][21195] Updated weights for policy 0, policy_version 63670 (0.0010) +[2023-10-08 18:18:22,134][21195] Updated weights for policy 0, policy_version 63680 (0.0010) +[2023-10-08 18:18:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 129925120. Throughput: 0: 1720.6, 1: 1704.2. Samples: 32485822. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:23,803][19739] Avg episode reward: [(0, '985.280'), (1, '672.470')] +[2023-10-08 18:18:25,626][21194] Updated weights for policy 1, policy_version 63210 (0.0008) +[2023-10-08 18:18:26,001][21194] Updated weights for policy 1, policy_version 63220 (0.0008) +[2023-10-08 18:18:26,179][21195] Updated weights for policy 0, policy_version 63690 (0.0008) +[2023-10-08 18:18:26,365][21194] Updated weights for policy 1, policy_version 63230 (0.0007) +[2023-10-08 18:18:26,537][21195] Updated weights for policy 0, policy_version 63700 (0.0007) +[2023-10-08 18:18:26,910][21195] Updated weights for policy 0, policy_version 63710 (0.0007) +[2023-10-08 18:18:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 129990656. Throughput: 0: 1711.4, 1: 1721.7. Samples: 32506942. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:28,803][19739] Avg episode reward: [(0, '1000.340'), (1, '687.750')] +[2023-10-08 18:18:28,810][20740] Saving new best policy, reward=1000.340! +[2023-10-08 18:18:30,236][21194] Updated weights for policy 1, policy_version 63240 (0.0008) +[2023-10-08 18:18:30,602][21194] Updated weights for policy 1, policy_version 63250 (0.0008) +[2023-10-08 18:18:30,940][21195] Updated weights for policy 0, policy_version 63720 (0.0009) +[2023-10-08 18:18:30,969][21194] Updated weights for policy 1, policy_version 63260 (0.0009) +[2023-10-08 18:18:31,309][21195] Updated weights for policy 0, policy_version 63730 (0.0010) +[2023-10-08 18:18:31,680][21195] Updated weights for policy 0, policy_version 63740 (0.0010) +[2023-10-08 18:18:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 130056192. Throughput: 0: 1734.8, 1: 1713.5. Samples: 32522462. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:33,803][19739] Avg episode reward: [(0, '1000.340'), (1, '687.750')] +[2023-10-08 18:18:34,940][21194] Updated weights for policy 1, policy_version 63270 (0.0009) +[2023-10-08 18:18:35,321][21194] Updated weights for policy 1, policy_version 63280 (0.0008) +[2023-10-08 18:18:35,551][21195] Updated weights for policy 0, policy_version 63750 (0.0008) +[2023-10-08 18:18:35,694][21194] Updated weights for policy 1, policy_version 63290 (0.0008) +[2023-10-08 18:18:35,923][21195] Updated weights for policy 0, policy_version 63760 (0.0007) +[2023-10-08 18:18:36,295][21195] Updated weights for policy 0, policy_version 63770 (0.0008) +[2023-10-08 18:18:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 130121728. Throughput: 0: 1709.4, 1: 1714.8. Samples: 32537676. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:38,804][19739] Avg episode reward: [(0, '1000.340'), (1, '687.750')] +[2023-10-08 18:18:39,643][21194] Updated weights for policy 1, policy_version 63300 (0.0008) +[2023-10-08 18:18:40,012][21194] Updated weights for policy 1, policy_version 63310 (0.0008) +[2023-10-08 18:18:40,372][21194] Updated weights for policy 1, policy_version 63320 (0.0008) +[2023-10-08 18:18:40,384][21195] Updated weights for policy 0, policy_version 63780 (0.0010) +[2023-10-08 18:18:40,773][21195] Updated weights for policy 0, policy_version 63790 (0.0009) +[2023-10-08 18:18:41,141][21195] Updated weights for policy 0, policy_version 63800 (0.0010) +[2023-10-08 18:18:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 130187264. Throughput: 0: 1720.2, 1: 1738.5. Samples: 32558660. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:43,803][19739] Avg episode reward: [(0, '987.350'), (1, '687.750')] +[2023-10-08 18:18:44,390][21194] Updated weights for policy 1, policy_version 63330 (0.0007) +[2023-10-08 18:18:44,763][21194] Updated weights for policy 1, policy_version 63340 (0.0009) +[2023-10-08 18:18:44,889][21195] Updated weights for policy 0, policy_version 63810 (0.0007) +[2023-10-08 18:18:45,140][21194] Updated weights for policy 1, policy_version 63350 (0.0007) +[2023-10-08 18:18:45,259][21195] Updated weights for policy 0, policy_version 63820 (0.0008) +[2023-10-08 18:18:45,504][21194] Updated weights for policy 1, policy_version 63360 (0.0009) +[2023-10-08 18:18:45,631][21195] Updated weights for policy 0, policy_version 63830 (0.0008) +[2023-10-08 18:18:45,991][21195] Updated weights for policy 0, policy_version 63840 (0.0007) +[2023-10-08 18:18:48,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 130252800. Throughput: 0: 1742.2, 1: 1708.6. Samples: 32574274. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:48,803][19739] Avg episode reward: [(0, '987.350'), (1, '702.930')] +[2023-10-08 18:18:49,420][21194] Updated weights for policy 1, policy_version 63370 (0.0008) +[2023-10-08 18:18:49,786][21194] Updated weights for policy 1, policy_version 63380 (0.0009) +[2023-10-08 18:18:49,837][21195] Updated weights for policy 0, policy_version 63850 (0.0007) +[2023-10-08 18:18:50,155][21194] Updated weights for policy 1, policy_version 63390 (0.0007) +[2023-10-08 18:18:50,202][21195] Updated weights for policy 0, policy_version 63860 (0.0008) +[2023-10-08 18:18:50,572][21195] Updated weights for policy 0, policy_version 63870 (0.0009) +[2023-10-08 18:18:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 130318336. Throughput: 0: 1711.9, 1: 1717.3. Samples: 32589464. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:53,804][19739] Avg episode reward: [(0, '987.350'), (1, '687.230')] +[2023-10-08 18:18:54,074][21194] Updated weights for policy 1, policy_version 63400 (0.0007) +[2023-10-08 18:18:54,437][21194] Updated weights for policy 1, policy_version 63410 (0.0007) +[2023-10-08 18:18:54,488][21195] Updated weights for policy 0, policy_version 63880 (0.0008) +[2023-10-08 18:18:54,807][21194] Updated weights for policy 1, policy_version 63420 (0.0008) +[2023-10-08 18:18:54,858][21195] Updated weights for policy 0, policy_version 63890 (0.0009) +[2023-10-08 18:18:55,222][21195] Updated weights for policy 0, policy_version 63900 (0.0009) +[2023-10-08 18:18:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 130383872. Throughput: 0: 1743.0, 1: 1740.8. Samples: 32611218. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 18:18:58,803][19739] Avg episode reward: [(0, '987.350'), (1, '699.290')] +[2023-10-08 18:18:58,814][21194] Updated weights for policy 1, policy_version 63430 (0.0007) +[2023-10-08 18:18:58,961][21195] Updated weights for policy 0, policy_version 63910 (0.0009) +[2023-10-08 18:18:59,189][21194] Updated weights for policy 1, policy_version 63440 (0.0008) +[2023-10-08 18:18:59,333][21195] Updated weights for policy 0, policy_version 63920 (0.0008) +[2023-10-08 18:18:59,557][21194] Updated weights for policy 1, policy_version 63450 (0.0008) +[2023-10-08 18:18:59,699][21195] Updated weights for policy 0, policy_version 63930 (0.0008) +[2023-10-08 18:19:03,578][21194] Updated weights for policy 1, policy_version 63460 (0.0008) +[2023-10-08 18:19:03,614][21195] Updated weights for policy 0, policy_version 63940 (0.0010) +[2023-10-08 18:19:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 130449408. Throughput: 0: 1738.5, 1: 1711.7. Samples: 32626144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:03,803][19739] Avg episode reward: [(0, '987.350'), (1, '714.520')] +[2023-10-08 18:19:03,938][21194] Updated weights for policy 1, policy_version 63470 (0.0009) +[2023-10-08 18:19:03,982][21195] Updated weights for policy 0, policy_version 63950 (0.0009) +[2023-10-08 18:19:04,306][21194] Updated weights for policy 1, policy_version 63480 (0.0008) +[2023-10-08 18:19:04,351][21195] Updated weights for policy 0, policy_version 63960 (0.0008) +[2023-10-08 18:19:08,281][21195] Updated weights for policy 0, policy_version 63970 (0.0007) +[2023-10-08 18:19:08,360][21194] Updated weights for policy 1, policy_version 63490 (0.0007) +[2023-10-08 18:19:08,644][21195] Updated weights for policy 0, policy_version 63980 (0.0007) +[2023-10-08 18:19:08,722][21194] Updated weights for policy 1, policy_version 63500 (0.0009) +[2023-10-08 18:19:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 130514944. Throughput: 0: 1735.2, 1: 1729.1. Samples: 32641714. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:08,803][19739] Avg episode reward: [(0, '987.350'), (1, '714.520')] +[2023-10-08 18:19:09,010][21195] Updated weights for policy 0, policy_version 63990 (0.0009) +[2023-10-08 18:19:09,091][21194] Updated weights for policy 1, policy_version 63510 (0.0008) +[2023-10-08 18:19:09,382][21195] Updated weights for policy 0, policy_version 64000 (0.0009) +[2023-10-08 18:19:09,460][21194] Updated weights for policy 1, policy_version 63520 (0.0007) +[2023-10-08 18:19:13,378][21195] Updated weights for policy 0, policy_version 64010 (0.0009) +[2023-10-08 18:19:13,564][21194] Updated weights for policy 1, policy_version 63530 (0.0007) +[2023-10-08 18:19:13,746][21195] Updated weights for policy 0, policy_version 64020 (0.0007) +[2023-10-08 18:19:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 130580480. Throughput: 0: 1747.0, 1: 1721.3. Samples: 32663016. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:13,804][19739] Avg episode reward: [(0, '987.350'), (1, '715.310')] +[2023-10-08 18:19:13,925][21194] Updated weights for policy 1, policy_version 63540 (0.0007) +[2023-10-08 18:19:14,117][21195] Updated weights for policy 0, policy_version 64030 (0.0010) +[2023-10-08 18:19:14,182][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000064032_65568768.pth... +[2023-10-08 18:19:14,212][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000062400_63897600.pth +[2023-10-08 18:19:14,288][21194] Updated weights for policy 1, policy_version 63550 (0.0008) +[2023-10-08 18:19:14,363][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000063552_65077248.pth... +[2023-10-08 18:19:14,391][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000061920_63406080.pth +[2023-10-08 18:19:18,063][21195] Updated weights for policy 0, policy_version 64040 (0.0009) +[2023-10-08 18:19:18,315][21194] Updated weights for policy 1, policy_version 63560 (0.0008) +[2023-10-08 18:19:18,434][21195] Updated weights for policy 0, policy_version 64050 (0.0009) +[2023-10-08 18:19:18,685][21194] Updated weights for policy 1, policy_version 63570 (0.0008) +[2023-10-08 18:19:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 130646016. Throughput: 0: 1722.7, 1: 1716.0. Samples: 32677204. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:18,803][19739] Avg episode reward: [(0, '987.350'), (1, '730.620')] +[2023-10-08 18:19:18,807][21195] Updated weights for policy 0, policy_version 64060 (0.0008) +[2023-10-08 18:19:19,056][21194] Updated weights for policy 1, policy_version 63580 (0.0008) +[2023-10-08 18:19:22,890][21195] Updated weights for policy 0, policy_version 64070 (0.0008) +[2023-10-08 18:19:23,093][21194] Updated weights for policy 1, policy_version 63590 (0.0008) +[2023-10-08 18:19:23,263][21195] Updated weights for policy 0, policy_version 64080 (0.0007) +[2023-10-08 18:19:23,462][21194] Updated weights for policy 1, policy_version 63600 (0.0008) +[2023-10-08 18:19:23,623][21195] Updated weights for policy 0, policy_version 64090 (0.0007) +[2023-10-08 18:19:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 130711552. Throughput: 0: 1746.1, 1: 1713.6. Samples: 32693360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:23,803][19739] Avg episode reward: [(0, '1002.900'), (1, '730.620')] +[2023-10-08 18:19:23,834][21194] Updated weights for policy 1, policy_version 63610 (0.0008) +[2023-10-08 18:19:23,840][20740] Saving new best policy, reward=1002.900! +[2023-10-08 18:19:27,699][21195] Updated weights for policy 0, policy_version 64100 (0.0008) +[2023-10-08 18:19:27,856][21194] Updated weights for policy 1, policy_version 63620 (0.0009) +[2023-10-08 18:19:28,065][21195] Updated weights for policy 0, policy_version 64110 (0.0007) +[2023-10-08 18:19:28,227][21194] Updated weights for policy 1, policy_version 63630 (0.0009) +[2023-10-08 18:19:28,437][21195] Updated weights for policy 0, policy_version 64120 (0.0008) +[2023-10-08 18:19:28,588][21194] Updated weights for policy 1, policy_version 63640 (0.0008) +[2023-10-08 18:19:28,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 130809856. Throughput: 0: 1740.5, 1: 1706.8. Samples: 32713788. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:28,804][19739] Avg episode reward: [(0, '1002.900'), (1, '746.600')] +[2023-10-08 18:19:32,378][21195] Updated weights for policy 0, policy_version 64130 (0.0010) +[2023-10-08 18:19:32,519][21194] Updated weights for policy 1, policy_version 63650 (0.0009) +[2023-10-08 18:19:32,752][21195] Updated weights for policy 0, policy_version 64140 (0.0009) +[2023-10-08 18:19:32,871][21194] Updated weights for policy 1, policy_version 63660 (0.0009) +[2023-10-08 18:19:33,132][21195] Updated weights for policy 0, policy_version 64150 (0.0008) +[2023-10-08 18:19:33,247][21194] Updated weights for policy 1, policy_version 63670 (0.0007) +[2023-10-08 18:19:33,495][21195] Updated weights for policy 0, policy_version 64160 (0.0007) +[2023-10-08 18:19:33,607][21194] Updated weights for policy 1, policy_version 63680 (0.0008) +[2023-10-08 18:19:33,803][19739] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 130908160. Throughput: 0: 1706.9, 1: 1712.8. Samples: 32728164. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:33,803][19739] Avg episode reward: [(0, '1002.900'), (1, '761.810')] +[2023-10-08 18:19:37,381][21195] Updated weights for policy 0, policy_version 64170 (0.0009) +[2023-10-08 18:19:37,583][21194] Updated weights for policy 1, policy_version 63690 (0.0007) +[2023-10-08 18:19:37,752][21195] Updated weights for policy 0, policy_version 64180 (0.0008) +[2023-10-08 18:19:37,954][21194] Updated weights for policy 1, policy_version 63700 (0.0008) +[2023-10-08 18:19:38,113][21195] Updated weights for policy 0, policy_version 64190 (0.0008) +[2023-10-08 18:19:38,318][21194] Updated weights for policy 1, policy_version 63710 (0.0008) +[2023-10-08 18:19:38,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 130973696. Throughput: 0: 1739.2, 1: 1711.1. Samples: 32744728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:19:38,803][19739] Avg episode reward: [(0, '1002.900'), (1, '761.900')] +[2023-10-08 18:19:41,969][21195] Updated weights for policy 0, policy_version 64200 (0.0010) +[2023-10-08 18:19:42,343][21195] Updated weights for policy 0, policy_version 64210 (0.0008) +[2023-10-08 18:19:42,457][21194] Updated weights for policy 1, policy_version 63720 (0.0008) +[2023-10-08 18:19:42,704][21195] Updated weights for policy 0, policy_version 64220 (0.0007) +[2023-10-08 18:19:42,830][21194] Updated weights for policy 1, policy_version 63730 (0.0008) +[2023-10-08 18:19:43,189][21194] Updated weights for policy 1, policy_version 63740 (0.0010) +[2023-10-08 18:19:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 131039232. Throughput: 0: 1706.3, 1: 1684.7. Samples: 32763814. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:19:43,803][19739] Avg episode reward: [(0, '1002.900'), (1, '761.900')] +[2023-10-08 18:19:46,836][21195] Updated weights for policy 0, policy_version 64230 (0.0010) +[2023-10-08 18:19:47,109][21194] Updated weights for policy 1, policy_version 63750 (0.0009) +[2023-10-08 18:19:47,201][21195] Updated weights for policy 0, policy_version 64240 (0.0007) +[2023-10-08 18:19:47,468][21194] Updated weights for policy 1, policy_version 63760 (0.0009) +[2023-10-08 18:19:47,566][21195] Updated weights for policy 0, policy_version 64250 (0.0008) +[2023-10-08 18:19:47,827][21194] Updated weights for policy 1, policy_version 63770 (0.0008) +[2023-10-08 18:19:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 131104768. Throughput: 0: 1707.1, 1: 1710.9. Samples: 32779954. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:19:48,803][19739] Avg episode reward: [(0, '1002.900'), (1, '777.130')] +[2023-10-08 18:19:51,488][21195] Updated weights for policy 0, policy_version 64260 (0.0007) +[2023-10-08 18:19:51,718][21194] Updated weights for policy 1, policy_version 63780 (0.0010) +[2023-10-08 18:19:51,858][21195] Updated weights for policy 0, policy_version 64270 (0.0009) +[2023-10-08 18:19:52,093][21194] Updated weights for policy 1, policy_version 63790 (0.0009) +[2023-10-08 18:19:52,226][21195] Updated weights for policy 0, policy_version 64280 (0.0009) +[2023-10-08 18:19:52,450][21194] Updated weights for policy 1, policy_version 63800 (0.0008) +[2023-10-08 18:19:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 131170304. Throughput: 0: 1719.9, 1: 1705.8. Samples: 32795870. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:19:53,803][19739] Avg episode reward: [(0, '1002.900'), (1, '762.330')] +[2023-10-08 18:19:56,216][21195] Updated weights for policy 0, policy_version 64290 (0.0007) +[2023-10-08 18:19:56,583][21194] Updated weights for policy 1, policy_version 63810 (0.0009) +[2023-10-08 18:19:56,587][21195] Updated weights for policy 0, policy_version 64300 (0.0009) +[2023-10-08 18:19:56,950][21194] Updated weights for policy 1, policy_version 63820 (0.0007) +[2023-10-08 18:19:56,953][21195] Updated weights for policy 0, policy_version 64310 (0.0008) +[2023-10-08 18:19:57,311][21195] Updated weights for policy 0, policy_version 64320 (0.0007) +[2023-10-08 18:19:57,323][21194] Updated weights for policy 1, policy_version 63830 (0.0009) +[2023-10-08 18:19:57,700][21194] Updated weights for policy 1, policy_version 63840 (0.0007) +[2023-10-08 18:19:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 131235840. Throughput: 0: 1699.3, 1: 1687.9. Samples: 32815442. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:19:58,803][19739] Avg episode reward: [(0, '1002.900'), (1, '792.300')] +[2023-10-08 18:20:01,223][21195] Updated weights for policy 0, policy_version 64330 (0.0009) +[2023-10-08 18:20:01,585][21195] Updated weights for policy 0, policy_version 64340 (0.0008) +[2023-10-08 18:20:01,691][21194] Updated weights for policy 1, policy_version 63850 (0.0008) +[2023-10-08 18:20:01,955][21195] Updated weights for policy 0, policy_version 64350 (0.0007) +[2023-10-08 18:20:02,052][21194] Updated weights for policy 1, policy_version 63860 (0.0008) +[2023-10-08 18:20:02,413][21194] Updated weights for policy 1, policy_version 63870 (0.0007) +[2023-10-08 18:20:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 131301376. Throughput: 0: 1723.0, 1: 1718.1. Samples: 32832054. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:20:03,803][19739] Avg episode reward: [(0, '1002.900'), (1, '792.300')] +[2023-10-08 18:20:05,910][21195] Updated weights for policy 0, policy_version 64360 (0.0008) +[2023-10-08 18:20:06,279][21195] Updated weights for policy 0, policy_version 64370 (0.0009) +[2023-10-08 18:20:06,510][21194] Updated weights for policy 1, policy_version 63880 (0.0007) +[2023-10-08 18:20:06,646][21195] Updated weights for policy 0, policy_version 64380 (0.0007) +[2023-10-08 18:20:06,878][21194] Updated weights for policy 1, policy_version 63890 (0.0008) +[2023-10-08 18:20:07,246][21194] Updated weights for policy 1, policy_version 63900 (0.0007) +[2023-10-08 18:20:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 131366912. Throughput: 0: 1701.5, 1: 1702.4. Samples: 32846536. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:20:08,803][19739] Avg episode reward: [(0, '1001.840'), (1, '792.300')] +[2023-10-08 18:20:10,566][21195] Updated weights for policy 0, policy_version 64390 (0.0007) +[2023-10-08 18:20:10,940][21195] Updated weights for policy 0, policy_version 64400 (0.0009) +[2023-10-08 18:20:11,086][21194] Updated weights for policy 1, policy_version 63910 (0.0007) +[2023-10-08 18:20:11,307][21195] Updated weights for policy 0, policy_version 64410 (0.0009) +[2023-10-08 18:20:11,459][21194] Updated weights for policy 1, policy_version 63920 (0.0007) +[2023-10-08 18:20:11,828][21194] Updated weights for policy 1, policy_version 63930 (0.0009) +[2023-10-08 18:20:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 131432448. Throughput: 0: 1707.6, 1: 1707.6. Samples: 32867472. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:20:13,804][19739] Avg episode reward: [(0, '1001.840'), (1, '792.300')] +[2023-10-08 18:20:15,377][21195] Updated weights for policy 0, policy_version 64420 (0.0009) +[2023-10-08 18:20:15,717][21194] Updated weights for policy 1, policy_version 63940 (0.0008) +[2023-10-08 18:20:15,743][21195] Updated weights for policy 0, policy_version 64430 (0.0010) +[2023-10-08 18:20:16,083][21194] Updated weights for policy 1, policy_version 63950 (0.0009) +[2023-10-08 18:20:16,105][21195] Updated weights for policy 0, policy_version 64440 (0.0008) +[2023-10-08 18:20:16,458][21194] Updated weights for policy 1, policy_version 63960 (0.0009) +[2023-10-08 18:20:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 131497984. Throughput: 0: 1738.7, 1: 1717.7. Samples: 32883702. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:20:18,803][19739] Avg episode reward: [(0, '1001.840'), (1, '792.300')] +[2023-10-08 18:20:19,909][21195] Updated weights for policy 0, policy_version 64450 (0.0007) +[2023-10-08 18:20:20,271][21195] Updated weights for policy 0, policy_version 64460 (0.0008) +[2023-10-08 18:20:20,345][21194] Updated weights for policy 1, policy_version 63970 (0.0008) +[2023-10-08 18:20:20,634][21195] Updated weights for policy 0, policy_version 64470 (0.0009) +[2023-10-08 18:20:20,699][21194] Updated weights for policy 1, policy_version 63980 (0.0008) +[2023-10-08 18:20:21,005][21195] Updated weights for policy 0, policy_version 64480 (0.0008) +[2023-10-08 18:20:21,063][21194] Updated weights for policy 1, policy_version 63990 (0.0008) +[2023-10-08 18:20:21,438][21194] Updated weights for policy 1, policy_version 64000 (0.0010) +[2023-10-08 18:20:23,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 131563520. Throughput: 0: 1704.6, 1: 1700.4. Samples: 32897950. Policy #0 lag: (min: 5.0, avg: 12.9, max: 37.0) +[2023-10-08 18:20:23,803][19739] Avg episode reward: [(0, '1001.840'), (1, '792.300')] +[2023-10-08 18:20:24,810][21195] Updated weights for policy 0, policy_version 64490 (0.0009) +[2023-10-08 18:20:25,177][21195] Updated weights for policy 0, policy_version 64500 (0.0007) +[2023-10-08 18:20:25,502][21194] Updated weights for policy 1, policy_version 64010 (0.0008) +[2023-10-08 18:20:25,547][21195] Updated weights for policy 0, policy_version 64510 (0.0009) +[2023-10-08 18:20:25,875][21194] Updated weights for policy 1, policy_version 64020 (0.0007) +[2023-10-08 18:20:26,230][21194] Updated weights for policy 1, policy_version 64030 (0.0008) +[2023-10-08 18:20:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 131629056. Throughput: 0: 1736.6, 1: 1721.0. Samples: 32919408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:28,803][19739] Avg episode reward: [(0, '1001.970'), (1, '792.300')] +[2023-10-08 18:20:29,502][21195] Updated weights for policy 0, policy_version 64520 (0.0008) +[2023-10-08 18:20:29,867][21195] Updated weights for policy 0, policy_version 64530 (0.0008) +[2023-10-08 18:20:30,174][21194] Updated weights for policy 1, policy_version 64040 (0.0007) +[2023-10-08 18:20:30,245][21195] Updated weights for policy 0, policy_version 64540 (0.0009) +[2023-10-08 18:20:30,538][21194] Updated weights for policy 1, policy_version 64050 (0.0007) +[2023-10-08 18:20:30,916][21194] Updated weights for policy 1, policy_version 64060 (0.0009) +[2023-10-08 18:20:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 131694592. Throughput: 0: 1741.5, 1: 1704.1. Samples: 32935008. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:33,803][19739] Avg episode reward: [(0, '1001.970'), (1, '792.300')] +[2023-10-08 18:20:34,071][21195] Updated weights for policy 0, policy_version 64550 (0.0010) +[2023-10-08 18:20:34,435][21195] Updated weights for policy 0, policy_version 64560 (0.0008) +[2023-10-08 18:20:34,713][21194] Updated weights for policy 1, policy_version 64070 (0.0008) +[2023-10-08 18:20:34,801][21195] Updated weights for policy 0, policy_version 64570 (0.0007) +[2023-10-08 18:20:35,072][21194] Updated weights for policy 1, policy_version 64080 (0.0008) +[2023-10-08 18:20:35,441][21194] Updated weights for policy 1, policy_version 64090 (0.0008) +[2023-10-08 18:20:38,708][21195] Updated weights for policy 0, policy_version 64580 (0.0007) +[2023-10-08 18:20:38,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 131760128. Throughput: 0: 1727.5, 1: 1708.2. Samples: 32950474. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:38,804][19739] Avg episode reward: [(0, '1001.970'), (1, '792.300')] +[2023-10-08 18:20:39,073][21195] Updated weights for policy 0, policy_version 64590 (0.0008) +[2023-10-08 18:20:39,316][21194] Updated weights for policy 1, policy_version 64100 (0.0009) +[2023-10-08 18:20:39,446][21195] Updated weights for policy 0, policy_version 64600 (0.0007) +[2023-10-08 18:20:39,674][21194] Updated weights for policy 1, policy_version 64110 (0.0008) +[2023-10-08 18:20:40,039][21194] Updated weights for policy 1, policy_version 64120 (0.0007) +[2023-10-08 18:20:43,185][21195] Updated weights for policy 0, policy_version 64610 (0.0008) +[2023-10-08 18:20:43,549][21195] Updated weights for policy 0, policy_version 64620 (0.0010) +[2023-10-08 18:20:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 131825664. Throughput: 0: 1749.8, 1: 1726.0. Samples: 32971850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:43,803][19739] Avg episode reward: [(0, '1001.970'), (1, '793.020')] +[2023-10-08 18:20:43,912][21195] Updated weights for policy 0, policy_version 64630 (0.0009) +[2023-10-08 18:20:44,144][21194] Updated weights for policy 1, policy_version 64130 (0.0008) +[2023-10-08 18:20:44,285][21195] Updated weights for policy 0, policy_version 64640 (0.0008) +[2023-10-08 18:20:44,515][21194] Updated weights for policy 1, policy_version 64140 (0.0009) +[2023-10-08 18:20:44,870][21194] Updated weights for policy 1, policy_version 64150 (0.0008) +[2023-10-08 18:20:45,233][21194] Updated weights for policy 1, policy_version 64160 (0.0008) +[2023-10-08 18:20:48,012][21195] Updated weights for policy 0, policy_version 64650 (0.0008) +[2023-10-08 18:20:48,384][21195] Updated weights for policy 0, policy_version 64660 (0.0008) +[2023-10-08 18:20:48,757][21195] Updated weights for policy 0, policy_version 64670 (0.0007) +[2023-10-08 18:20:48,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 131891200. Throughput: 0: 1730.0, 1: 1696.1. Samples: 32986228. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:48,803][19739] Avg episode reward: [(0, '1001.970'), (1, '777.680')] +[2023-10-08 18:20:49,330][21194] Updated weights for policy 1, policy_version 64170 (0.0010) +[2023-10-08 18:20:49,692][21194] Updated weights for policy 1, policy_version 64180 (0.0011) +[2023-10-08 18:20:50,058][21194] Updated weights for policy 1, policy_version 64190 (0.0011) +[2023-10-08 18:20:52,891][21195] Updated weights for policy 0, policy_version 64680 (0.0007) +[2023-10-08 18:20:53,256][21195] Updated weights for policy 0, policy_version 64690 (0.0008) +[2023-10-08 18:20:53,629][21195] Updated weights for policy 0, policy_version 64700 (0.0007) +[2023-10-08 18:20:53,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 131989504. Throughput: 0: 1755.6, 1: 1717.1. Samples: 33002804. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:53,803][19739] Avg episode reward: [(0, '1002.370'), (1, '777.680')] +[2023-10-08 18:20:53,944][21194] Updated weights for policy 1, policy_version 64200 (0.0008) +[2023-10-08 18:20:54,306][21194] Updated weights for policy 1, policy_version 64210 (0.0007) +[2023-10-08 18:20:54,676][21194] Updated weights for policy 1, policy_version 64220 (0.0007) +[2023-10-08 18:20:57,386][21195] Updated weights for policy 0, policy_version 64710 (0.0008) +[2023-10-08 18:20:57,752][21195] Updated weights for policy 0, policy_version 64720 (0.0009) +[2023-10-08 18:20:58,128][21195] Updated weights for policy 0, policy_version 64730 (0.0008) +[2023-10-08 18:20:58,708][21194] Updated weights for policy 1, policy_version 64230 (0.0008) +[2023-10-08 18:20:58,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 132055040. Throughput: 0: 1746.5, 1: 1724.5. Samples: 33023670. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:20:58,803][19739] Avg episode reward: [(0, '1002.320'), (1, '769.010')] +[2023-10-08 18:20:59,091][21194] Updated weights for policy 1, policy_version 64240 (0.0008) +[2023-10-08 18:20:59,460][21194] Updated weights for policy 1, policy_version 64250 (0.0008) +[2023-10-08 18:21:01,843][21195] Updated weights for policy 0, policy_version 64740 (0.0007) +[2023-10-08 18:21:02,244][21195] Updated weights for policy 0, policy_version 64750 (0.0008) +[2023-10-08 18:21:02,615][21195] Updated weights for policy 0, policy_version 64760 (0.0009) +[2023-10-08 18:21:03,321][21194] Updated weights for policy 1, policy_version 64260 (0.0007) +[2023-10-08 18:21:03,692][21194] Updated weights for policy 1, policy_version 64270 (0.0010) +[2023-10-08 18:21:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 132120576. Throughput: 0: 1734.2, 1: 1705.2. Samples: 33038474. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:21:03,803][19739] Avg episode reward: [(0, '1002.320'), (1, '769.010')] +[2023-10-08 18:21:04,053][21194] Updated weights for policy 1, policy_version 64280 (0.0008) +[2023-10-08 18:21:06,383][21195] Updated weights for policy 0, policy_version 64770 (0.0008) +[2023-10-08 18:21:06,750][21195] Updated weights for policy 0, policy_version 64780 (0.0009) +[2023-10-08 18:21:07,127][21195] Updated weights for policy 0, policy_version 64790 (0.0007) +[2023-10-08 18:21:07,494][21195] Updated weights for policy 0, policy_version 64800 (0.0007) +[2023-10-08 18:21:07,932][21194] Updated weights for policy 1, policy_version 64290 (0.0008) +[2023-10-08 18:21:08,298][21194] Updated weights for policy 1, policy_version 64300 (0.0010) +[2023-10-08 18:21:08,666][21194] Updated weights for policy 1, policy_version 64310 (0.0009) +[2023-10-08 18:21:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 132186112. Throughput: 0: 1759.2, 1: 1731.8. Samples: 33055042. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:08,803][19739] Avg episode reward: [(0, '1002.320'), (1, '768.830')] +[2023-10-08 18:21:09,030][21194] Updated weights for policy 1, policy_version 64320 (0.0007) +[2023-10-08 18:21:11,489][21195] Updated weights for policy 0, policy_version 64810 (0.0007) +[2023-10-08 18:21:11,856][21195] Updated weights for policy 0, policy_version 64820 (0.0007) +[2023-10-08 18:21:12,229][21195] Updated weights for policy 0, policy_version 64830 (0.0007) +[2023-10-08 18:21:13,000][21194] Updated weights for policy 1, policy_version 64330 (0.0008) +[2023-10-08 18:21:13,365][21194] Updated weights for policy 1, policy_version 64340 (0.0011) +[2023-10-08 18:21:13,745][21194] Updated weights for policy 1, policy_version 64350 (0.0009) +[2023-10-08 18:21:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 132251648. Throughput: 0: 1739.0, 1: 1723.6. Samples: 33075226. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:13,803][19739] Avg episode reward: [(0, '1004.170'), (1, '768.830')] +[2023-10-08 18:21:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000064352_65896448.pth... +[2023-10-08 18:21:13,810][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000064832_66387968.pth... +[2023-10-08 18:21:13,847][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000062752_64258048.pth +[2023-10-08 18:21:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000063200_64716800.pth +[2023-10-08 18:21:13,852][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000064352_65896448.pth +[2023-10-08 18:21:13,856][20740] Saving new best policy, reward=1004.170! +[2023-10-08 18:21:13,898][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000064832_66387968.pth +[2023-10-08 18:21:16,241][21195] Updated weights for policy 0, policy_version 64840 (0.0009) +[2023-10-08 18:21:16,606][21195] Updated weights for policy 0, policy_version 64850 (0.0007) +[2023-10-08 18:21:16,968][21195] Updated weights for policy 0, policy_version 64860 (0.0007) +[2023-10-08 18:21:17,754][21194] Updated weights for policy 1, policy_version 64360 (0.0009) +[2023-10-08 18:21:18,113][21194] Updated weights for policy 1, policy_version 64370 (0.0011) +[2023-10-08 18:21:18,487][21194] Updated weights for policy 1, policy_version 64380 (0.0008) +[2023-10-08 18:21:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 132349952. Throughput: 0: 1743.6, 1: 1725.5. Samples: 33091120. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:18,803][19739] Avg episode reward: [(0, '1005.520'), (1, '768.830')] +[2023-10-08 18:21:18,804][20740] Saving new best policy, reward=1005.520! +[2023-10-08 18:21:21,193][21195] Updated weights for policy 0, policy_version 64870 (0.0008) +[2023-10-08 18:21:21,560][21195] Updated weights for policy 0, policy_version 64880 (0.0007) +[2023-10-08 18:21:21,926][21195] Updated weights for policy 0, policy_version 64890 (0.0010) +[2023-10-08 18:21:22,327][21194] Updated weights for policy 1, policy_version 64390 (0.0008) +[2023-10-08 18:21:22,691][21194] Updated weights for policy 1, policy_version 64400 (0.0009) +[2023-10-08 18:21:23,056][21194] Updated weights for policy 1, policy_version 64410 (0.0008) +[2023-10-08 18:21:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 132415488. Throughput: 0: 1746.8, 1: 1731.1. Samples: 33106978. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:23,803][19739] Avg episode reward: [(0, '1021.280'), (1, '768.830')] +[2023-10-08 18:21:23,804][20740] Saving new best policy, reward=1021.280! +[2023-10-08 18:21:25,750][21195] Updated weights for policy 0, policy_version 64900 (0.0008) +[2023-10-08 18:21:26,111][21195] Updated weights for policy 0, policy_version 64910 (0.0008) +[2023-10-08 18:21:26,477][21195] Updated weights for policy 0, policy_version 64920 (0.0008) +[2023-10-08 18:21:26,988][21194] Updated weights for policy 1, policy_version 64420 (0.0009) +[2023-10-08 18:21:27,350][21194] Updated weights for policy 1, policy_version 64430 (0.0008) +[2023-10-08 18:21:27,712][21194] Updated weights for policy 1, policy_version 64440 (0.0009) +[2023-10-08 18:21:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 132481024. Throughput: 0: 1733.2, 1: 1709.6. Samples: 33126776. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:28,803][19739] Avg episode reward: [(0, '1021.280'), (1, '768.830')] +[2023-10-08 18:21:30,359][21195] Updated weights for policy 0, policy_version 64930 (0.0009) +[2023-10-08 18:21:30,728][21195] Updated weights for policy 0, policy_version 64940 (0.0008) +[2023-10-08 18:21:31,105][21195] Updated weights for policy 0, policy_version 64950 (0.0009) +[2023-10-08 18:21:31,480][21195] Updated weights for policy 0, policy_version 64960 (0.0010) +[2023-10-08 18:21:31,548][21194] Updated weights for policy 1, policy_version 64450 (0.0010) +[2023-10-08 18:21:31,912][21194] Updated weights for policy 1, policy_version 64460 (0.0009) +[2023-10-08 18:21:32,285][21194] Updated weights for policy 1, policy_version 64470 (0.0009) +[2023-10-08 18:21:32,656][21194] Updated weights for policy 1, policy_version 64480 (0.0007) +[2023-10-08 18:21:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 132546560. Throughput: 0: 1756.9, 1: 1741.9. Samples: 33143676. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:33,804][19739] Avg episode reward: [(0, '1021.280'), (1, '768.830')] +[2023-10-08 18:21:35,340][21195] Updated weights for policy 0, policy_version 64970 (0.0009) +[2023-10-08 18:21:35,704][21195] Updated weights for policy 0, policy_version 64980 (0.0008) +[2023-10-08 18:21:36,073][21195] Updated weights for policy 0, policy_version 64990 (0.0007) +[2023-10-08 18:21:36,557][21194] Updated weights for policy 1, policy_version 64490 (0.0008) +[2023-10-08 18:21:36,926][21194] Updated weights for policy 1, policy_version 64500 (0.0008) +[2023-10-08 18:21:37,293][21194] Updated weights for policy 1, policy_version 64510 (0.0008) +[2023-10-08 18:21:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 132612096. Throughput: 0: 1730.7, 1: 1729.8. Samples: 33158526. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:38,804][19739] Avg episode reward: [(0, '1030.470'), (1, '768.830')] +[2023-10-08 18:21:38,805][20740] Saving new best policy, reward=1030.470! +[2023-10-08 18:21:39,964][21195] Updated weights for policy 0, policy_version 65000 (0.0008) +[2023-10-08 18:21:40,331][21195] Updated weights for policy 0, policy_version 65010 (0.0009) +[2023-10-08 18:21:40,692][21195] Updated weights for policy 0, policy_version 65020 (0.0010) +[2023-10-08 18:21:41,228][21194] Updated weights for policy 1, policy_version 64520 (0.0011) +[2023-10-08 18:21:41,599][21194] Updated weights for policy 1, policy_version 64530 (0.0009) +[2023-10-08 18:21:41,961][21194] Updated weights for policy 1, policy_version 64540 (0.0008) +[2023-10-08 18:21:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 132677632. Throughput: 0: 1744.5, 1: 1716.0. Samples: 33179392. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:43,803][19739] Avg episode reward: [(0, '1015.120'), (1, '783.650')] +[2023-10-08 18:21:44,462][21195] Updated weights for policy 0, policy_version 65030 (0.0009) +[2023-10-08 18:21:44,820][21195] Updated weights for policy 0, policy_version 65040 (0.0011) +[2023-10-08 18:21:45,183][21195] Updated weights for policy 0, policy_version 65050 (0.0011) +[2023-10-08 18:21:46,154][21194] Updated weights for policy 1, policy_version 64550 (0.0011) +[2023-10-08 18:21:46,537][21194] Updated weights for policy 1, policy_version 64560 (0.0007) +[2023-10-08 18:21:46,913][21194] Updated weights for policy 1, policy_version 64570 (0.0008) +[2023-10-08 18:21:48,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 132743168. Throughput: 0: 1752.8, 1: 1740.6. Samples: 33195680. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 18:21:48,803][19739] Avg episode reward: [(0, '1015.160'), (1, '783.650')] +[2023-10-08 18:21:49,228][21195] Updated weights for policy 0, policy_version 65060 (0.0010) +[2023-10-08 18:21:49,614][21195] Updated weights for policy 0, policy_version 65070 (0.0009) +[2023-10-08 18:21:49,973][21195] Updated weights for policy 0, policy_version 65080 (0.0009) +[2023-10-08 18:21:50,846][21194] Updated weights for policy 1, policy_version 64580 (0.0010) +[2023-10-08 18:21:51,219][21194] Updated weights for policy 1, policy_version 64590 (0.0009) +[2023-10-08 18:21:51,582][21194] Updated weights for policy 1, policy_version 64600 (0.0008) +[2023-10-08 18:21:53,767][21195] Updated weights for policy 0, policy_version 65090 (0.0007) +[2023-10-08 18:21:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 132808704. Throughput: 0: 1731.3, 1: 1708.0. Samples: 33209812. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:21:53,803][19739] Avg episode reward: [(0, '1015.160'), (1, '783.650')] +[2023-10-08 18:21:54,132][21195] Updated weights for policy 0, policy_version 65100 (0.0009) +[2023-10-08 18:21:54,493][21195] Updated weights for policy 0, policy_version 65110 (0.0008) +[2023-10-08 18:21:54,851][21195] Updated weights for policy 0, policy_version 65120 (0.0009) +[2023-10-08 18:21:55,517][21194] Updated weights for policy 1, policy_version 64610 (0.0008) +[2023-10-08 18:21:55,889][21194] Updated weights for policy 1, policy_version 64620 (0.0007) +[2023-10-08 18:21:56,250][21194] Updated weights for policy 1, policy_version 64630 (0.0008) +[2023-10-08 18:21:56,623][21194] Updated weights for policy 1, policy_version 64640 (0.0008) +[2023-10-08 18:21:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 132874240. Throughput: 0: 1746.8, 1: 1715.4. Samples: 33231022. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:21:58,803][19739] Avg episode reward: [(0, '1015.130'), (1, '783.650')] +[2023-10-08 18:21:58,887][21195] Updated weights for policy 0, policy_version 65130 (0.0009) +[2023-10-08 18:21:59,258][21195] Updated weights for policy 0, policy_version 65140 (0.0008) +[2023-10-08 18:21:59,633][21195] Updated weights for policy 0, policy_version 65150 (0.0009) +[2023-10-08 18:22:00,558][21194] Updated weights for policy 1, policy_version 64650 (0.0008) +[2023-10-08 18:22:00,918][21194] Updated weights for policy 1, policy_version 64660 (0.0007) +[2023-10-08 18:22:01,285][21194] Updated weights for policy 1, policy_version 64670 (0.0007) +[2023-10-08 18:22:03,694][21195] Updated weights for policy 0, policy_version 65160 (0.0007) +[2023-10-08 18:22:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 132939776. Throughput: 0: 1728.7, 1: 1723.7. Samples: 33246478. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:22:03,803][19739] Avg episode reward: [(0, '1015.130'), (1, '783.880')] +[2023-10-08 18:22:04,054][21195] Updated weights for policy 0, policy_version 65170 (0.0009) +[2023-10-08 18:22:04,416][21195] Updated weights for policy 0, policy_version 65180 (0.0007) +[2023-10-08 18:22:05,221][21194] Updated weights for policy 1, policy_version 64680 (0.0011) +[2023-10-08 18:22:05,588][21194] Updated weights for policy 1, policy_version 64690 (0.0009) +[2023-10-08 18:22:05,961][21194] Updated weights for policy 1, policy_version 64700 (0.0010) +[2023-10-08 18:22:08,259][21195] Updated weights for policy 0, policy_version 65190 (0.0007) +[2023-10-08 18:22:08,628][21195] Updated weights for policy 0, policy_version 65200 (0.0007) +[2023-10-08 18:22:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 133005312. Throughput: 0: 1736.6, 1: 1707.7. Samples: 33261972. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:22:08,803][19739] Avg episode reward: [(0, '1015.130'), (1, '783.880')] +[2023-10-08 18:22:08,984][21195] Updated weights for policy 0, policy_version 65210 (0.0007) +[2023-10-08 18:22:09,881][21194] Updated weights for policy 1, policy_version 64710 (0.0010) +[2023-10-08 18:22:10,237][21194] Updated weights for policy 1, policy_version 64720 (0.0010) +[2023-10-08 18:22:10,599][21194] Updated weights for policy 1, policy_version 64730 (0.0011) +[2023-10-08 18:22:12,947][21195] Updated weights for policy 0, policy_version 65220 (0.0008) +[2023-10-08 18:22:13,312][21195] Updated weights for policy 0, policy_version 65230 (0.0007) +[2023-10-08 18:22:13,677][21195] Updated weights for policy 0, policy_version 65240 (0.0008) +[2023-10-08 18:22:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 133070848. Throughput: 0: 1749.6, 1: 1736.5. Samples: 33283648. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:22:13,803][19739] Avg episode reward: [(0, '1015.130'), (1, '783.880')] +[2023-10-08 18:22:14,598][21194] Updated weights for policy 1, policy_version 64740 (0.0010) +[2023-10-08 18:22:14,974][21194] Updated weights for policy 1, policy_version 64750 (0.0009) +[2023-10-08 18:22:15,340][21194] Updated weights for policy 1, policy_version 64760 (0.0010) +[2023-10-08 18:22:17,672][21195] Updated weights for policy 0, policy_version 65250 (0.0008) +[2023-10-08 18:22:18,037][21195] Updated weights for policy 0, policy_version 65260 (0.0010) +[2023-10-08 18:22:18,411][21195] Updated weights for policy 0, policy_version 65270 (0.0010) +[2023-10-08 18:22:18,770][21195] Updated weights for policy 0, policy_version 65280 (0.0011) +[2023-10-08 18:22:18,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 133169152. Throughput: 0: 1711.3, 1: 1705.0. Samples: 33297412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:22:18,804][19739] Avg episode reward: [(0, '1015.130'), (1, '783.880')] +[2023-10-08 18:22:19,075][21194] Updated weights for policy 1, policy_version 64770 (0.0010) +[2023-10-08 18:22:19,437][21194] Updated weights for policy 1, policy_version 64780 (0.0007) +[2023-10-08 18:22:19,795][21194] Updated weights for policy 1, policy_version 64790 (0.0007) +[2023-10-08 18:22:20,171][21194] Updated weights for policy 1, policy_version 64800 (0.0007) +[2023-10-08 18:22:22,745][21195] Updated weights for policy 0, policy_version 65290 (0.0008) +[2023-10-08 18:22:23,117][21195] Updated weights for policy 0, policy_version 65300 (0.0008) +[2023-10-08 18:22:23,498][21195] Updated weights for policy 0, policy_version 65310 (0.0008) +[2023-10-08 18:22:23,803][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 133234688. Throughput: 0: 1739.8, 1: 1721.8. Samples: 33314298. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:22:23,803][19739] Avg episode reward: [(0, '1015.130'), (1, '783.880')] +[2023-10-08 18:22:24,050][21194] Updated weights for policy 1, policy_version 64810 (0.0007) +[2023-10-08 18:22:24,413][21194] Updated weights for policy 1, policy_version 64820 (0.0009) +[2023-10-08 18:22:24,787][21194] Updated weights for policy 1, policy_version 64830 (0.0007) +[2023-10-08 18:22:27,402][21195] Updated weights for policy 0, policy_version 65320 (0.0010) +[2023-10-08 18:22:27,785][21195] Updated weights for policy 0, policy_version 65330 (0.0011) +[2023-10-08 18:22:28,154][21195] Updated weights for policy 0, policy_version 65340 (0.0007) +[2023-10-08 18:22:28,745][21194] Updated weights for policy 1, policy_version 64840 (0.0008) +[2023-10-08 18:22:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 133300224. Throughput: 0: 1719.7, 1: 1740.0. Samples: 33335082. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:22:28,803][19739] Avg episode reward: [(0, '1015.940'), (1, '783.880')] +[2023-10-08 18:22:29,115][21194] Updated weights for policy 1, policy_version 64850 (0.0007) +[2023-10-08 18:22:29,476][21194] Updated weights for policy 1, policy_version 64860 (0.0009) +[2023-10-08 18:22:32,008][21195] Updated weights for policy 0, policy_version 65350 (0.0009) +[2023-10-08 18:22:32,373][21195] Updated weights for policy 0, policy_version 65360 (0.0009) +[2023-10-08 18:22:32,748][21195] Updated weights for policy 0, policy_version 65370 (0.0008) +[2023-10-08 18:22:33,518][21194] Updated weights for policy 1, policy_version 64870 (0.0008) +[2023-10-08 18:22:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 133365760. Throughput: 0: 1709.0, 1: 1716.2. Samples: 33349812. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:22:33,803][19739] Avg episode reward: [(0, '1016.070'), (1, '783.880')] +[2023-10-08 18:22:33,905][21194] Updated weights for policy 1, policy_version 64880 (0.0009) +[2023-10-08 18:22:34,271][21194] Updated weights for policy 1, policy_version 64890 (0.0010) +[2023-10-08 18:22:36,734][21195] Updated weights for policy 0, policy_version 65380 (0.0009) +[2023-10-08 18:22:37,121][21195] Updated weights for policy 0, policy_version 65390 (0.0008) +[2023-10-08 18:22:37,485][21195] Updated weights for policy 0, policy_version 65400 (0.0007) +[2023-10-08 18:22:38,091][21194] Updated weights for policy 1, policy_version 64900 (0.0009) +[2023-10-08 18:22:38,453][21194] Updated weights for policy 1, policy_version 64910 (0.0008) +[2023-10-08 18:22:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 133431296. Throughput: 0: 1734.5, 1: 1743.4. Samples: 33366318. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:22:38,803][19739] Avg episode reward: [(0, '1016.070'), (1, '783.880')] +[2023-10-08 18:22:38,820][21194] Updated weights for policy 1, policy_version 64920 (0.0009) +[2023-10-08 18:22:41,315][21195] Updated weights for policy 0, policy_version 65410 (0.0009) +[2023-10-08 18:22:41,694][21195] Updated weights for policy 0, policy_version 65420 (0.0008) +[2023-10-08 18:22:42,051][21195] Updated weights for policy 0, policy_version 65430 (0.0008) +[2023-10-08 18:22:42,421][21195] Updated weights for policy 0, policy_version 65440 (0.0007) +[2023-10-08 18:22:42,782][21194] Updated weights for policy 1, policy_version 64930 (0.0010) +[2023-10-08 18:22:43,155][21194] Updated weights for policy 1, policy_version 64940 (0.0011) +[2023-10-08 18:22:43,521][21194] Updated weights for policy 1, policy_version 64950 (0.0010) +[2023-10-08 18:22:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 133496832. Throughput: 0: 1711.4, 1: 1743.9. Samples: 33386510. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:22:43,803][19739] Avg episode reward: [(0, '1016.070'), (1, '784.000')] +[2023-10-08 18:22:43,885][21194] Updated weights for policy 1, policy_version 64960 (0.0008) +[2023-10-08 18:22:46,470][21195] Updated weights for policy 0, policy_version 65450 (0.0008) +[2023-10-08 18:22:46,840][21195] Updated weights for policy 0, policy_version 65460 (0.0007) +[2023-10-08 18:22:47,210][21195] Updated weights for policy 0, policy_version 65470 (0.0007) +[2023-10-08 18:22:47,811][21194] Updated weights for policy 1, policy_version 64970 (0.0007) +[2023-10-08 18:22:48,172][21194] Updated weights for policy 1, policy_version 64980 (0.0008) +[2023-10-08 18:22:48,541][21194] Updated weights for policy 1, policy_version 64990 (0.0010) +[2023-10-08 18:22:48,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 133595136. Throughput: 0: 1723.7, 1: 1736.6. Samples: 33402194. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:22:48,803][19739] Avg episode reward: [(0, '1016.070'), (1, '784.150')] +[2023-10-08 18:22:51,185][21195] Updated weights for policy 0, policy_version 65480 (0.0010) +[2023-10-08 18:22:51,558][21195] Updated weights for policy 0, policy_version 65490 (0.0009) +[2023-10-08 18:22:51,934][21195] Updated weights for policy 0, policy_version 65500 (0.0010) +[2023-10-08 18:22:52,417][21194] Updated weights for policy 1, policy_version 65000 (0.0009) +[2023-10-08 18:22:52,790][21194] Updated weights for policy 1, policy_version 65010 (0.0008) +[2023-10-08 18:22:53,149][21194] Updated weights for policy 1, policy_version 65020 (0.0008) +[2023-10-08 18:22:53,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 133660672. Throughput: 0: 1713.2, 1: 1755.4. Samples: 33418062. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:22:53,804][19739] Avg episode reward: [(0, '1016.070'), (1, '784.150')] +[2023-10-08 18:22:55,895][21195] Updated weights for policy 0, policy_version 65510 (0.0010) +[2023-10-08 18:22:56,268][21195] Updated weights for policy 0, policy_version 65520 (0.0010) +[2023-10-08 18:22:56,636][21195] Updated weights for policy 0, policy_version 65530 (0.0008) +[2023-10-08 18:22:57,214][21194] Updated weights for policy 1, policy_version 65030 (0.0007) +[2023-10-08 18:22:57,576][21194] Updated weights for policy 1, policy_version 65040 (0.0008) +[2023-10-08 18:22:57,943][21194] Updated weights for policy 1, policy_version 65050 (0.0007) +[2023-10-08 18:22:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 133726208. Throughput: 0: 1704.0, 1: 1729.2. Samples: 33438144. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:22:58,803][19739] Avg episode reward: [(0, '1001.010'), (1, '784.150')] +[2023-10-08 18:23:00,562][21195] Updated weights for policy 0, policy_version 65540 (0.0007) +[2023-10-08 18:23:00,930][21195] Updated weights for policy 0, policy_version 65550 (0.0009) +[2023-10-08 18:23:01,297][21195] Updated weights for policy 0, policy_version 65560 (0.0007) +[2023-10-08 18:23:01,841][21194] Updated weights for policy 1, policy_version 65060 (0.0009) +[2023-10-08 18:23:02,205][21194] Updated weights for policy 1, policy_version 65070 (0.0008) +[2023-10-08 18:23:02,563][21194] Updated weights for policy 1, policy_version 65080 (0.0010) +[2023-10-08 18:23:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 133791744. Throughput: 0: 1739.9, 1: 1755.8. Samples: 33454718. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:23:03,803][19739] Avg episode reward: [(0, '1001.010'), (1, '811.080')] +[2023-10-08 18:23:05,223][21195] Updated weights for policy 0, policy_version 65570 (0.0007) +[2023-10-08 18:23:05,597][21195] Updated weights for policy 0, policy_version 65580 (0.0008) +[2023-10-08 18:23:05,969][21195] Updated weights for policy 0, policy_version 65590 (0.0007) +[2023-10-08 18:23:06,332][21195] Updated weights for policy 0, policy_version 65600 (0.0008) +[2023-10-08 18:23:06,522][21194] Updated weights for policy 1, policy_version 65090 (0.0009) +[2023-10-08 18:23:06,886][21194] Updated weights for policy 1, policy_version 65100 (0.0007) +[2023-10-08 18:23:07,258][21194] Updated weights for policy 1, policy_version 65110 (0.0009) +[2023-10-08 18:23:07,621][21194] Updated weights for policy 1, policy_version 65120 (0.0008) +[2023-10-08 18:23:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 133857280. Throughput: 0: 1708.0, 1: 1734.6. Samples: 33469216. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:23:08,803][19739] Avg episode reward: [(0, '1001.010'), (1, '811.080')] +[2023-10-08 18:23:10,190][21195] Updated weights for policy 0, policy_version 65610 (0.0007) +[2023-10-08 18:23:10,552][21195] Updated weights for policy 0, policy_version 65620 (0.0007) +[2023-10-08 18:23:10,922][21195] Updated weights for policy 0, policy_version 65630 (0.0009) +[2023-10-08 18:23:11,666][21194] Updated weights for policy 1, policy_version 65130 (0.0007) +[2023-10-08 18:23:12,029][21194] Updated weights for policy 1, policy_version 65140 (0.0008) +[2023-10-08 18:23:12,393][21194] Updated weights for policy 1, policy_version 65150 (0.0008) +[2023-10-08 18:23:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 133922816. Throughput: 0: 1729.2, 1: 1711.4. Samples: 33489908. Policy #0 lag: (min: 31.0, avg: 35.2, max: 63.0) +[2023-10-08 18:23:13,803][19739] Avg episode reward: [(0, '1001.010'), (1, '811.080')] +[2023-10-08 18:23:13,810][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000065632_67207168.pth... +[2023-10-08 18:23:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000065152_66715648.pth... +[2023-10-08 18:23:13,840][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000063552_65077248.pth +[2023-10-08 18:23:13,843][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000064032_65568768.pth +[2023-10-08 18:23:14,886][21195] Updated weights for policy 0, policy_version 65640 (0.0007) +[2023-10-08 18:23:15,266][21195] Updated weights for policy 0, policy_version 65650 (0.0008) +[2023-10-08 18:23:15,641][21195] Updated weights for policy 0, policy_version 65660 (0.0009) +[2023-10-08 18:23:16,393][21194] Updated weights for policy 1, policy_version 65160 (0.0009) +[2023-10-08 18:23:16,760][21194] Updated weights for policy 1, policy_version 65170 (0.0009) +[2023-10-08 18:23:17,135][21194] Updated weights for policy 1, policy_version 65180 (0.0009) +[2023-10-08 18:23:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 133988352. Throughput: 0: 1737.5, 1: 1743.2. Samples: 33506446. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:18,804][19739] Avg episode reward: [(0, '1001.010'), (1, '812.050')] +[2023-10-08 18:23:19,560][21195] Updated weights for policy 0, policy_version 65670 (0.0009) +[2023-10-08 18:23:19,929][21195] Updated weights for policy 0, policy_version 65680 (0.0008) +[2023-10-08 18:23:20,288][21195] Updated weights for policy 0, policy_version 65690 (0.0008) +[2023-10-08 18:23:21,133][21194] Updated weights for policy 1, policy_version 65190 (0.0008) +[2023-10-08 18:23:21,499][21194] Updated weights for policy 1, policy_version 65200 (0.0008) +[2023-10-08 18:23:21,867][21194] Updated weights for policy 1, policy_version 65210 (0.0009) +[2023-10-08 18:23:23,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13653.2, 300 sec: 13773.6). Total num frames: 134053888. Throughput: 0: 1716.0, 1: 1714.7. Samples: 33520698. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:23,804][19739] Avg episode reward: [(0, '1001.010'), (1, '812.050')] +[2023-10-08 18:23:24,228][21195] Updated weights for policy 0, policy_version 65700 (0.0009) +[2023-10-08 18:23:24,612][21195] Updated weights for policy 0, policy_version 65710 (0.0011) +[2023-10-08 18:23:24,973][21195] Updated weights for policy 0, policy_version 65720 (0.0010) +[2023-10-08 18:23:25,786][21194] Updated weights for policy 1, policy_version 65220 (0.0010) +[2023-10-08 18:23:26,180][21194] Updated weights for policy 1, policy_version 65230 (0.0009) +[2023-10-08 18:23:26,542][21194] Updated weights for policy 1, policy_version 65240 (0.0007) +[2023-10-08 18:23:28,738][21195] Updated weights for policy 0, policy_version 65730 (0.0009) +[2023-10-08 18:23:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 134119424. Throughput: 0: 1743.0, 1: 1716.2. Samples: 33542172. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:28,803][19739] Avg episode reward: [(0, '1001.010'), (1, '806.210')] +[2023-10-08 18:23:29,108][21195] Updated weights for policy 0, policy_version 65740 (0.0009) +[2023-10-08 18:23:29,471][21195] Updated weights for policy 0, policy_version 65750 (0.0008) +[2023-10-08 18:23:29,848][21195] Updated weights for policy 0, policy_version 65760 (0.0008) +[2023-10-08 18:23:30,241][21194] Updated weights for policy 1, policy_version 65250 (0.0008) +[2023-10-08 18:23:30,612][21194] Updated weights for policy 1, policy_version 65260 (0.0009) +[2023-10-08 18:23:30,974][21194] Updated weights for policy 1, policy_version 65270 (0.0009) +[2023-10-08 18:23:31,350][21194] Updated weights for policy 1, policy_version 65280 (0.0009) +[2023-10-08 18:23:33,803][19739] Fps is (10 sec: 13107.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 134184960. Throughput: 0: 1735.9, 1: 1721.2. Samples: 33557766. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:33,803][19739] Avg episode reward: [(0, '1017.340'), (1, '806.420')] +[2023-10-08 18:23:33,938][21195] Updated weights for policy 0, policy_version 65770 (0.0009) +[2023-10-08 18:23:34,306][21195] Updated weights for policy 0, policy_version 65780 (0.0007) +[2023-10-08 18:23:34,682][21195] Updated weights for policy 0, policy_version 65790 (0.0007) +[2023-10-08 18:23:35,346][21194] Updated weights for policy 1, policy_version 65290 (0.0009) +[2023-10-08 18:23:35,719][21194] Updated weights for policy 1, policy_version 65300 (0.0009) +[2023-10-08 18:23:36,080][21194] Updated weights for policy 1, policy_version 65310 (0.0007) +[2023-10-08 18:23:38,434][21195] Updated weights for policy 0, policy_version 65800 (0.0008) +[2023-10-08 18:23:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 134250496. Throughput: 0: 1739.4, 1: 1706.8. Samples: 33573138. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:38,803][19739] Avg episode reward: [(0, '1017.650'), (1, '820.990')] +[2023-10-08 18:23:38,810][21195] Updated weights for policy 0, policy_version 65810 (0.0008) +[2023-10-08 18:23:39,179][21195] Updated weights for policy 0, policy_version 65820 (0.0010) +[2023-10-08 18:23:39,858][21194] Updated weights for policy 1, policy_version 65320 (0.0008) +[2023-10-08 18:23:40,223][21194] Updated weights for policy 1, policy_version 65330 (0.0010) +[2023-10-08 18:23:40,588][21194] Updated weights for policy 1, policy_version 65340 (0.0011) +[2023-10-08 18:23:43,085][21195] Updated weights for policy 0, policy_version 65830 (0.0007) +[2023-10-08 18:23:43,451][21195] Updated weights for policy 0, policy_version 65840 (0.0011) +[2023-10-08 18:23:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 134316032. Throughput: 0: 1747.8, 1: 1726.2. Samples: 33594474. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:43,803][19739] Avg episode reward: [(0, '1017.650'), (1, '810.500')] +[2023-10-08 18:23:43,821][21195] Updated weights for policy 0, policy_version 65850 (0.0010) +[2023-10-08 18:23:44,686][21194] Updated weights for policy 1, policy_version 65350 (0.0009) +[2023-10-08 18:23:45,045][21194] Updated weights for policy 1, policy_version 65360 (0.0008) +[2023-10-08 18:23:45,410][21194] Updated weights for policy 1, policy_version 65370 (0.0010) +[2023-10-08 18:23:47,819][21195] Updated weights for policy 0, policy_version 65860 (0.0008) +[2023-10-08 18:23:48,180][21195] Updated weights for policy 0, policy_version 65870 (0.0009) +[2023-10-08 18:23:48,542][21195] Updated weights for policy 0, policy_version 65880 (0.0010) +[2023-10-08 18:23:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 134381568. Throughput: 0: 1717.3, 1: 1700.0. Samples: 33608498. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:48,803][19739] Avg episode reward: [(0, '1017.650'), (1, '810.500')] +[2023-10-08 18:23:49,346][21194] Updated weights for policy 1, policy_version 65380 (0.0010) +[2023-10-08 18:23:49,706][21194] Updated weights for policy 1, policy_version 65390 (0.0009) +[2023-10-08 18:23:50,073][21194] Updated weights for policy 1, policy_version 65400 (0.0008) +[2023-10-08 18:23:52,642][21195] Updated weights for policy 0, policy_version 65890 (0.0010) +[2023-10-08 18:23:53,012][21195] Updated weights for policy 0, policy_version 65900 (0.0010) +[2023-10-08 18:23:53,381][21195] Updated weights for policy 0, policy_version 65910 (0.0007) +[2023-10-08 18:23:53,746][21195] Updated weights for policy 0, policy_version 65920 (0.0010) +[2023-10-08 18:23:53,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 134479872. Throughput: 0: 1740.7, 1: 1714.4. Samples: 33624694. Policy #0 lag: (min: 18.0, avg: 18.5, max: 34.0) +[2023-10-08 18:23:53,803][19739] Avg episode reward: [(0, '1017.650'), (1, '810.500')] +[2023-10-08 18:23:54,073][21194] Updated weights for policy 1, policy_version 65410 (0.0008) +[2023-10-08 18:23:54,434][21194] Updated weights for policy 1, policy_version 65420 (0.0011) +[2023-10-08 18:23:54,801][21194] Updated weights for policy 1, policy_version 65430 (0.0007) +[2023-10-08 18:23:55,158][21194] Updated weights for policy 1, policy_version 65440 (0.0007) +[2023-10-08 18:23:57,756][21195] Updated weights for policy 0, policy_version 65930 (0.0008) +[2023-10-08 18:23:58,129][21195] Updated weights for policy 0, policy_version 65940 (0.0008) +[2023-10-08 18:23:58,497][21195] Updated weights for policy 0, policy_version 65950 (0.0009) +[2023-10-08 18:23:58,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 134545408. Throughput: 0: 1726.3, 1: 1730.0. Samples: 33645440. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:23:58,804][19739] Avg episode reward: [(0, '1017.650'), (1, '825.280')] +[2023-10-08 18:23:59,169][21194] Updated weights for policy 1, policy_version 65450 (0.0009) +[2023-10-08 18:23:59,541][21194] Updated weights for policy 1, policy_version 65460 (0.0007) +[2023-10-08 18:23:59,899][21194] Updated weights for policy 1, policy_version 65470 (0.0008) +[2023-10-08 18:24:02,493][21195] Updated weights for policy 0, policy_version 65960 (0.0010) +[2023-10-08 18:24:02,864][21195] Updated weights for policy 0, policy_version 65970 (0.0010) +[2023-10-08 18:24:03,223][21195] Updated weights for policy 0, policy_version 65980 (0.0010) +[2023-10-08 18:24:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 134610944. Throughput: 0: 1710.3, 1: 1698.8. Samples: 33659856. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:03,803][19739] Avg episode reward: [(0, '1017.650'), (1, '825.280')] +[2023-10-08 18:24:03,899][21194] Updated weights for policy 1, policy_version 65480 (0.0007) +[2023-10-08 18:24:04,269][21194] Updated weights for policy 1, policy_version 65490 (0.0008) +[2023-10-08 18:24:04,635][21194] Updated weights for policy 1, policy_version 65500 (0.0009) +[2023-10-08 18:24:07,093][21195] Updated weights for policy 0, policy_version 65990 (0.0009) +[2023-10-08 18:24:07,456][21195] Updated weights for policy 0, policy_version 66000 (0.0009) +[2023-10-08 18:24:07,824][21195] Updated weights for policy 0, policy_version 66010 (0.0008) +[2023-10-08 18:24:08,479][21194] Updated weights for policy 1, policy_version 65510 (0.0007) +[2023-10-08 18:24:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 134676480. Throughput: 0: 1741.5, 1: 1732.9. Samples: 33677044. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:08,803][19739] Avg episode reward: [(0, '1017.650'), (1, '840.770')] +[2023-10-08 18:24:08,847][21194] Updated weights for policy 1, policy_version 65520 (0.0009) +[2023-10-08 18:24:09,208][21194] Updated weights for policy 1, policy_version 65530 (0.0011) +[2023-10-08 18:24:11,772][21195] Updated weights for policy 0, policy_version 66020 (0.0008) +[2023-10-08 18:24:12,161][21195] Updated weights for policy 0, policy_version 66030 (0.0008) +[2023-10-08 18:24:12,523][21195] Updated weights for policy 0, policy_version 66040 (0.0007) +[2023-10-08 18:24:13,216][21194] Updated weights for policy 1, policy_version 65540 (0.0009) +[2023-10-08 18:24:13,603][21194] Updated weights for policy 1, policy_version 65550 (0.0009) +[2023-10-08 18:24:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 134742016. Throughput: 0: 1706.3, 1: 1732.8. Samples: 33696932. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:13,803][19739] Avg episode reward: [(0, '1017.650'), (1, '840.770')] +[2023-10-08 18:24:13,973][21194] Updated weights for policy 1, policy_version 65560 (0.0009) +[2023-10-08 18:24:16,393][21195] Updated weights for policy 0, policy_version 66050 (0.0008) +[2023-10-08 18:24:16,766][21195] Updated weights for policy 0, policy_version 66060 (0.0009) +[2023-10-08 18:24:17,143][21195] Updated weights for policy 0, policy_version 66070 (0.0010) +[2023-10-08 18:24:17,509][21195] Updated weights for policy 0, policy_version 66080 (0.0009) +[2023-10-08 18:24:17,885][21194] Updated weights for policy 1, policy_version 65570 (0.0009) +[2023-10-08 18:24:18,254][21194] Updated weights for policy 1, policy_version 65580 (0.0010) +[2023-10-08 18:24:18,613][21194] Updated weights for policy 1, policy_version 65590 (0.0007) +[2023-10-08 18:24:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 134807552. Throughput: 0: 1709.9, 1: 1718.4. Samples: 33712042. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:18,803][19739] Avg episode reward: [(0, '1032.760'), (1, '840.770')] +[2023-10-08 18:24:18,804][20740] Saving new best policy, reward=1032.760! +[2023-10-08 18:24:18,981][21194] Updated weights for policy 1, policy_version 65600 (0.0010) +[2023-10-08 18:24:21,533][21195] Updated weights for policy 0, policy_version 66090 (0.0007) +[2023-10-08 18:24:21,903][21195] Updated weights for policy 0, policy_version 66100 (0.0009) +[2023-10-08 18:24:22,277][21195] Updated weights for policy 0, policy_version 66110 (0.0007) +[2023-10-08 18:24:22,923][21194] Updated weights for policy 1, policy_version 65610 (0.0008) +[2023-10-08 18:24:23,294][21194] Updated weights for policy 1, policy_version 65620 (0.0011) +[2023-10-08 18:24:23,655][21194] Updated weights for policy 1, policy_version 65630 (0.0011) +[2023-10-08 18:24:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 134905856. Throughput: 0: 1715.3, 1: 1731.2. Samples: 33728234. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:23,804][19739] Avg episode reward: [(0, '1032.760'), (1, '840.770')] +[2023-10-08 18:24:26,055][21195] Updated weights for policy 0, policy_version 66120 (0.0010) +[2023-10-08 18:24:26,423][21195] Updated weights for policy 0, policy_version 66130 (0.0011) +[2023-10-08 18:24:26,797][21195] Updated weights for policy 0, policy_version 66140 (0.0011) +[2023-10-08 18:24:27,562][21194] Updated weights for policy 1, policy_version 65640 (0.0008) +[2023-10-08 18:24:27,936][21194] Updated weights for policy 1, policy_version 65650 (0.0008) +[2023-10-08 18:24:28,297][21194] Updated weights for policy 1, policy_version 65660 (0.0010) +[2023-10-08 18:24:28,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 134971392. Throughput: 0: 1698.8, 1: 1719.3. Samples: 33748286. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:28,803][19739] Avg episode reward: [(0, '1032.760'), (1, '840.770')] +[2023-10-08 18:24:30,741][21195] Updated weights for policy 0, policy_version 66150 (0.0009) +[2023-10-08 18:24:31,110][21195] Updated weights for policy 0, policy_version 66160 (0.0009) +[2023-10-08 18:24:31,478][21195] Updated weights for policy 0, policy_version 66170 (0.0009) +[2023-10-08 18:24:32,251][21194] Updated weights for policy 1, policy_version 65670 (0.0010) +[2023-10-08 18:24:32,613][21194] Updated weights for policy 1, policy_version 65680 (0.0010) +[2023-10-08 18:24:32,976][21194] Updated weights for policy 1, policy_version 65690 (0.0010) +[2023-10-08 18:24:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 135036928. Throughput: 0: 1731.3, 1: 1735.5. Samples: 33764504. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:33,804][19739] Avg episode reward: [(0, '1032.760'), (1, '840.770')] +[2023-10-08 18:24:35,453][21195] Updated weights for policy 0, policy_version 66180 (0.0009) +[2023-10-08 18:24:35,807][21195] Updated weights for policy 0, policy_version 66190 (0.0007) +[2023-10-08 18:24:36,182][21195] Updated weights for policy 0, policy_version 66200 (0.0007) +[2023-10-08 18:24:36,940][21194] Updated weights for policy 1, policy_version 65700 (0.0010) +[2023-10-08 18:24:37,315][21194] Updated weights for policy 1, policy_version 65710 (0.0010) +[2023-10-08 18:24:37,679][21194] Updated weights for policy 1, policy_version 65720 (0.0011) +[2023-10-08 18:24:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 135102464. Throughput: 0: 1707.7, 1: 1735.6. Samples: 33779646. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:24:38,803][19739] Avg episode reward: [(0, '1033.010'), (1, '840.770')] +[2023-10-08 18:24:38,804][20740] Saving new best policy, reward=1033.010! +[2023-10-08 18:24:39,990][21195] Updated weights for policy 0, policy_version 66210 (0.0008) +[2023-10-08 18:24:40,362][21195] Updated weights for policy 0, policy_version 66220 (0.0008) +[2023-10-08 18:24:40,725][21195] Updated weights for policy 0, policy_version 66230 (0.0008) +[2023-10-08 18:24:41,093][21195] Updated weights for policy 0, policy_version 66240 (0.0009) +[2023-10-08 18:24:41,608][21194] Updated weights for policy 1, policy_version 65730 (0.0009) +[2023-10-08 18:24:41,974][21194] Updated weights for policy 1, policy_version 65740 (0.0007) +[2023-10-08 18:24:42,343][21194] Updated weights for policy 1, policy_version 65750 (0.0007) +[2023-10-08 18:24:42,708][21194] Updated weights for policy 1, policy_version 65760 (0.0008) +[2023-10-08 18:24:43,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 135168000. Throughput: 0: 1727.8, 1: 1715.0. Samples: 33800366. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:24:43,803][19739] Avg episode reward: [(0, '1033.010'), (1, '840.770')] +[2023-10-08 18:24:44,897][21195] Updated weights for policy 0, policy_version 66250 (0.0007) +[2023-10-08 18:24:45,259][21195] Updated weights for policy 0, policy_version 66260 (0.0008) +[2023-10-08 18:24:45,623][21195] Updated weights for policy 0, policy_version 66270 (0.0007) +[2023-10-08 18:24:46,605][21194] Updated weights for policy 1, policy_version 65770 (0.0008) +[2023-10-08 18:24:46,964][21194] Updated weights for policy 1, policy_version 65780 (0.0009) +[2023-10-08 18:24:47,325][21194] Updated weights for policy 1, policy_version 65790 (0.0008) +[2023-10-08 18:24:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 135233536. Throughput: 0: 1749.5, 1: 1744.3. Samples: 33817078. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:24:48,803][19739] Avg episode reward: [(0, '1033.010'), (1, '841.140')] +[2023-10-08 18:24:49,638][21195] Updated weights for policy 0, policy_version 66280 (0.0008) +[2023-10-08 18:24:50,008][21195] Updated weights for policy 0, policy_version 66290 (0.0007) +[2023-10-08 18:24:50,377][21195] Updated weights for policy 0, policy_version 66300 (0.0010) +[2023-10-08 18:24:51,464][21194] Updated weights for policy 1, policy_version 65800 (0.0007) +[2023-10-08 18:24:51,832][21194] Updated weights for policy 1, policy_version 65810 (0.0010) +[2023-10-08 18:24:52,211][21194] Updated weights for policy 1, policy_version 65820 (0.0010) +[2023-10-08 18:24:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 135299072. Throughput: 0: 1713.7, 1: 1712.9. Samples: 33831242. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:24:53,803][19739] Avg episode reward: [(0, '1033.010'), (1, '841.140')] +[2023-10-08 18:24:54,266][21195] Updated weights for policy 0, policy_version 66310 (0.0009) +[2023-10-08 18:24:54,637][21195] Updated weights for policy 0, policy_version 66320 (0.0007) +[2023-10-08 18:24:55,013][21195] Updated weights for policy 0, policy_version 66330 (0.0010) +[2023-10-08 18:24:56,174][21194] Updated weights for policy 1, policy_version 65830 (0.0008) +[2023-10-08 18:24:56,541][21194] Updated weights for policy 1, policy_version 65840 (0.0009) +[2023-10-08 18:24:56,904][21194] Updated weights for policy 1, policy_version 65850 (0.0007) +[2023-10-08 18:24:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 135364608. Throughput: 0: 1750.6, 1: 1701.5. Samples: 33852274. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:24:58,803][19739] Avg episode reward: [(0, '1033.010'), (1, '841.140')] +[2023-10-08 18:24:58,997][21195] Updated weights for policy 0, policy_version 66340 (0.0011) +[2023-10-08 18:24:59,390][21195] Updated weights for policy 0, policy_version 66350 (0.0009) +[2023-10-08 18:24:59,758][21195] Updated weights for policy 0, policy_version 66360 (0.0009) +[2023-10-08 18:25:00,813][21194] Updated weights for policy 1, policy_version 65860 (0.0008) +[2023-10-08 18:25:01,193][21194] Updated weights for policy 1, policy_version 65870 (0.0010) +[2023-10-08 18:25:01,561][21194] Updated weights for policy 1, policy_version 65880 (0.0011) +[2023-10-08 18:25:03,368][21195] Updated weights for policy 0, policy_version 66370 (0.0009) +[2023-10-08 18:25:03,736][21195] Updated weights for policy 0, policy_version 66380 (0.0009) +[2023-10-08 18:25:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 135430144. Throughput: 0: 1743.2, 1: 1723.1. Samples: 33868028. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:25:03,804][19739] Avg episode reward: [(0, '1031.420'), (1, '841.140')] +[2023-10-08 18:25:04,111][21195] Updated weights for policy 0, policy_version 66390 (0.0010) +[2023-10-08 18:25:04,467][21195] Updated weights for policy 0, policy_version 66400 (0.0010) +[2023-10-08 18:25:05,351][21194] Updated weights for policy 1, policy_version 65890 (0.0011) +[2023-10-08 18:25:05,715][21194] Updated weights for policy 1, policy_version 65900 (0.0008) +[2023-10-08 18:25:06,083][21194] Updated weights for policy 1, policy_version 65910 (0.0009) +[2023-10-08 18:25:06,455][21194] Updated weights for policy 1, policy_version 65920 (0.0010) +[2023-10-08 18:25:08,271][21195] Updated weights for policy 0, policy_version 66410 (0.0008) +[2023-10-08 18:25:08,630][21195] Updated weights for policy 0, policy_version 66420 (0.0008) +[2023-10-08 18:25:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 135495680. Throughput: 0: 1744.8, 1: 1702.0. Samples: 33883344. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:25:08,803][19739] Avg episode reward: [(0, '1031.420'), (1, '841.140')] +[2023-10-08 18:25:09,007][21195] Updated weights for policy 0, policy_version 66430 (0.0008) +[2023-10-08 18:25:10,584][21194] Updated weights for policy 1, policy_version 65930 (0.0008) +[2023-10-08 18:25:10,949][21194] Updated weights for policy 1, policy_version 65940 (0.0008) +[2023-10-08 18:25:11,312][21194] Updated weights for policy 1, policy_version 65950 (0.0007) +[2023-10-08 18:25:12,889][21195] Updated weights for policy 0, policy_version 66440 (0.0008) +[2023-10-08 18:25:13,259][21195] Updated weights for policy 0, policy_version 66450 (0.0009) +[2023-10-08 18:25:13,622][21195] Updated weights for policy 0, policy_version 66460 (0.0008) +[2023-10-08 18:25:13,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 135593984. Throughput: 0: 1757.1, 1: 1712.9. Samples: 33904436. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:25:13,803][19739] Avg episode reward: [(0, '1001.930'), (1, '841.140')] +[2023-10-08 18:25:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000065952_67534848.pth... +[2023-10-08 18:25:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000066464_68059136.pth... +[2023-10-08 18:25:13,842][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000064352_65896448.pth +[2023-10-08 18:25:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000064832_66387968.pth +[2023-10-08 18:25:15,300][21194] Updated weights for policy 1, policy_version 65960 (0.0010) +[2023-10-08 18:25:15,664][21194] Updated weights for policy 1, policy_version 65970 (0.0012) +[2023-10-08 18:25:16,039][21194] Updated weights for policy 1, policy_version 65980 (0.0010) +[2023-10-08 18:25:17,551][21195] Updated weights for policy 0, policy_version 66470 (0.0008) +[2023-10-08 18:25:17,929][21195] Updated weights for policy 0, policy_version 66480 (0.0008) +[2023-10-08 18:25:18,295][21195] Updated weights for policy 0, policy_version 66490 (0.0010) +[2023-10-08 18:25:18,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 135659520. Throughput: 0: 1731.5, 1: 1702.8. Samples: 33919046. Policy #0 lag: (min: 12.0, avg: 12.8, max: 31.0) +[2023-10-08 18:25:18,803][19739] Avg episode reward: [(0, '1003.350'), (1, '856.130')] +[2023-10-08 18:25:20,056][21194] Updated weights for policy 1, policy_version 65990 (0.0011) +[2023-10-08 18:25:20,407][21194] Updated weights for policy 1, policy_version 66000 (0.0009) +[2023-10-08 18:25:20,775][21194] Updated weights for policy 1, policy_version 66010 (0.0011) +[2023-10-08 18:25:22,233][21195] Updated weights for policy 0, policy_version 66500 (0.0007) +[2023-10-08 18:25:22,599][21195] Updated weights for policy 0, policy_version 66510 (0.0007) +[2023-10-08 18:25:22,961][21195] Updated weights for policy 0, policy_version 66520 (0.0007) +[2023-10-08 18:25:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 135725056. Throughput: 0: 1763.2, 1: 1696.3. Samples: 33935320. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:23,803][19739] Avg episode reward: [(0, '1003.350'), (1, '856.130')] +[2023-10-08 18:25:24,866][21194] Updated weights for policy 1, policy_version 66020 (0.0010) +[2023-10-08 18:25:25,224][21194] Updated weights for policy 1, policy_version 66030 (0.0009) +[2023-10-08 18:25:25,585][21194] Updated weights for policy 1, policy_version 66040 (0.0009) +[2023-10-08 18:25:26,896][21195] Updated weights for policy 0, policy_version 66530 (0.0007) +[2023-10-08 18:25:27,259][21195] Updated weights for policy 0, policy_version 66540 (0.0008) +[2023-10-08 18:25:27,623][21195] Updated weights for policy 0, policy_version 66550 (0.0008) +[2023-10-08 18:25:27,979][21195] Updated weights for policy 0, policy_version 66560 (0.0008) +[2023-10-08 18:25:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 135790592. Throughput: 0: 1732.0, 1: 1717.7. Samples: 33955602. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:28,803][19739] Avg episode reward: [(0, '1003.260'), (1, '856.130')] +[2023-10-08 18:25:29,614][21194] Updated weights for policy 1, policy_version 66050 (0.0010) +[2023-10-08 18:25:29,977][21194] Updated weights for policy 1, policy_version 66060 (0.0009) +[2023-10-08 18:25:30,338][21194] Updated weights for policy 1, policy_version 66070 (0.0008) +[2023-10-08 18:25:30,709][21194] Updated weights for policy 1, policy_version 66080 (0.0010) +[2023-10-08 18:25:31,873][21195] Updated weights for policy 0, policy_version 66570 (0.0009) +[2023-10-08 18:25:32,246][21195] Updated weights for policy 0, policy_version 66580 (0.0011) +[2023-10-08 18:25:32,621][21195] Updated weights for policy 0, policy_version 66590 (0.0009) +[2023-10-08 18:25:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 135856128. Throughput: 0: 1729.8, 1: 1687.4. Samples: 33970852. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:33,804][19739] Avg episode reward: [(0, '987.400'), (1, '856.130')] +[2023-10-08 18:25:34,756][21194] Updated weights for policy 1, policy_version 66090 (0.0008) +[2023-10-08 18:25:35,116][21194] Updated weights for policy 1, policy_version 66100 (0.0007) +[2023-10-08 18:25:35,482][21194] Updated weights for policy 1, policy_version 66110 (0.0008) +[2023-10-08 18:25:36,494][21195] Updated weights for policy 0, policy_version 66600 (0.0007) +[2023-10-08 18:25:36,864][21195] Updated weights for policy 0, policy_version 66610 (0.0008) +[2023-10-08 18:25:37,222][21195] Updated weights for policy 0, policy_version 66620 (0.0009) +[2023-10-08 18:25:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 135921664. Throughput: 0: 1749.6, 1: 1716.7. Samples: 33987224. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:38,803][19739] Avg episode reward: [(0, '986.580'), (1, '856.130')] +[2023-10-08 18:25:39,326][21194] Updated weights for policy 1, policy_version 66120 (0.0009) +[2023-10-08 18:25:39,686][21194] Updated weights for policy 1, policy_version 66130 (0.0007) +[2023-10-08 18:25:40,045][21194] Updated weights for policy 1, policy_version 66140 (0.0008) +[2023-10-08 18:25:41,160][21195] Updated weights for policy 0, policy_version 66630 (0.0009) +[2023-10-08 18:25:41,522][21195] Updated weights for policy 0, policy_version 66640 (0.0009) +[2023-10-08 18:25:41,899][21195] Updated weights for policy 0, policy_version 66650 (0.0007) +[2023-10-08 18:25:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 135987200. Throughput: 0: 1727.9, 1: 1732.4. Samples: 34007988. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:43,803][19739] Avg episode reward: [(0, '986.280'), (1, '856.130')] +[2023-10-08 18:25:43,849][21194] Updated weights for policy 1, policy_version 66150 (0.0009) +[2023-10-08 18:25:44,223][21194] Updated weights for policy 1, policy_version 66160 (0.0009) +[2023-10-08 18:25:44,603][21194] Updated weights for policy 1, policy_version 66170 (0.0011) +[2023-10-08 18:25:45,865][21195] Updated weights for policy 0, policy_version 66660 (0.0008) +[2023-10-08 18:25:46,256][21195] Updated weights for policy 0, policy_version 66670 (0.0011) +[2023-10-08 18:25:46,625][21195] Updated weights for policy 0, policy_version 66680 (0.0008) +[2023-10-08 18:25:48,615][21194] Updated weights for policy 1, policy_version 66180 (0.0009) +[2023-10-08 18:25:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 136052736. Throughput: 0: 1740.1, 1: 1709.1. Samples: 34023240. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:48,803][19739] Avg episode reward: [(0, '986.280'), (1, '851.810')] +[2023-10-08 18:25:48,995][21194] Updated weights for policy 1, policy_version 66190 (0.0009) +[2023-10-08 18:25:49,369][21194] Updated weights for policy 1, policy_version 66200 (0.0008) +[2023-10-08 18:25:50,491][21195] Updated weights for policy 0, policy_version 66690 (0.0008) +[2023-10-08 18:25:50,853][21195] Updated weights for policy 0, policy_version 66700 (0.0009) +[2023-10-08 18:25:51,220][21195] Updated weights for policy 0, policy_version 66710 (0.0007) +[2023-10-08 18:25:51,592][21195] Updated weights for policy 0, policy_version 66720 (0.0007) +[2023-10-08 18:25:53,322][21194] Updated weights for policy 1, policy_version 66210 (0.0007) +[2023-10-08 18:25:53,683][21194] Updated weights for policy 1, policy_version 66220 (0.0010) +[2023-10-08 18:25:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 136118272. Throughput: 0: 1726.0, 1: 1721.9. Samples: 34038500. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:53,803][19739] Avg episode reward: [(0, '986.280'), (1, '852.700')] +[2023-10-08 18:25:54,042][21194] Updated weights for policy 1, policy_version 66230 (0.0009) +[2023-10-08 18:25:54,411][21194] Updated weights for policy 1, policy_version 66240 (0.0009) +[2023-10-08 18:25:55,484][21195] Updated weights for policy 0, policy_version 66730 (0.0010) +[2023-10-08 18:25:55,850][21195] Updated weights for policy 0, policy_version 66740 (0.0009) +[2023-10-08 18:25:56,226][21195] Updated weights for policy 0, policy_version 66750 (0.0010) +[2023-10-08 18:25:58,177][21194] Updated weights for policy 1, policy_version 66250 (0.0011) +[2023-10-08 18:25:58,541][21194] Updated weights for policy 1, policy_version 66260 (0.0007) +[2023-10-08 18:25:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 136183808. Throughput: 0: 1733.2, 1: 1725.1. Samples: 34060062. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:25:58,803][19739] Avg episode reward: [(0, '986.120'), (1, '852.700')] +[2023-10-08 18:25:58,903][21194] Updated weights for policy 1, policy_version 66270 (0.0010) +[2023-10-08 18:26:00,095][21195] Updated weights for policy 0, policy_version 66760 (0.0009) +[2023-10-08 18:26:00,460][21195] Updated weights for policy 0, policy_version 66770 (0.0008) +[2023-10-08 18:26:00,825][21195] Updated weights for policy 0, policy_version 66780 (0.0007) +[2023-10-08 18:26:02,766][21194] Updated weights for policy 1, policy_version 66280 (0.0010) +[2023-10-08 18:26:03,124][21194] Updated weights for policy 1, policy_version 66290 (0.0010) +[2023-10-08 18:26:03,496][21194] Updated weights for policy 1, policy_version 66300 (0.0010) +[2023-10-08 18:26:03,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 136282112. Throughput: 0: 1762.7, 1: 1726.8. Samples: 34076072. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 18:26:03,803][19739] Avg episode reward: [(0, '986.840'), (1, '852.700')] +[2023-10-08 18:26:04,649][21195] Updated weights for policy 0, policy_version 66790 (0.0009) +[2023-10-08 18:26:05,010][21195] Updated weights for policy 0, policy_version 66800 (0.0008) +[2023-10-08 18:26:05,384][21195] Updated weights for policy 0, policy_version 66810 (0.0009) +[2023-10-08 18:26:07,463][21194] Updated weights for policy 1, policy_version 66310 (0.0009) +[2023-10-08 18:26:07,833][21194] Updated weights for policy 1, policy_version 66320 (0.0009) +[2023-10-08 18:26:08,196][21194] Updated weights for policy 1, policy_version 66330 (0.0011) +[2023-10-08 18:26:08,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 136347648. Throughput: 0: 1733.4, 1: 1737.6. Samples: 34091514. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:08,803][19739] Avg episode reward: [(0, '986.840'), (1, '852.700')] +[2023-10-08 18:26:09,344][21195] Updated weights for policy 0, policy_version 66820 (0.0008) +[2023-10-08 18:26:09,700][21195] Updated weights for policy 0, policy_version 66830 (0.0008) +[2023-10-08 18:26:10,071][21195] Updated weights for policy 0, policy_version 66840 (0.0008) +[2023-10-08 18:26:12,410][21194] Updated weights for policy 1, policy_version 66340 (0.0010) +[2023-10-08 18:26:12,779][21194] Updated weights for policy 1, policy_version 66350 (0.0010) +[2023-10-08 18:26:13,140][21194] Updated weights for policy 1, policy_version 66360 (0.0010) +[2023-10-08 18:26:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 136413184. Throughput: 0: 1757.7, 1: 1719.6. Samples: 34112078. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:13,803][19739] Avg episode reward: [(0, '986.840'), (1, '868.130')] +[2023-10-08 18:26:13,876][21195] Updated weights for policy 0, policy_version 66850 (0.0010) +[2023-10-08 18:26:14,239][21195] Updated weights for policy 0, policy_version 66860 (0.0010) +[2023-10-08 18:26:14,605][21195] Updated weights for policy 0, policy_version 66870 (0.0008) +[2023-10-08 18:26:14,971][21195] Updated weights for policy 0, policy_version 66880 (0.0010) +[2023-10-08 18:26:17,107][21194] Updated weights for policy 1, policy_version 66370 (0.0010) +[2023-10-08 18:26:17,473][21194] Updated weights for policy 1, policy_version 66380 (0.0008) +[2023-10-08 18:26:17,842][21194] Updated weights for policy 1, policy_version 66390 (0.0008) +[2023-10-08 18:26:18,212][21194] Updated weights for policy 1, policy_version 66400 (0.0008) +[2023-10-08 18:26:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 136478720. Throughput: 0: 1751.5, 1: 1740.5. Samples: 34127992. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:18,803][19739] Avg episode reward: [(0, '986.840'), (1, '868.130')] +[2023-10-08 18:26:18,831][21195] Updated weights for policy 0, policy_version 66890 (0.0009) +[2023-10-08 18:26:19,196][21195] Updated weights for policy 0, policy_version 66900 (0.0007) +[2023-10-08 18:26:19,564][21195] Updated weights for policy 0, policy_version 66910 (0.0008) +[2023-10-08 18:26:22,240][21194] Updated weights for policy 1, policy_version 66410 (0.0008) +[2023-10-08 18:26:22,597][21194] Updated weights for policy 1, policy_version 66420 (0.0008) +[2023-10-08 18:26:22,969][21194] Updated weights for policy 1, policy_version 66430 (0.0008) +[2023-10-08 18:26:23,492][21195] Updated weights for policy 0, policy_version 66920 (0.0008) +[2023-10-08 18:26:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 136544256. Throughput: 0: 1738.5, 1: 1729.9. Samples: 34143304. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:23,804][19739] Avg episode reward: [(0, '986.840'), (1, '868.130')] +[2023-10-08 18:26:23,867][21195] Updated weights for policy 0, policy_version 66930 (0.0007) +[2023-10-08 18:26:24,231][21195] Updated weights for policy 0, policy_version 66940 (0.0008) +[2023-10-08 18:26:26,842][21194] Updated weights for policy 1, policy_version 66440 (0.0007) +[2023-10-08 18:26:27,215][21194] Updated weights for policy 1, policy_version 66450 (0.0007) +[2023-10-08 18:26:27,579][21194] Updated weights for policy 1, policy_version 66460 (0.0008) +[2023-10-08 18:26:28,197][21195] Updated weights for policy 0, policy_version 66950 (0.0009) +[2023-10-08 18:26:28,567][21195] Updated weights for policy 0, policy_version 66960 (0.0009) +[2023-10-08 18:26:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 136609792. Throughput: 0: 1761.7, 1: 1701.6. Samples: 34163836. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:28,803][19739] Avg episode reward: [(0, '986.840'), (1, '868.130')] +[2023-10-08 18:26:28,941][21195] Updated weights for policy 0, policy_version 66970 (0.0008) +[2023-10-08 18:26:31,534][21194] Updated weights for policy 1, policy_version 66470 (0.0008) +[2023-10-08 18:26:31,908][21194] Updated weights for policy 1, policy_version 66480 (0.0007) +[2023-10-08 18:26:32,278][21194] Updated weights for policy 1, policy_version 66490 (0.0007) +[2023-10-08 18:26:32,925][21195] Updated weights for policy 0, policy_version 66980 (0.0008) +[2023-10-08 18:26:33,317][21195] Updated weights for policy 0, policy_version 66990 (0.0007) +[2023-10-08 18:26:33,682][21195] Updated weights for policy 0, policy_version 67000 (0.0009) +[2023-10-08 18:26:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 136675328. Throughput: 0: 1733.0, 1: 1735.6. Samples: 34179328. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:33,803][19739] Avg episode reward: [(0, '1000.930'), (1, '868.130')] +[2023-10-08 18:26:36,182][21194] Updated weights for policy 1, policy_version 66500 (0.0009) +[2023-10-08 18:26:36,575][21194] Updated weights for policy 1, policy_version 66510 (0.0009) +[2023-10-08 18:26:36,938][21194] Updated weights for policy 1, policy_version 66520 (0.0008) +[2023-10-08 18:26:37,566][21195] Updated weights for policy 0, policy_version 67010 (0.0009) +[2023-10-08 18:26:37,924][21195] Updated weights for policy 0, policy_version 67020 (0.0010) +[2023-10-08 18:26:38,299][21195] Updated weights for policy 0, policy_version 67030 (0.0010) +[2023-10-08 18:26:38,655][21195] Updated weights for policy 0, policy_version 67040 (0.0010) +[2023-10-08 18:26:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 136773632. Throughput: 0: 1755.9, 1: 1712.8. Samples: 34194594. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:38,803][19739] Avg episode reward: [(0, '1000.930'), (1, '868.130')] +[2023-10-08 18:26:40,904][21194] Updated weights for policy 1, policy_version 66530 (0.0008) +[2023-10-08 18:26:41,271][21194] Updated weights for policy 1, policy_version 66540 (0.0010) +[2023-10-08 18:26:41,632][21194] Updated weights for policy 1, policy_version 66550 (0.0008) +[2023-10-08 18:26:41,994][21194] Updated weights for policy 1, policy_version 66560 (0.0008) +[2023-10-08 18:26:42,575][21195] Updated weights for policy 0, policy_version 67050 (0.0008) +[2023-10-08 18:26:42,953][21195] Updated weights for policy 0, policy_version 67060 (0.0009) +[2023-10-08 18:26:43,324][21195] Updated weights for policy 0, policy_version 67070 (0.0008) +[2023-10-08 18:26:43,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 136839168. Throughput: 0: 1735.3, 1: 1706.2. Samples: 34214930. Policy #0 lag: (min: 31.0, avg: 31.1, max: 37.0) +[2023-10-08 18:26:43,803][19739] Avg episode reward: [(0, '1000.200'), (1, '868.130')] +[2023-10-08 18:26:46,140][21194] Updated weights for policy 1, policy_version 66570 (0.0008) +[2023-10-08 18:26:46,508][21194] Updated weights for policy 1, policy_version 66580 (0.0008) +[2023-10-08 18:26:46,880][21194] Updated weights for policy 1, policy_version 66590 (0.0010) +[2023-10-08 18:26:47,324][21195] Updated weights for policy 0, policy_version 67080 (0.0009) +[2023-10-08 18:26:47,702][21195] Updated weights for policy 0, policy_version 67090 (0.0010) +[2023-10-08 18:26:48,081][21195] Updated weights for policy 0, policy_version 67100 (0.0010) +[2023-10-08 18:26:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 136904704. Throughput: 0: 1715.6, 1: 1717.6. Samples: 34230566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:26:48,803][19739] Avg episode reward: [(0, '1000.200'), (1, '868.130')] +[2023-10-08 18:26:50,769][21194] Updated weights for policy 1, policy_version 66600 (0.0008) +[2023-10-08 18:26:51,139][21194] Updated weights for policy 1, policy_version 66610 (0.0007) +[2023-10-08 18:26:51,506][21194] Updated weights for policy 1, policy_version 66620 (0.0008) +[2023-10-08 18:26:51,904][21195] Updated weights for policy 0, policy_version 67110 (0.0011) +[2023-10-08 18:26:52,279][21195] Updated weights for policy 0, policy_version 67120 (0.0008) +[2023-10-08 18:26:52,648][21195] Updated weights for policy 0, policy_version 67130 (0.0007) +[2023-10-08 18:26:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 136970240. Throughput: 0: 1743.9, 1: 1697.1. Samples: 34246358. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:26:53,803][19739] Avg episode reward: [(0, '1000.200'), (1, '868.130')] +[2023-10-08 18:26:55,275][21194] Updated weights for policy 1, policy_version 66630 (0.0008) +[2023-10-08 18:26:55,635][21194] Updated weights for policy 1, policy_version 66640 (0.0008) +[2023-10-08 18:26:56,004][21194] Updated weights for policy 1, policy_version 66650 (0.0007) +[2023-10-08 18:26:56,560][21195] Updated weights for policy 0, policy_version 67140 (0.0009) +[2023-10-08 18:26:56,925][21195] Updated weights for policy 0, policy_version 67150 (0.0008) +[2023-10-08 18:26:57,292][21195] Updated weights for policy 0, policy_version 67160 (0.0009) +[2023-10-08 18:26:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 137035776. Throughput: 0: 1716.9, 1: 1720.0. Samples: 34266738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:26:58,803][19739] Avg episode reward: [(0, '1000.200'), (1, '871.610')] +[2023-10-08 18:27:00,111][21194] Updated weights for policy 1, policy_version 66660 (0.0009) +[2023-10-08 18:27:00,482][21194] Updated weights for policy 1, policy_version 66670 (0.0009) +[2023-10-08 18:27:00,848][21194] Updated weights for policy 1, policy_version 66680 (0.0011) +[2023-10-08 18:27:01,188][21195] Updated weights for policy 0, policy_version 67170 (0.0008) +[2023-10-08 18:27:01,550][21195] Updated weights for policy 0, policy_version 67180 (0.0008) +[2023-10-08 18:27:01,928][21195] Updated weights for policy 0, policy_version 67190 (0.0007) +[2023-10-08 18:27:02,293][21195] Updated weights for policy 0, policy_version 67200 (0.0008) +[2023-10-08 18:27:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 137101312. Throughput: 0: 1726.5, 1: 1703.6. Samples: 34282348. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:27:03,804][19739] Avg episode reward: [(0, '1000.200'), (1, '871.610')] +[2023-10-08 18:27:04,795][21194] Updated weights for policy 1, policy_version 66690 (0.0010) +[2023-10-08 18:27:05,160][21194] Updated weights for policy 1, policy_version 66700 (0.0009) +[2023-10-08 18:27:05,520][21194] Updated weights for policy 1, policy_version 66710 (0.0009) +[2023-10-08 18:27:05,889][21194] Updated weights for policy 1, policy_version 66720 (0.0008) +[2023-10-08 18:27:06,314][21195] Updated weights for policy 0, policy_version 67210 (0.0008) +[2023-10-08 18:27:06,682][21195] Updated weights for policy 0, policy_version 67220 (0.0008) +[2023-10-08 18:27:07,038][21195] Updated weights for policy 0, policy_version 67230 (0.0008) +[2023-10-08 18:27:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 137166848. Throughput: 0: 1728.6, 1: 1709.0. Samples: 34297994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:27:08,803][19739] Avg episode reward: [(0, '1000.200'), (1, '871.610')] +[2023-10-08 18:27:09,674][21194] Updated weights for policy 1, policy_version 66730 (0.0008) +[2023-10-08 18:27:10,045][21194] Updated weights for policy 1, policy_version 66740 (0.0009) +[2023-10-08 18:27:10,412][21194] Updated weights for policy 1, policy_version 66750 (0.0010) +[2023-10-08 18:27:11,084][21195] Updated weights for policy 0, policy_version 67240 (0.0010) +[2023-10-08 18:27:11,453][21195] Updated weights for policy 0, policy_version 67250 (0.0009) +[2023-10-08 18:27:11,814][21195] Updated weights for policy 0, policy_version 67260 (0.0007) +[2023-10-08 18:27:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137232384. Throughput: 0: 1714.9, 1: 1735.3. Samples: 34319096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:27:13,803][19739] Avg episode reward: [(0, '1000.200'), (1, '887.240')] +[2023-10-08 18:27:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000066752_68354048.pth... +[2023-10-08 18:27:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000067264_68878336.pth... +[2023-10-08 18:27:13,843][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000065152_66715648.pth +[2023-10-08 18:27:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000065632_67207168.pth +[2023-10-08 18:27:14,313][21194] Updated weights for policy 1, policy_version 66760 (0.0009) +[2023-10-08 18:27:14,683][21194] Updated weights for policy 1, policy_version 66770 (0.0009) +[2023-10-08 18:27:15,046][21194] Updated weights for policy 1, policy_version 66780 (0.0008) +[2023-10-08 18:27:15,862][21195] Updated weights for policy 0, policy_version 67270 (0.0008) +[2023-10-08 18:27:16,230][21195] Updated weights for policy 0, policy_version 67280 (0.0007) +[2023-10-08 18:27:16,600][21195] Updated weights for policy 0, policy_version 67290 (0.0008) +[2023-10-08 18:27:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137297920. Throughput: 0: 1738.9, 1: 1701.1. Samples: 34334130. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:27:18,803][19739] Avg episode reward: [(0, '1000.200'), (1, '902.630')] +[2023-10-08 18:27:19,070][21194] Updated weights for policy 1, policy_version 66790 (0.0008) +[2023-10-08 18:27:19,435][21194] Updated weights for policy 1, policy_version 66800 (0.0008) +[2023-10-08 18:27:19,798][21194] Updated weights for policy 1, policy_version 66810 (0.0009) +[2023-10-08 18:27:20,402][21195] Updated weights for policy 0, policy_version 67300 (0.0008) +[2023-10-08 18:27:20,779][21195] Updated weights for policy 0, policy_version 67310 (0.0008) +[2023-10-08 18:27:21,146][21195] Updated weights for policy 0, policy_version 67320 (0.0010) +[2023-10-08 18:27:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 137363456. Throughput: 0: 1716.7, 1: 1726.6. Samples: 34349542. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:27:23,803][19739] Avg episode reward: [(0, '1000.200'), (1, '902.630')] +[2023-10-08 18:27:23,868][21194] Updated weights for policy 1, policy_version 66820 (0.0009) +[2023-10-08 18:27:24,268][21194] Updated weights for policy 1, policy_version 66830 (0.0009) +[2023-10-08 18:27:24,634][21194] Updated weights for policy 1, policy_version 66840 (0.0007) +[2023-10-08 18:27:25,156][21195] Updated weights for policy 0, policy_version 67330 (0.0008) +[2023-10-08 18:27:25,538][21195] Updated weights for policy 0, policy_version 67340 (0.0009) +[2023-10-08 18:27:25,912][21195] Updated weights for policy 0, policy_version 67350 (0.0009) +[2023-10-08 18:27:26,285][21195] Updated weights for policy 0, policy_version 67360 (0.0008) +[2023-10-08 18:27:28,711][21194] Updated weights for policy 1, policy_version 66850 (0.0008) +[2023-10-08 18:27:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137428992. Throughput: 0: 1724.2, 1: 1730.9. Samples: 34370410. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:27:28,803][19739] Avg episode reward: [(0, '1000.200'), (1, '902.630')] +[2023-10-08 18:27:29,081][21194] Updated weights for policy 1, policy_version 66860 (0.0007) +[2023-10-08 18:27:29,447][21194] Updated weights for policy 1, policy_version 66870 (0.0007) +[2023-10-08 18:27:29,812][21194] Updated weights for policy 1, policy_version 66880 (0.0007) +[2023-10-08 18:27:30,197][21195] Updated weights for policy 0, policy_version 67370 (0.0009) +[2023-10-08 18:27:30,565][21195] Updated weights for policy 0, policy_version 67380 (0.0007) +[2023-10-08 18:27:30,928][21195] Updated weights for policy 0, policy_version 67390 (0.0008) +[2023-10-08 18:27:33,722][21194] Updated weights for policy 1, policy_version 66890 (0.0009) +[2023-10-08 18:27:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137494528. Throughput: 0: 1738.5, 1: 1712.4. Samples: 34385856. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:27:33,804][19739] Avg episode reward: [(0, '1000.200'), (1, '917.900')] +[2023-10-08 18:27:34,087][21194] Updated weights for policy 1, policy_version 66900 (0.0007) +[2023-10-08 18:27:34,448][21194] Updated weights for policy 1, policy_version 66910 (0.0008) +[2023-10-08 18:27:34,922][21195] Updated weights for policy 0, policy_version 67400 (0.0009) +[2023-10-08 18:27:35,292][21195] Updated weights for policy 0, policy_version 67410 (0.0008) +[2023-10-08 18:27:35,657][21195] Updated weights for policy 0, policy_version 67420 (0.0009) +[2023-10-08 18:27:38,424][21194] Updated weights for policy 1, policy_version 66920 (0.0008) +[2023-10-08 18:27:38,796][21194] Updated weights for policy 1, policy_version 66930 (0.0008) +[2023-10-08 18:27:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 137560064. Throughput: 0: 1711.4, 1: 1740.8. Samples: 34401708. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:27:38,803][19739] Avg episode reward: [(0, '1000.200'), (1, '917.680')] +[2023-10-08 18:27:39,164][21194] Updated weights for policy 1, policy_version 66940 (0.0008) +[2023-10-08 18:27:39,433][21195] Updated weights for policy 0, policy_version 67430 (0.0010) +[2023-10-08 18:27:39,798][21195] Updated weights for policy 0, policy_version 67440 (0.0010) +[2023-10-08 18:27:40,163][21195] Updated weights for policy 0, policy_version 67450 (0.0009) +[2023-10-08 18:27:43,095][21194] Updated weights for policy 1, policy_version 66950 (0.0007) +[2023-10-08 18:27:43,465][21194] Updated weights for policy 1, policy_version 66960 (0.0009) +[2023-10-08 18:27:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 137625600. Throughput: 0: 1738.6, 1: 1732.5. Samples: 34422940. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:27:43,803][19739] Avg episode reward: [(0, '1000.280'), (1, '898.150')] +[2023-10-08 18:27:43,832][21194] Updated weights for policy 1, policy_version 66970 (0.0010) +[2023-10-08 18:27:44,137][21195] Updated weights for policy 0, policy_version 67460 (0.0009) +[2023-10-08 18:27:44,508][21195] Updated weights for policy 0, policy_version 67470 (0.0007) +[2023-10-08 18:27:44,875][21195] Updated weights for policy 0, policy_version 67480 (0.0007) +[2023-10-08 18:27:47,770][21194] Updated weights for policy 1, policy_version 66980 (0.0009) +[2023-10-08 18:27:48,126][21194] Updated weights for policy 1, policy_version 66990 (0.0008) +[2023-10-08 18:27:48,492][21194] Updated weights for policy 1, policy_version 67000 (0.0008) +[2023-10-08 18:27:48,676][21195] Updated weights for policy 0, policy_version 67490 (0.0008) +[2023-10-08 18:27:48,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137723904. Throughput: 0: 1733.0, 1: 1732.8. Samples: 34438306. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:27:48,803][19739] Avg episode reward: [(0, '1015.590'), (1, '898.550')] +[2023-10-08 18:27:49,047][21195] Updated weights for policy 0, policy_version 67500 (0.0011) +[2023-10-08 18:27:49,426][21195] Updated weights for policy 0, policy_version 67510 (0.0008) +[2023-10-08 18:27:49,796][21195] Updated weights for policy 0, policy_version 67520 (0.0008) +[2023-10-08 18:27:52,429][21194] Updated weights for policy 1, policy_version 67010 (0.0008) +[2023-10-08 18:27:52,797][21194] Updated weights for policy 1, policy_version 67020 (0.0008) +[2023-10-08 18:27:53,160][21194] Updated weights for policy 1, policy_version 67030 (0.0009) +[2023-10-08 18:27:53,519][21194] Updated weights for policy 1, policy_version 67040 (0.0008) +[2023-10-08 18:27:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137789440. Throughput: 0: 1728.7, 1: 1732.0. Samples: 34453728. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:27:53,803][19739] Avg episode reward: [(0, '1015.590'), (1, '913.350')] +[2023-10-08 18:27:53,841][21195] Updated weights for policy 0, policy_version 67530 (0.0009) +[2023-10-08 18:27:54,213][21195] Updated weights for policy 0, policy_version 67540 (0.0008) +[2023-10-08 18:27:54,589][21195] Updated weights for policy 0, policy_version 67550 (0.0008) +[2023-10-08 18:27:57,459][21194] Updated weights for policy 1, policy_version 67050 (0.0007) +[2023-10-08 18:27:57,829][21194] Updated weights for policy 1, policy_version 67060 (0.0008) +[2023-10-08 18:27:58,195][21194] Updated weights for policy 1, policy_version 67070 (0.0007) +[2023-10-08 18:27:58,431][21195] Updated weights for policy 0, policy_version 67560 (0.0008) +[2023-10-08 18:27:58,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 137854976. Throughput: 0: 1737.6, 1: 1709.8. Samples: 34474230. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:27:58,803][19739] Avg episode reward: [(0, '1015.590'), (1, '913.350')] +[2023-10-08 18:27:58,807][21195] Updated weights for policy 0, policy_version 67570 (0.0011) +[2023-10-08 18:27:59,189][21195] Updated weights for policy 0, policy_version 67580 (0.0010) +[2023-10-08 18:28:02,085][21194] Updated weights for policy 1, policy_version 67080 (0.0008) +[2023-10-08 18:28:02,441][21194] Updated weights for policy 1, policy_version 67090 (0.0008) +[2023-10-08 18:28:02,811][21194] Updated weights for policy 1, policy_version 67100 (0.0009) +[2023-10-08 18:28:03,035][21195] Updated weights for policy 0, policy_version 67590 (0.0008) +[2023-10-08 18:28:03,406][21195] Updated weights for policy 0, policy_version 67600 (0.0009) +[2023-10-08 18:28:03,775][21195] Updated weights for policy 0, policy_version 67610 (0.0009) +[2023-10-08 18:28:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 137920512. Throughput: 0: 1718.7, 1: 1738.7. Samples: 34489712. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:28:03,804][19739] Avg episode reward: [(0, '1015.590'), (1, '913.350')] +[2023-10-08 18:28:06,768][21194] Updated weights for policy 1, policy_version 67110 (0.0008) +[2023-10-08 18:28:07,141][21194] Updated weights for policy 1, policy_version 67120 (0.0009) +[2023-10-08 18:28:07,506][21194] Updated weights for policy 1, policy_version 67130 (0.0008) +[2023-10-08 18:28:07,726][21195] Updated weights for policy 0, policy_version 67620 (0.0009) +[2023-10-08 18:28:08,089][21195] Updated weights for policy 0, policy_version 67630 (0.0010) +[2023-10-08 18:28:08,455][21195] Updated weights for policy 0, policy_version 67640 (0.0010) +[2023-10-08 18:28:08,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 138018816. Throughput: 0: 1743.1, 1: 1728.0. Samples: 34505740. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 18:28:08,803][19739] Avg episode reward: [(0, '1015.590'), (1, '913.350')] +[2023-10-08 18:28:11,609][21194] Updated weights for policy 1, policy_version 67140 (0.0008) +[2023-10-08 18:28:11,999][21194] Updated weights for policy 1, policy_version 67150 (0.0008) +[2023-10-08 18:28:12,371][21194] Updated weights for policy 1, policy_version 67160 (0.0009) +[2023-10-08 18:28:12,452][21195] Updated weights for policy 0, policy_version 67650 (0.0009) +[2023-10-08 18:28:12,858][21195] Updated weights for policy 0, policy_version 67660 (0.0008) +[2023-10-08 18:28:13,222][21195] Updated weights for policy 0, policy_version 67670 (0.0007) +[2023-10-08 18:28:13,594][21195] Updated weights for policy 0, policy_version 67680 (0.0009) +[2023-10-08 18:28:13,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 138084352. Throughput: 0: 1742.7, 1: 1709.9. Samples: 34525776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:13,804][19739] Avg episode reward: [(0, '1015.590'), (1, '899.070')] +[2023-10-08 18:28:16,191][21194] Updated weights for policy 1, policy_version 67170 (0.0007) +[2023-10-08 18:28:16,547][21194] Updated weights for policy 1, policy_version 67180 (0.0007) +[2023-10-08 18:28:16,919][21194] Updated weights for policy 1, policy_version 67190 (0.0008) +[2023-10-08 18:28:17,283][21194] Updated weights for policy 1, policy_version 67200 (0.0009) +[2023-10-08 18:28:17,389][21195] Updated weights for policy 0, policy_version 67690 (0.0008) +[2023-10-08 18:28:17,764][21195] Updated weights for policy 0, policy_version 67700 (0.0008) +[2023-10-08 18:28:18,122][21195] Updated weights for policy 0, policy_version 67710 (0.0007) +[2023-10-08 18:28:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 138149888. Throughput: 0: 1720.9, 1: 1739.6. Samples: 34541576. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:18,803][19739] Avg episode reward: [(0, '1015.590'), (1, '908.000')] +[2023-10-08 18:28:21,228][21194] Updated weights for policy 1, policy_version 67210 (0.0009) +[2023-10-08 18:28:21,599][21194] Updated weights for policy 1, policy_version 67220 (0.0007) +[2023-10-08 18:28:21,953][21194] Updated weights for policy 1, policy_version 67230 (0.0008) +[2023-10-08 18:28:22,053][21195] Updated weights for policy 0, policy_version 67720 (0.0008) +[2023-10-08 18:28:22,420][21195] Updated weights for policy 0, policy_version 67730 (0.0007) +[2023-10-08 18:28:22,799][21195] Updated weights for policy 0, policy_version 67740 (0.0009) +[2023-10-08 18:28:23,802][19739] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 138215424. Throughput: 0: 1744.2, 1: 1700.1. Samples: 34556702. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:23,803][19739] Avg episode reward: [(0, '1031.160'), (1, '909.240')] +[2023-10-08 18:28:25,897][21194] Updated weights for policy 1, policy_version 67240 (0.0009) +[2023-10-08 18:28:26,268][21194] Updated weights for policy 1, policy_version 67250 (0.0007) +[2023-10-08 18:28:26,634][21194] Updated weights for policy 1, policy_version 67260 (0.0009) +[2023-10-08 18:28:26,802][21195] Updated weights for policy 0, policy_version 67750 (0.0008) +[2023-10-08 18:28:27,172][21195] Updated weights for policy 0, policy_version 67760 (0.0008) +[2023-10-08 18:28:27,547][21195] Updated weights for policy 0, policy_version 67770 (0.0009) +[2023-10-08 18:28:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 138280960. Throughput: 0: 1714.5, 1: 1706.0. Samples: 34576866. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:28,803][19739] Avg episode reward: [(0, '1030.680'), (1, '909.240')] +[2023-10-08 18:28:30,553][21194] Updated weights for policy 1, policy_version 67270 (0.0008) +[2023-10-08 18:28:30,921][21194] Updated weights for policy 1, policy_version 67280 (0.0007) +[2023-10-08 18:28:31,287][21194] Updated weights for policy 1, policy_version 67290 (0.0009) +[2023-10-08 18:28:31,499][21195] Updated weights for policy 0, policy_version 67780 (0.0008) +[2023-10-08 18:28:31,859][21195] Updated weights for policy 0, policy_version 67790 (0.0008) +[2023-10-08 18:28:32,233][21195] Updated weights for policy 0, policy_version 67800 (0.0009) +[2023-10-08 18:28:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 138346496. Throughput: 0: 1715.8, 1: 1719.2. Samples: 34592880. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:33,804][19739] Avg episode reward: [(0, '1030.680'), (1, '909.240')] +[2023-10-08 18:28:35,254][21194] Updated weights for policy 1, policy_version 67300 (0.0008) +[2023-10-08 18:28:35,621][21194] Updated weights for policy 1, policy_version 67310 (0.0009) +[2023-10-08 18:28:35,990][21194] Updated weights for policy 1, policy_version 67320 (0.0007) +[2023-10-08 18:28:36,245][21195] Updated weights for policy 0, policy_version 67810 (0.0007) +[2023-10-08 18:28:36,623][21195] Updated weights for policy 0, policy_version 67820 (0.0009) +[2023-10-08 18:28:37,001][21195] Updated weights for policy 0, policy_version 67830 (0.0009) +[2023-10-08 18:28:37,370][21195] Updated weights for policy 0, policy_version 67840 (0.0007) +[2023-10-08 18:28:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 138412032. Throughput: 0: 1728.5, 1: 1711.0. Samples: 34608508. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:38,803][19739] Avg episode reward: [(0, '1030.680'), (1, '909.240')] +[2023-10-08 18:28:39,909][21194] Updated weights for policy 1, policy_version 67330 (0.0008) +[2023-10-08 18:28:40,273][21194] Updated weights for policy 1, policy_version 67340 (0.0012) +[2023-10-08 18:28:40,643][21194] Updated weights for policy 1, policy_version 67350 (0.0010) +[2023-10-08 18:28:41,000][21194] Updated weights for policy 1, policy_version 67360 (0.0010) +[2023-10-08 18:28:41,025][21195] Updated weights for policy 0, policy_version 67850 (0.0009) +[2023-10-08 18:28:41,396][21195] Updated weights for policy 0, policy_version 67860 (0.0009) +[2023-10-08 18:28:41,764][21195] Updated weights for policy 0, policy_version 67870 (0.0008) +[2023-10-08 18:28:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 138477568. Throughput: 0: 1715.2, 1: 1730.8. Samples: 34629298. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:43,803][19739] Avg episode reward: [(0, '1046.190'), (1, '909.240')] +[2023-10-08 18:28:43,812][20740] Saving new best policy, reward=1046.190! +[2023-10-08 18:28:45,017][21194] Updated weights for policy 1, policy_version 67370 (0.0008) +[2023-10-08 18:28:45,391][21194] Updated weights for policy 1, policy_version 67380 (0.0008) +[2023-10-08 18:28:45,694][21195] Updated weights for policy 0, policy_version 67880 (0.0009) +[2023-10-08 18:28:45,753][21194] Updated weights for policy 1, policy_version 67390 (0.0007) +[2023-10-08 18:28:46,056][21195] Updated weights for policy 0, policy_version 67890 (0.0010) +[2023-10-08 18:28:46,421][21195] Updated weights for policy 0, policy_version 67900 (0.0007) +[2023-10-08 18:28:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 138543104. Throughput: 0: 1741.9, 1: 1703.6. Samples: 34644756. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:48,803][19739] Avg episode reward: [(0, '1046.190'), (1, '909.240')] +[2023-10-08 18:28:49,662][21194] Updated weights for policy 1, policy_version 67400 (0.0008) +[2023-10-08 18:28:50,029][21194] Updated weights for policy 1, policy_version 67410 (0.0010) +[2023-10-08 18:28:50,279][21195] Updated weights for policy 0, policy_version 67910 (0.0007) +[2023-10-08 18:28:50,393][21194] Updated weights for policy 1, policy_version 67420 (0.0008) +[2023-10-08 18:28:50,653][21195] Updated weights for policy 0, policy_version 67920 (0.0009) +[2023-10-08 18:28:51,022][21195] Updated weights for policy 0, policy_version 67930 (0.0009) +[2023-10-08 18:28:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 138608640. Throughput: 0: 1718.8, 1: 1714.8. Samples: 34660254. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:53,803][19739] Avg episode reward: [(0, '1046.190'), (1, '909.240')] +[2023-10-08 18:28:54,250][21194] Updated weights for policy 1, policy_version 67430 (0.0009) +[2023-10-08 18:28:54,609][21194] Updated weights for policy 1, policy_version 67440 (0.0009) +[2023-10-08 18:28:54,932][21195] Updated weights for policy 0, policy_version 67940 (0.0011) +[2023-10-08 18:28:54,981][21194] Updated weights for policy 1, policy_version 67450 (0.0009) +[2023-10-08 18:28:55,292][21195] Updated weights for policy 0, policy_version 67950 (0.0008) +[2023-10-08 18:28:55,663][21195] Updated weights for policy 0, policy_version 67960 (0.0010) +[2023-10-08 18:28:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 138674176. Throughput: 0: 1731.7, 1: 1736.3. Samples: 34681832. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:28:58,803][19739] Avg episode reward: [(0, '1046.190'), (1, '924.210')] +[2023-10-08 18:28:59,133][21194] Updated weights for policy 1, policy_version 67460 (0.0010) +[2023-10-08 18:28:59,520][21194] Updated weights for policy 1, policy_version 67470 (0.0011) +[2023-10-08 18:28:59,667][21195] Updated weights for policy 0, policy_version 67970 (0.0008) +[2023-10-08 18:28:59,892][21194] Updated weights for policy 1, policy_version 67480 (0.0007) +[2023-10-08 18:29:00,070][21195] Updated weights for policy 0, policy_version 67980 (0.0007) +[2023-10-08 18:29:00,437][21195] Updated weights for policy 0, policy_version 67990 (0.0010) +[2023-10-08 18:29:00,807][21195] Updated weights for policy 0, policy_version 68000 (0.0010) +[2023-10-08 18:29:03,719][21194] Updated weights for policy 1, policy_version 67490 (0.0008) +[2023-10-08 18:29:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 138739712. Throughput: 0: 1746.3, 1: 1704.5. Samples: 34696862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:03,804][19739] Avg episode reward: [(0, '1046.190'), (1, '924.210')] +[2023-10-08 18:29:04,082][21194] Updated weights for policy 1, policy_version 67500 (0.0010) +[2023-10-08 18:29:04,456][21194] Updated weights for policy 1, policy_version 67510 (0.0007) +[2023-10-08 18:29:04,679][21195] Updated weights for policy 0, policy_version 68010 (0.0008) +[2023-10-08 18:29:04,813][21194] Updated weights for policy 1, policy_version 67520 (0.0008) +[2023-10-08 18:29:05,047][21195] Updated weights for policy 0, policy_version 68020 (0.0008) +[2023-10-08 18:29:05,417][21195] Updated weights for policy 0, policy_version 68030 (0.0009) +[2023-10-08 18:29:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 138805248. Throughput: 0: 1720.9, 1: 1738.1. Samples: 34712360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:08,803][19739] Avg episode reward: [(0, '1046.190'), (1, '924.210')] +[2023-10-08 18:29:08,842][21194] Updated weights for policy 1, policy_version 67530 (0.0010) +[2023-10-08 18:29:09,199][21194] Updated weights for policy 1, policy_version 67540 (0.0009) +[2023-10-08 18:29:09,336][21195] Updated weights for policy 0, policy_version 68040 (0.0007) +[2023-10-08 18:29:09,568][21194] Updated weights for policy 1, policy_version 67550 (0.0008) +[2023-10-08 18:29:09,699][21195] Updated weights for policy 0, policy_version 68050 (0.0007) +[2023-10-08 18:29:10,071][21195] Updated weights for policy 0, policy_version 68060 (0.0011) +[2023-10-08 18:29:13,406][21194] Updated weights for policy 1, policy_version 67560 (0.0007) +[2023-10-08 18:29:13,768][21194] Updated weights for policy 1, policy_version 67570 (0.0007) +[2023-10-08 18:29:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 138870784. Throughput: 0: 1751.6, 1: 1738.4. Samples: 34733916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:13,803][19739] Avg episode reward: [(0, '1040.420'), (1, '924.210')] +[2023-10-08 18:29:13,839][21195] Updated weights for policy 0, policy_version 68070 (0.0009) +[2023-10-08 18:29:14,138][21194] Updated weights for policy 1, policy_version 67580 (0.0008) +[2023-10-08 18:29:14,210][21195] Updated weights for policy 0, policy_version 68080 (0.0009) +[2023-10-08 18:29:14,282][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000067584_69206016.pth... +[2023-10-08 18:29:14,312][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000065952_67534848.pth +[2023-10-08 18:29:14,577][21195] Updated weights for policy 0, policy_version 68090 (0.0009) +[2023-10-08 18:29:14,792][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000068096_69730304.pth... +[2023-10-08 18:29:14,821][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000066464_68059136.pth +[2023-10-08 18:29:18,039][21194] Updated weights for policy 1, policy_version 67590 (0.0008) +[2023-10-08 18:29:18,408][21194] Updated weights for policy 1, policy_version 67600 (0.0010) +[2023-10-08 18:29:18,705][21195] Updated weights for policy 0, policy_version 68100 (0.0009) +[2023-10-08 18:29:18,784][21194] Updated weights for policy 1, policy_version 67610 (0.0007) +[2023-10-08 18:29:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 138936320. Throughput: 0: 1743.5, 1: 1720.9. Samples: 34748776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:18,803][19739] Avg episode reward: [(0, '1040.420'), (1, '924.210')] +[2023-10-08 18:29:19,065][21195] Updated weights for policy 0, policy_version 68110 (0.0007) +[2023-10-08 18:29:19,437][21195] Updated weights for policy 0, policy_version 68120 (0.0007) +[2023-10-08 18:29:22,794][21194] Updated weights for policy 1, policy_version 67620 (0.0009) +[2023-10-08 18:29:23,160][21194] Updated weights for policy 1, policy_version 67630 (0.0010) +[2023-10-08 18:29:23,395][21195] Updated weights for policy 0, policy_version 68130 (0.0008) +[2023-10-08 18:29:23,530][21194] Updated weights for policy 1, policy_version 67640 (0.0009) +[2023-10-08 18:29:23,768][21195] Updated weights for policy 0, policy_version 68140 (0.0007) +[2023-10-08 18:29:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 139001856. Throughput: 0: 1731.5, 1: 1734.9. Samples: 34764498. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:23,803][19739] Avg episode reward: [(0, '1040.060'), (1, '924.210')] +[2023-10-08 18:29:24,132][21195] Updated weights for policy 0, policy_version 68150 (0.0009) +[2023-10-08 18:29:24,502][21195] Updated weights for policy 0, policy_version 68160 (0.0007) +[2023-10-08 18:29:27,482][21194] Updated weights for policy 1, policy_version 67650 (0.0008) +[2023-10-08 18:29:27,853][21194] Updated weights for policy 1, policy_version 67660 (0.0011) +[2023-10-08 18:29:28,222][21194] Updated weights for policy 1, policy_version 67670 (0.0010) +[2023-10-08 18:29:28,443][21195] Updated weights for policy 0, policy_version 68170 (0.0008) +[2023-10-08 18:29:28,582][21194] Updated weights for policy 1, policy_version 67680 (0.0007) +[2023-10-08 18:29:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 139100160. Throughput: 0: 1743.0, 1: 1715.9. Samples: 34784948. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:28,803][19739] Avg episode reward: [(0, '1039.470'), (1, '924.210')] +[2023-10-08 18:29:28,816][21195] Updated weights for policy 0, policy_version 68180 (0.0008) +[2023-10-08 18:29:29,187][21195] Updated weights for policy 0, policy_version 68190 (0.0009) +[2023-10-08 18:29:32,675][21194] Updated weights for policy 1, policy_version 67690 (0.0008) +[2023-10-08 18:29:33,041][21194] Updated weights for policy 1, policy_version 67700 (0.0008) +[2023-10-08 18:29:33,178][21195] Updated weights for policy 0, policy_version 68200 (0.0008) +[2023-10-08 18:29:33,403][21194] Updated weights for policy 1, policy_version 67710 (0.0007) +[2023-10-08 18:29:33,539][21195] Updated weights for policy 0, policy_version 68210 (0.0008) +[2023-10-08 18:29:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 139165696. Throughput: 0: 1716.4, 1: 1732.4. Samples: 34799956. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:33,803][19739] Avg episode reward: [(0, '1039.840'), (1, '929.020')] +[2023-10-08 18:29:33,908][21195] Updated weights for policy 0, policy_version 68220 (0.0011) +[2023-10-08 18:29:37,248][21194] Updated weights for policy 1, policy_version 67720 (0.0008) +[2023-10-08 18:29:37,610][21194] Updated weights for policy 1, policy_version 67730 (0.0010) +[2023-10-08 18:29:37,958][21195] Updated weights for policy 0, policy_version 68230 (0.0009) +[2023-10-08 18:29:37,981][21194] Updated weights for policy 1, policy_version 67740 (0.0008) +[2023-10-08 18:29:38,323][21195] Updated weights for policy 0, policy_version 68240 (0.0008) +[2023-10-08 18:29:38,699][21195] Updated weights for policy 0, policy_version 68250 (0.0008) +[2023-10-08 18:29:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 139231232. Throughput: 0: 1733.7, 1: 1733.2. Samples: 34816264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:29:38,803][19739] Avg episode reward: [(0, '1039.840'), (1, '929.020')] +[2023-10-08 18:29:42,007][21194] Updated weights for policy 1, policy_version 67750 (0.0009) +[2023-10-08 18:29:42,371][21194] Updated weights for policy 1, policy_version 67760 (0.0008) +[2023-10-08 18:29:42,607][21195] Updated weights for policy 0, policy_version 68260 (0.0010) +[2023-10-08 18:29:42,742][21194] Updated weights for policy 1, policy_version 67770 (0.0007) +[2023-10-08 18:29:42,974][21195] Updated weights for policy 0, policy_version 68270 (0.0009) +[2023-10-08 18:29:43,349][21195] Updated weights for policy 0, policy_version 68280 (0.0008) +[2023-10-08 18:29:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 139329536. Throughput: 0: 1722.4, 1: 1700.8. Samples: 34835876. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:29:43,803][19739] Avg episode reward: [(0, '1039.840'), (1, '929.020')] +[2023-10-08 18:29:46,865][21194] Updated weights for policy 1, policy_version 67780 (0.0007) +[2023-10-08 18:29:47,255][21194] Updated weights for policy 1, policy_version 67790 (0.0008) +[2023-10-08 18:29:47,370][21195] Updated weights for policy 0, policy_version 68290 (0.0007) +[2023-10-08 18:29:47,619][21194] Updated weights for policy 1, policy_version 67800 (0.0007) +[2023-10-08 18:29:47,776][21195] Updated weights for policy 0, policy_version 68300 (0.0008) +[2023-10-08 18:29:48,150][21195] Updated weights for policy 0, policy_version 68310 (0.0010) +[2023-10-08 18:29:48,513][21195] Updated weights for policy 0, policy_version 68320 (0.0008) +[2023-10-08 18:29:48,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 139395072. Throughput: 0: 1705.6, 1: 1732.8. Samples: 34851586. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:29:48,803][19739] Avg episode reward: [(0, '1039.850'), (1, '929.020')] +[2023-10-08 18:29:51,590][21194] Updated weights for policy 1, policy_version 67810 (0.0007) +[2023-10-08 18:29:51,963][21194] Updated weights for policy 1, policy_version 67820 (0.0009) +[2023-10-08 18:29:52,322][21194] Updated weights for policy 1, policy_version 67830 (0.0007) +[2023-10-08 18:29:52,498][21195] Updated weights for policy 0, policy_version 68330 (0.0008) +[2023-10-08 18:29:52,697][21194] Updated weights for policy 1, policy_version 67840 (0.0008) +[2023-10-08 18:29:52,864][21195] Updated weights for policy 0, policy_version 68340 (0.0007) +[2023-10-08 18:29:53,230][21195] Updated weights for policy 0, policy_version 68350 (0.0009) +[2023-10-08 18:29:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 139460608. Throughput: 0: 1732.4, 1: 1716.5. Samples: 34867558. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:29:53,803][19739] Avg episode reward: [(0, '1035.820'), (1, '929.020')] +[2023-10-08 18:29:56,725][21194] Updated weights for policy 1, policy_version 67850 (0.0009) +[2023-10-08 18:29:57,091][21194] Updated weights for policy 1, policy_version 67860 (0.0007) +[2023-10-08 18:29:57,107][21195] Updated weights for policy 0, policy_version 68360 (0.0007) +[2023-10-08 18:29:57,459][21194] Updated weights for policy 1, policy_version 67870 (0.0008) +[2023-10-08 18:29:57,478][21195] Updated weights for policy 0, policy_version 68370 (0.0009) +[2023-10-08 18:29:57,843][21195] Updated weights for policy 0, policy_version 68380 (0.0008) +[2023-10-08 18:29:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 139526144. Throughput: 0: 1705.8, 1: 1694.5. Samples: 34886932. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:29:58,804][19739] Avg episode reward: [(0, '1035.820'), (1, '929.020')] +[2023-10-08 18:30:01,263][21194] Updated weights for policy 1, policy_version 67880 (0.0008) +[2023-10-08 18:30:01,617][21194] Updated weights for policy 1, policy_version 67890 (0.0008) +[2023-10-08 18:30:01,664][21195] Updated weights for policy 0, policy_version 68390 (0.0009) +[2023-10-08 18:30:01,992][21194] Updated weights for policy 1, policy_version 67900 (0.0009) +[2023-10-08 18:30:02,034][21195] Updated weights for policy 0, policy_version 68400 (0.0008) +[2023-10-08 18:30:02,399][21195] Updated weights for policy 0, policy_version 68410 (0.0007) +[2023-10-08 18:30:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 139591680. Throughput: 0: 1711.0, 1: 1726.5. Samples: 34903462. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:30:03,803][19739] Avg episode reward: [(0, '1035.820'), (1, '928.820')] +[2023-10-08 18:30:05,993][21194] Updated weights for policy 1, policy_version 67910 (0.0008) +[2023-10-08 18:30:06,318][21195] Updated weights for policy 0, policy_version 68420 (0.0009) +[2023-10-08 18:30:06,357][21194] Updated weights for policy 1, policy_version 67920 (0.0009) +[2023-10-08 18:30:06,681][21195] Updated weights for policy 0, policy_version 68430 (0.0009) +[2023-10-08 18:30:06,717][21194] Updated weights for policy 1, policy_version 67930 (0.0008) +[2023-10-08 18:30:07,047][21195] Updated weights for policy 0, policy_version 68440 (0.0008) +[2023-10-08 18:30:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 139657216. Throughput: 0: 1725.6, 1: 1691.9. Samples: 34918282. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:30:08,803][19739] Avg episode reward: [(0, '1035.820'), (1, '928.820')] +[2023-10-08 18:30:10,629][21194] Updated weights for policy 1, policy_version 67940 (0.0008) +[2023-10-08 18:30:10,996][21194] Updated weights for policy 1, policy_version 67950 (0.0009) +[2023-10-08 18:30:11,007][21195] Updated weights for policy 0, policy_version 68450 (0.0009) +[2023-10-08 18:30:11,354][21194] Updated weights for policy 1, policy_version 67960 (0.0009) +[2023-10-08 18:30:11,366][21195] Updated weights for policy 0, policy_version 68460 (0.0007) +[2023-10-08 18:30:11,730][21195] Updated weights for policy 0, policy_version 68470 (0.0008) +[2023-10-08 18:30:12,098][21195] Updated weights for policy 0, policy_version 68480 (0.0007) +[2023-10-08 18:30:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 139722752. Throughput: 0: 1713.9, 1: 1711.5. Samples: 34939090. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:30:13,803][19739] Avg episode reward: [(0, '1036.030'), (1, '928.820')] +[2023-10-08 18:30:15,381][21194] Updated weights for policy 1, policy_version 67970 (0.0009) +[2023-10-08 18:30:15,736][21194] Updated weights for policy 1, policy_version 67980 (0.0008) +[2023-10-08 18:30:15,830][21195] Updated weights for policy 0, policy_version 68490 (0.0008) +[2023-10-08 18:30:16,099][21194] Updated weights for policy 1, policy_version 67990 (0.0008) +[2023-10-08 18:30:16,205][21195] Updated weights for policy 0, policy_version 68500 (0.0007) +[2023-10-08 18:30:16,463][21194] Updated weights for policy 1, policy_version 68000 (0.0007) +[2023-10-08 18:30:16,574][21195] Updated weights for policy 0, policy_version 68510 (0.0010) +[2023-10-08 18:30:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 139788288. Throughput: 0: 1741.8, 1: 1706.1. Samples: 34955112. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:30:18,803][19739] Avg episode reward: [(0, '1036.030'), (1, '928.820')] +[2023-10-08 18:30:20,488][21194] Updated weights for policy 1, policy_version 68010 (0.0007) +[2023-10-08 18:30:20,583][21195] Updated weights for policy 0, policy_version 68520 (0.0008) +[2023-10-08 18:30:20,852][21194] Updated weights for policy 1, policy_version 68020 (0.0009) +[2023-10-08 18:30:20,945][21195] Updated weights for policy 0, policy_version 68530 (0.0009) +[2023-10-08 18:30:21,217][21194] Updated weights for policy 1, policy_version 68030 (0.0009) +[2023-10-08 18:30:21,319][21195] Updated weights for policy 0, policy_version 68540 (0.0009) +[2023-10-08 18:30:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 139853824. Throughput: 0: 1720.7, 1: 1695.1. Samples: 34969972. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:30:23,803][19739] Avg episode reward: [(0, '1036.030'), (1, '932.090')] +[2023-10-08 18:30:25,212][21195] Updated weights for policy 0, policy_version 68550 (0.0009) +[2023-10-08 18:30:25,271][21194] Updated weights for policy 1, policy_version 68040 (0.0008) +[2023-10-08 18:30:25,584][21195] Updated weights for policy 0, policy_version 68560 (0.0007) +[2023-10-08 18:30:25,640][21194] Updated weights for policy 1, policy_version 68050 (0.0009) +[2023-10-08 18:30:25,949][21195] Updated weights for policy 0, policy_version 68570 (0.0007) +[2023-10-08 18:30:26,004][21194] Updated weights for policy 1, policy_version 68060 (0.0009) +[2023-10-08 18:30:28,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 139919360. Throughput: 0: 1728.0, 1: 1726.6. Samples: 34991334. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:30:28,804][19739] Avg episode reward: [(0, '1036.030'), (1, '932.090')] +[2023-10-08 18:30:29,858][21194] Updated weights for policy 1, policy_version 68070 (0.0008) +[2023-10-08 18:30:29,871][21195] Updated weights for policy 0, policy_version 68580 (0.0007) +[2023-10-08 18:30:30,228][21194] Updated weights for policy 1, policy_version 68080 (0.0008) +[2023-10-08 18:30:30,230][21195] Updated weights for policy 0, policy_version 68590 (0.0007) +[2023-10-08 18:30:30,591][21194] Updated weights for policy 1, policy_version 68090 (0.0008) +[2023-10-08 18:30:30,593][21195] Updated weights for policy 0, policy_version 68600 (0.0008) +[2023-10-08 18:30:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 139984896. Throughput: 0: 1751.0, 1: 1696.9. Samples: 35006742. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:30:33,803][19739] Avg episode reward: [(0, '1036.280'), (1, '932.090')] +[2023-10-08 18:30:34,597][21195] Updated weights for policy 0, policy_version 68610 (0.0008) +[2023-10-08 18:30:34,722][21194] Updated weights for policy 1, policy_version 68100 (0.0008) +[2023-10-08 18:30:35,002][21195] Updated weights for policy 0, policy_version 68620 (0.0009) +[2023-10-08 18:30:35,110][21194] Updated weights for policy 1, policy_version 68110 (0.0009) +[2023-10-08 18:30:35,363][21195] Updated weights for policy 0, policy_version 68630 (0.0008) +[2023-10-08 18:30:35,479][21194] Updated weights for policy 1, policy_version 68120 (0.0009) +[2023-10-08 18:30:35,733][21195] Updated weights for policy 0, policy_version 68640 (0.0008) +[2023-10-08 18:30:38,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 140050432. Throughput: 0: 1724.0, 1: 1703.0. Samples: 35021774. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:30:38,803][19739] Avg episode reward: [(0, '1051.220'), (1, '932.090')] +[2023-10-08 18:30:38,804][20740] Saving new best policy, reward=1051.220! +[2023-10-08 18:30:39,433][21194] Updated weights for policy 1, policy_version 68130 (0.0009) +[2023-10-08 18:30:39,626][21195] Updated weights for policy 0, policy_version 68650 (0.0008) +[2023-10-08 18:30:39,798][21194] Updated weights for policy 1, policy_version 68140 (0.0008) +[2023-10-08 18:30:39,987][21195] Updated weights for policy 0, policy_version 68660 (0.0007) +[2023-10-08 18:30:40,156][21194] Updated weights for policy 1, policy_version 68150 (0.0008) +[2023-10-08 18:30:40,347][21195] Updated weights for policy 0, policy_version 68670 (0.0009) +[2023-10-08 18:30:40,523][21194] Updated weights for policy 1, policy_version 68160 (0.0011) +[2023-10-08 18:30:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 140115968. Throughput: 0: 1745.2, 1: 1722.8. Samples: 35042994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:30:43,803][19739] Avg episode reward: [(0, '1051.220'), (1, '932.090')] +[2023-10-08 18:30:44,350][21195] Updated weights for policy 0, policy_version 68680 (0.0008) +[2023-10-08 18:30:44,605][21194] Updated weights for policy 1, policy_version 68170 (0.0007) +[2023-10-08 18:30:44,724][21195] Updated weights for policy 0, policy_version 68690 (0.0009) +[2023-10-08 18:30:44,966][21194] Updated weights for policy 1, policy_version 68180 (0.0008) +[2023-10-08 18:30:45,095][21195] Updated weights for policy 0, policy_version 68700 (0.0010) +[2023-10-08 18:30:45,329][21194] Updated weights for policy 1, policy_version 68190 (0.0008) +[2023-10-08 18:30:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 140181504. Throughput: 0: 1751.4, 1: 1690.1. Samples: 35058332. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:30:48,803][19739] Avg episode reward: [(0, '1051.300'), (1, '932.090')] +[2023-10-08 18:30:49,011][21195] Updated weights for policy 0, policy_version 68710 (0.0008) +[2023-10-08 18:30:49,286][21194] Updated weights for policy 1, policy_version 68200 (0.0007) +[2023-10-08 18:30:49,380][21195] Updated weights for policy 0, policy_version 68720 (0.0007) +[2023-10-08 18:30:49,649][21194] Updated weights for policy 1, policy_version 68210 (0.0007) +[2023-10-08 18:30:49,740][21195] Updated weights for policy 0, policy_version 68730 (0.0007) +[2023-10-08 18:30:49,958][20740] Saving new best policy, reward=1051.300! +[2023-10-08 18:30:50,016][21194] Updated weights for policy 1, policy_version 68220 (0.0009) +[2023-10-08 18:30:53,464][21195] Updated weights for policy 0, policy_version 68740 (0.0008) +[2023-10-08 18:30:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 140247040. Throughput: 0: 1734.6, 1: 1720.2. Samples: 35073750. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:30:53,804][19739] Avg episode reward: [(0, '1051.300'), (1, '932.090')] +[2023-10-08 18:30:53,823][21195] Updated weights for policy 0, policy_version 68750 (0.0008) +[2023-10-08 18:30:53,892][21194] Updated weights for policy 1, policy_version 68230 (0.0007) +[2023-10-08 18:30:54,202][21195] Updated weights for policy 0, policy_version 68760 (0.0011) +[2023-10-08 18:30:54,267][21194] Updated weights for policy 1, policy_version 68240 (0.0008) +[2023-10-08 18:30:54,627][21194] Updated weights for policy 1, policy_version 68250 (0.0010) +[2023-10-08 18:30:58,265][21195] Updated weights for policy 0, policy_version 68770 (0.0008) +[2023-10-08 18:30:58,632][21195] Updated weights for policy 0, policy_version 68780 (0.0009) +[2023-10-08 18:30:58,717][21194] Updated weights for policy 1, policy_version 68260 (0.0009) +[2023-10-08 18:30:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 140312576. Throughput: 0: 1750.2, 1: 1718.2. Samples: 35095166. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:30:58,803][19739] Avg episode reward: [(0, '1051.300'), (1, '932.090')] +[2023-10-08 18:30:58,997][21195] Updated weights for policy 0, policy_version 68790 (0.0008) +[2023-10-08 18:30:59,087][21194] Updated weights for policy 1, policy_version 68270 (0.0008) +[2023-10-08 18:30:59,368][21195] Updated weights for policy 0, policy_version 68800 (0.0007) +[2023-10-08 18:30:59,457][21194] Updated weights for policy 1, policy_version 68280 (0.0007) +[2023-10-08 18:31:03,230][21194] Updated weights for policy 1, policy_version 68290 (0.0008) +[2023-10-08 18:31:03,289][21195] Updated weights for policy 0, policy_version 68810 (0.0007) +[2023-10-08 18:31:03,602][21194] Updated weights for policy 1, policy_version 68300 (0.0009) +[2023-10-08 18:31:03,660][21195] Updated weights for policy 0, policy_version 68820 (0.0007) +[2023-10-08 18:31:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 140378112. Throughput: 0: 1722.1, 1: 1709.9. Samples: 35109550. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:03,803][19739] Avg episode reward: [(0, '1051.300'), (1, '932.090')] +[2023-10-08 18:31:03,968][21194] Updated weights for policy 1, policy_version 68310 (0.0009) +[2023-10-08 18:31:04,034][21195] Updated weights for policy 0, policy_version 68830 (0.0007) +[2023-10-08 18:31:04,339][21194] Updated weights for policy 1, policy_version 68320 (0.0009) +[2023-10-08 18:31:07,898][21195] Updated weights for policy 0, policy_version 68840 (0.0009) +[2023-10-08 18:31:08,111][21194] Updated weights for policy 1, policy_version 68330 (0.0007) +[2023-10-08 18:31:08,267][21195] Updated weights for policy 0, policy_version 68850 (0.0009) +[2023-10-08 18:31:08,473][21194] Updated weights for policy 1, policy_version 68340 (0.0008) +[2023-10-08 18:31:08,628][21195] Updated weights for policy 0, policy_version 68860 (0.0009) +[2023-10-08 18:31:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 140476416. Throughput: 0: 1743.9, 1: 1723.9. Samples: 35126024. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:08,803][19739] Avg episode reward: [(0, '1051.300'), (1, '931.840')] +[2023-10-08 18:31:08,829][21194] Updated weights for policy 1, policy_version 68350 (0.0007) +[2023-10-08 18:31:12,563][21195] Updated weights for policy 0, policy_version 68870 (0.0009) +[2023-10-08 18:31:12,829][21194] Updated weights for policy 1, policy_version 68360 (0.0009) +[2023-10-08 18:31:12,931][21195] Updated weights for policy 0, policy_version 68880 (0.0008) +[2023-10-08 18:31:13,188][21194] Updated weights for policy 1, policy_version 68370 (0.0008) +[2023-10-08 18:31:13,298][21195] Updated weights for policy 0, policy_version 68890 (0.0009) +[2023-10-08 18:31:13,556][21194] Updated weights for policy 1, policy_version 68380 (0.0008) +[2023-10-08 18:31:13,803][19739] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 140574720. Throughput: 0: 1732.8, 1: 1713.7. Samples: 35146424. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:13,803][19739] Avg episode reward: [(0, '1051.300'), (1, '917.350')] +[2023-10-08 18:31:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000068896_70549504.pth... +[2023-10-08 18:31:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000068384_70025216.pth... +[2023-10-08 18:31:13,841][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000067264_68878336.pth +[2023-10-08 18:31:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000066752_68354048.pth +[2023-10-08 18:31:17,108][21195] Updated weights for policy 0, policy_version 68900 (0.0008) +[2023-10-08 18:31:17,468][21195] Updated weights for policy 0, policy_version 68910 (0.0008) +[2023-10-08 18:31:17,506][21194] Updated weights for policy 1, policy_version 68390 (0.0007) +[2023-10-08 18:31:17,837][21195] Updated weights for policy 0, policy_version 68920 (0.0008) +[2023-10-08 18:31:17,876][21194] Updated weights for policy 1, policy_version 68400 (0.0008) +[2023-10-08 18:31:18,244][21194] Updated weights for policy 1, policy_version 68410 (0.0009) +[2023-10-08 18:31:18,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 140640256. Throughput: 0: 1714.3, 1: 1726.6. Samples: 35161580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:18,804][19739] Avg episode reward: [(0, '1051.300'), (1, '917.650')] +[2023-10-08 18:31:21,666][21195] Updated weights for policy 0, policy_version 68930 (0.0009) +[2023-10-08 18:31:22,034][21195] Updated weights for policy 0, policy_version 68940 (0.0008) +[2023-10-08 18:31:22,404][21195] Updated weights for policy 0, policy_version 68950 (0.0007) +[2023-10-08 18:31:22,454][21194] Updated weights for policy 1, policy_version 68420 (0.0009) +[2023-10-08 18:31:22,761][21195] Updated weights for policy 0, policy_version 68960 (0.0007) +[2023-10-08 18:31:22,835][21194] Updated weights for policy 1, policy_version 68430 (0.0010) +[2023-10-08 18:31:23,200][21194] Updated weights for policy 1, policy_version 68440 (0.0007) +[2023-10-08 18:31:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 140705792. Throughput: 0: 1735.8, 1: 1731.0. Samples: 35177782. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:23,803][19739] Avg episode reward: [(0, '1051.300'), (1, '917.650')] +[2023-10-08 18:31:26,753][21195] Updated weights for policy 0, policy_version 68970 (0.0008) +[2023-10-08 18:31:27,120][21195] Updated weights for policy 0, policy_version 68980 (0.0008) +[2023-10-08 18:31:27,181][21194] Updated weights for policy 1, policy_version 68450 (0.0008) +[2023-10-08 18:31:27,490][21195] Updated weights for policy 0, policy_version 68990 (0.0009) +[2023-10-08 18:31:27,546][21194] Updated weights for policy 1, policy_version 68460 (0.0008) +[2023-10-08 18:31:27,912][21194] Updated weights for policy 1, policy_version 68470 (0.0008) +[2023-10-08 18:31:28,277][21194] Updated weights for policy 1, policy_version 68480 (0.0008) +[2023-10-08 18:31:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 140771328. Throughput: 0: 1719.5, 1: 1706.1. Samples: 35197144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:28,803][19739] Avg episode reward: [(0, '1051.300'), (1, '917.880')] +[2023-10-08 18:31:31,586][21195] Updated weights for policy 0, policy_version 69000 (0.0009) +[2023-10-08 18:31:31,952][21195] Updated weights for policy 0, policy_version 69010 (0.0009) +[2023-10-08 18:31:32,308][21195] Updated weights for policy 0, policy_version 69020 (0.0007) +[2023-10-08 18:31:32,482][21194] Updated weights for policy 1, policy_version 68490 (0.0007) +[2023-10-08 18:31:32,847][21194] Updated weights for policy 1, policy_version 68500 (0.0007) +[2023-10-08 18:31:33,216][21194] Updated weights for policy 1, policy_version 68510 (0.0007) +[2023-10-08 18:31:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 140836864. Throughput: 0: 1716.0, 1: 1728.4. Samples: 35213330. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:33,803][19739] Avg episode reward: [(0, '1051.300'), (1, '933.190')] +[2023-10-08 18:31:36,044][21195] Updated weights for policy 0, policy_version 69030 (0.0007) +[2023-10-08 18:31:36,420][21195] Updated weights for policy 0, policy_version 69040 (0.0010) +[2023-10-08 18:31:36,788][21195] Updated weights for policy 0, policy_version 69050 (0.0010) +[2023-10-08 18:31:37,247][21194] Updated weights for policy 1, policy_version 68520 (0.0009) +[2023-10-08 18:31:37,607][21194] Updated weights for policy 1, policy_version 68530 (0.0007) +[2023-10-08 18:31:37,976][21194] Updated weights for policy 1, policy_version 68540 (0.0009) +[2023-10-08 18:31:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 140902400. Throughput: 0: 1720.4, 1: 1727.3. Samples: 35228894. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:38,803][19739] Avg episode reward: [(0, '1051.300'), (1, '933.190')] +[2023-10-08 18:31:40,746][21195] Updated weights for policy 0, policy_version 69060 (0.0008) +[2023-10-08 18:31:41,111][21195] Updated weights for policy 0, policy_version 69070 (0.0007) +[2023-10-08 18:31:41,489][21195] Updated weights for policy 0, policy_version 69080 (0.0009) +[2023-10-08 18:31:41,965][21194] Updated weights for policy 1, policy_version 68550 (0.0009) +[2023-10-08 18:31:42,322][21194] Updated weights for policy 1, policy_version 68560 (0.0008) +[2023-10-08 18:31:42,683][21194] Updated weights for policy 1, policy_version 68570 (0.0008) +[2023-10-08 18:31:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 140967936. Throughput: 0: 1716.5, 1: 1699.6. Samples: 35248890. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:43,803][19739] Avg episode reward: [(0, '1051.300'), (1, '948.050')] +[2023-10-08 18:31:45,477][21195] Updated weights for policy 0, policy_version 69090 (0.0008) +[2023-10-08 18:31:45,844][21195] Updated weights for policy 0, policy_version 69100 (0.0009) +[2023-10-08 18:31:46,211][21195] Updated weights for policy 0, policy_version 69110 (0.0007) +[2023-10-08 18:31:46,543][21194] Updated weights for policy 1, policy_version 68580 (0.0008) +[2023-10-08 18:31:46,582][21195] Updated weights for policy 0, policy_version 69120 (0.0007) +[2023-10-08 18:31:46,914][21194] Updated weights for policy 1, policy_version 68590 (0.0008) +[2023-10-08 18:31:47,275][21194] Updated weights for policy 1, policy_version 68600 (0.0009) +[2023-10-08 18:31:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 141033472. Throughput: 0: 1743.3, 1: 1729.6. Samples: 35265830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:48,803][19739] Avg episode reward: [(0, '1051.300'), (1, '963.510')] +[2023-10-08 18:31:50,363][21195] Updated weights for policy 0, policy_version 69130 (0.0010) +[2023-10-08 18:31:50,729][21195] Updated weights for policy 0, policy_version 69140 (0.0011) +[2023-10-08 18:31:51,096][21195] Updated weights for policy 0, policy_version 69150 (0.0008) +[2023-10-08 18:31:51,116][21194] Updated weights for policy 1, policy_version 68610 (0.0009) +[2023-10-08 18:31:51,478][21194] Updated weights for policy 1, policy_version 68620 (0.0008) +[2023-10-08 18:31:51,841][21194] Updated weights for policy 1, policy_version 68630 (0.0010) +[2023-10-08 18:31:52,213][21194] Updated weights for policy 1, policy_version 68640 (0.0007) +[2023-10-08 18:31:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 141099008. Throughput: 0: 1725.6, 1: 1704.6. Samples: 35280386. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:53,803][19739] Avg episode reward: [(0, '1016.960'), (1, '978.630')] +[2023-10-08 18:31:55,036][21195] Updated weights for policy 0, policy_version 69160 (0.0007) +[2023-10-08 18:31:55,419][21195] Updated weights for policy 0, policy_version 69170 (0.0008) +[2023-10-08 18:31:55,787][21195] Updated weights for policy 0, policy_version 69180 (0.0007) +[2023-10-08 18:31:56,145][21194] Updated weights for policy 1, policy_version 68650 (0.0008) +[2023-10-08 18:31:56,518][21194] Updated weights for policy 1, policy_version 68660 (0.0011) +[2023-10-08 18:31:56,878][21194] Updated weights for policy 1, policy_version 68670 (0.0009) +[2023-10-08 18:31:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 141164544. Throughput: 0: 1737.2, 1: 1712.8. Samples: 35301676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:31:58,803][19739] Avg episode reward: [(0, '1017.000'), (1, '978.550')] +[2023-10-08 18:31:59,674][21195] Updated weights for policy 0, policy_version 69190 (0.0010) +[2023-10-08 18:32:00,037][21195] Updated weights for policy 0, policy_version 69200 (0.0011) +[2023-10-08 18:32:00,412][21195] Updated weights for policy 0, policy_version 69210 (0.0009) +[2023-10-08 18:32:00,843][21194] Updated weights for policy 1, policy_version 68680 (0.0009) +[2023-10-08 18:32:01,214][21194] Updated weights for policy 1, policy_version 68690 (0.0010) +[2023-10-08 18:32:01,589][21194] Updated weights for policy 1, policy_version 68700 (0.0009) +[2023-10-08 18:32:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 141230080. Throughput: 0: 1756.4, 1: 1717.5. Samples: 35317902. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:32:03,804][19739] Avg episode reward: [(0, '1017.000'), (1, '978.550')] +[2023-10-08 18:32:04,259][21195] Updated weights for policy 0, policy_version 69220 (0.0009) +[2023-10-08 18:32:04,625][21195] Updated weights for policy 0, policy_version 69230 (0.0007) +[2023-10-08 18:32:04,998][21195] Updated weights for policy 0, policy_version 69240 (0.0008) +[2023-10-08 18:32:05,450][21194] Updated weights for policy 1, policy_version 68710 (0.0008) +[2023-10-08 18:32:05,816][21194] Updated weights for policy 1, policy_version 68720 (0.0010) +[2023-10-08 18:32:06,178][21194] Updated weights for policy 1, policy_version 68730 (0.0008) +[2023-10-08 18:32:08,743][21195] Updated weights for policy 0, policy_version 69250 (0.0007) +[2023-10-08 18:32:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 141295616. Throughput: 0: 1738.5, 1: 1702.7. Samples: 35332636. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:08,803][19739] Avg episode reward: [(0, '1017.000'), (1, '987.800')] +[2023-10-08 18:32:09,132][21195] Updated weights for policy 0, policy_version 69260 (0.0010) +[2023-10-08 18:32:09,498][21195] Updated weights for policy 0, policy_version 69270 (0.0009) +[2023-10-08 18:32:09,866][21195] Updated weights for policy 0, policy_version 69280 (0.0007) +[2023-10-08 18:32:10,039][21194] Updated weights for policy 1, policy_version 68740 (0.0008) +[2023-10-08 18:32:10,426][21194] Updated weights for policy 1, policy_version 68750 (0.0007) +[2023-10-08 18:32:10,789][21194] Updated weights for policy 1, policy_version 68760 (0.0007) +[2023-10-08 18:32:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 141361152. Throughput: 0: 1755.4, 1: 1728.6. Samples: 35353924. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:13,804][19739] Avg episode reward: [(0, '1017.000'), (1, '999.460')] +[2023-10-08 18:32:13,904][21195] Updated weights for policy 0, policy_version 69290 (0.0009) +[2023-10-08 18:32:14,275][21195] Updated weights for policy 0, policy_version 69300 (0.0009) +[2023-10-08 18:32:14,651][21195] Updated weights for policy 0, policy_version 69310 (0.0009) +[2023-10-08 18:32:14,676][21194] Updated weights for policy 1, policy_version 68770 (0.0008) +[2023-10-08 18:32:15,048][21194] Updated weights for policy 1, policy_version 68780 (0.0007) +[2023-10-08 18:32:15,413][21194] Updated weights for policy 1, policy_version 68790 (0.0012) +[2023-10-08 18:32:15,769][21194] Updated weights for policy 1, policy_version 68800 (0.0007) +[2023-10-08 18:32:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 141426688. Throughput: 0: 1747.4, 1: 1706.5. Samples: 35368758. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:18,803][19739] Avg episode reward: [(0, '1017.000'), (1, '995.390')] +[2023-10-08 18:32:18,902][21195] Updated weights for policy 0, policy_version 69320 (0.0008) +[2023-10-08 18:32:19,275][21195] Updated weights for policy 0, policy_version 69330 (0.0009) +[2023-10-08 18:32:19,636][21195] Updated weights for policy 0, policy_version 69340 (0.0009) +[2023-10-08 18:32:19,731][21194] Updated weights for policy 1, policy_version 68810 (0.0007) +[2023-10-08 18:32:20,092][21194] Updated weights for policy 1, policy_version 68820 (0.0010) +[2023-10-08 18:32:20,460][21194] Updated weights for policy 1, policy_version 68830 (0.0010) +[2023-10-08 18:32:23,469][21195] Updated weights for policy 0, policy_version 69350 (0.0007) +[2023-10-08 18:32:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 141492224. Throughput: 0: 1743.0, 1: 1708.7. Samples: 35384220. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:23,803][19739] Avg episode reward: [(0, '1017.000'), (1, '995.390')] +[2023-10-08 18:32:23,837][21195] Updated weights for policy 0, policy_version 69360 (0.0009) +[2023-10-08 18:32:24,213][21195] Updated weights for policy 0, policy_version 69370 (0.0007) +[2023-10-08 18:32:24,325][21194] Updated weights for policy 1, policy_version 68840 (0.0009) +[2023-10-08 18:32:24,688][21194] Updated weights for policy 1, policy_version 68850 (0.0009) +[2023-10-08 18:32:25,064][21194] Updated weights for policy 1, policy_version 68860 (0.0009) +[2023-10-08 18:32:28,176][21195] Updated weights for policy 0, policy_version 69380 (0.0007) +[2023-10-08 18:32:28,547][21195] Updated weights for policy 0, policy_version 69390 (0.0008) +[2023-10-08 18:32:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 141557760. Throughput: 0: 1747.0, 1: 1736.8. Samples: 35405660. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:28,803][19739] Avg episode reward: [(0, '1017.000'), (1, '995.650')] +[2023-10-08 18:32:28,909][21195] Updated weights for policy 0, policy_version 69400 (0.0007) +[2023-10-08 18:32:29,211][21194] Updated weights for policy 1, policy_version 68870 (0.0007) +[2023-10-08 18:32:29,569][21194] Updated weights for policy 1, policy_version 68880 (0.0007) +[2023-10-08 18:32:29,934][21194] Updated weights for policy 1, policy_version 68890 (0.0008) +[2023-10-08 18:32:32,863][21195] Updated weights for policy 0, policy_version 69410 (0.0008) +[2023-10-08 18:32:33,236][21195] Updated weights for policy 0, policy_version 69420 (0.0008) +[2023-10-08 18:32:33,598][21195] Updated weights for policy 0, policy_version 69430 (0.0008) +[2023-10-08 18:32:33,773][21194] Updated weights for policy 1, policy_version 68900 (0.0009) +[2023-10-08 18:32:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 141623296. Throughput: 0: 1718.3, 1: 1707.4. Samples: 35419988. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:33,803][19739] Avg episode reward: [(0, '1032.060'), (1, '996.600')] +[2023-10-08 18:32:33,968][21195] Updated weights for policy 0, policy_version 69440 (0.0009) +[2023-10-08 18:32:34,146][21194] Updated weights for policy 1, policy_version 68910 (0.0009) +[2023-10-08 18:32:34,507][21194] Updated weights for policy 1, policy_version 68920 (0.0008) +[2023-10-08 18:32:37,805][21195] Updated weights for policy 0, policy_version 69450 (0.0007) +[2023-10-08 18:32:38,166][21195] Updated weights for policy 0, policy_version 69460 (0.0007) +[2023-10-08 18:32:38,404][21194] Updated weights for policy 1, policy_version 68930 (0.0008) +[2023-10-08 18:32:38,542][21195] Updated weights for policy 0, policy_version 69470 (0.0007) +[2023-10-08 18:32:38,770][21194] Updated weights for policy 1, policy_version 68940 (0.0008) +[2023-10-08 18:32:38,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 141721600. Throughput: 0: 1743.3, 1: 1734.4. Samples: 35436880. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:38,803][19739] Avg episode reward: [(0, '1032.060'), (1, '1010.030')] +[2023-10-08 18:32:39,131][21194] Updated weights for policy 1, policy_version 68950 (0.0008) +[2023-10-08 18:32:39,499][21194] Updated weights for policy 1, policy_version 68960 (0.0007) +[2023-10-08 18:32:42,318][21195] Updated weights for policy 0, policy_version 69480 (0.0007) +[2023-10-08 18:32:42,675][21195] Updated weights for policy 0, policy_version 69490 (0.0008) +[2023-10-08 18:32:43,044][21195] Updated weights for policy 0, policy_version 69500 (0.0007) +[2023-10-08 18:32:43,375][21194] Updated weights for policy 1, policy_version 68970 (0.0007) +[2023-10-08 18:32:43,737][21194] Updated weights for policy 1, policy_version 68980 (0.0008) +[2023-10-08 18:32:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 141787136. Throughput: 0: 1727.6, 1: 1741.2. Samples: 35457770. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:43,803][19739] Avg episode reward: [(0, '1032.060'), (1, '1010.030')] +[2023-10-08 18:32:44,102][21194] Updated weights for policy 1, policy_version 68990 (0.0010) +[2023-10-08 18:32:46,930][21195] Updated weights for policy 0, policy_version 69510 (0.0008) +[2023-10-08 18:32:47,297][21195] Updated weights for policy 0, policy_version 69520 (0.0007) +[2023-10-08 18:32:47,663][21195] Updated weights for policy 0, policy_version 69530 (0.0008) +[2023-10-08 18:32:48,122][21194] Updated weights for policy 1, policy_version 69000 (0.0009) +[2023-10-08 18:32:48,492][21194] Updated weights for policy 1, policy_version 69010 (0.0008) +[2023-10-08 18:32:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 141852672. Throughput: 0: 1720.0, 1: 1723.7. Samples: 35472868. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:32:48,803][19739] Avg episode reward: [(0, '1046.450'), (1, '1010.030')] +[2023-10-08 18:32:48,863][21194] Updated weights for policy 1, policy_version 69020 (0.0008) +[2023-10-08 18:32:51,527][21195] Updated weights for policy 0, policy_version 69540 (0.0008) +[2023-10-08 18:32:51,893][21195] Updated weights for policy 0, policy_version 69550 (0.0007) +[2023-10-08 18:32:52,266][21195] Updated weights for policy 0, policy_version 69560 (0.0008) +[2023-10-08 18:32:52,547][21194] Updated weights for policy 1, policy_version 69030 (0.0008) +[2023-10-08 18:32:52,923][21194] Updated weights for policy 1, policy_version 69040 (0.0008) +[2023-10-08 18:32:53,290][21194] Updated weights for policy 1, policy_version 69050 (0.0008) +[2023-10-08 18:32:53,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 141950976. Throughput: 0: 1736.3, 1: 1749.8. Samples: 35489512. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:32:53,804][19739] Avg episode reward: [(0, '1046.450'), (1, '1010.030')] +[2023-10-08 18:32:56,253][21195] Updated weights for policy 0, policy_version 69570 (0.0008) +[2023-10-08 18:32:56,659][21195] Updated weights for policy 0, policy_version 69580 (0.0009) +[2023-10-08 18:32:57,022][21195] Updated weights for policy 0, policy_version 69590 (0.0007) +[2023-10-08 18:32:57,111][21194] Updated weights for policy 1, policy_version 69060 (0.0008) +[2023-10-08 18:32:57,391][21195] Updated weights for policy 0, policy_version 69600 (0.0008) +[2023-10-08 18:32:57,491][21194] Updated weights for policy 1, policy_version 69070 (0.0009) +[2023-10-08 18:32:57,854][21194] Updated weights for policy 1, policy_version 69080 (0.0009) +[2023-10-08 18:32:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 142016512. Throughput: 0: 1722.9, 1: 1724.0. Samples: 35509032. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:32:58,803][19739] Avg episode reward: [(0, '1046.450'), (1, '1010.030')] +[2023-10-08 18:33:01,149][21195] Updated weights for policy 0, policy_version 69610 (0.0009) +[2023-10-08 18:33:01,531][21195] Updated weights for policy 0, policy_version 69620 (0.0007) +[2023-10-08 18:33:01,898][21195] Updated weights for policy 0, policy_version 69630 (0.0012) +[2023-10-08 18:33:01,927][21194] Updated weights for policy 1, policy_version 69090 (0.0009) +[2023-10-08 18:33:02,298][21194] Updated weights for policy 1, policy_version 69100 (0.0009) +[2023-10-08 18:33:02,663][21194] Updated weights for policy 1, policy_version 69110 (0.0009) +[2023-10-08 18:33:03,031][21194] Updated weights for policy 1, policy_version 69120 (0.0008) +[2023-10-08 18:33:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 142082048. Throughput: 0: 1736.7, 1: 1748.9. Samples: 35525610. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:03,803][19739] Avg episode reward: [(0, '1046.450'), (1, '1010.030')] +[2023-10-08 18:33:05,817][21195] Updated weights for policy 0, policy_version 69640 (0.0009) +[2023-10-08 18:33:06,199][21195] Updated weights for policy 0, policy_version 69650 (0.0010) +[2023-10-08 18:33:06,561][21195] Updated weights for policy 0, policy_version 69660 (0.0008) +[2023-10-08 18:33:07,082][21194] Updated weights for policy 1, policy_version 69130 (0.0007) +[2023-10-08 18:33:07,457][21194] Updated weights for policy 1, policy_version 69140 (0.0009) +[2023-10-08 18:33:07,826][21194] Updated weights for policy 1, policy_version 69150 (0.0010) +[2023-10-08 18:33:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 142147584. Throughput: 0: 1735.2, 1: 1740.4. Samples: 35540622. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:08,803][19739] Avg episode reward: [(0, '1046.450'), (1, '1025.520')] +[2023-10-08 18:33:10,475][21195] Updated weights for policy 0, policy_version 69670 (0.0008) +[2023-10-08 18:33:10,845][21195] Updated weights for policy 0, policy_version 69680 (0.0008) +[2023-10-08 18:33:11,206][21195] Updated weights for policy 0, policy_version 69690 (0.0007) +[2023-10-08 18:33:11,905][21194] Updated weights for policy 1, policy_version 69160 (0.0009) +[2023-10-08 18:33:12,271][21194] Updated weights for policy 1, policy_version 69170 (0.0010) +[2023-10-08 18:33:12,637][21194] Updated weights for policy 1, policy_version 69180 (0.0009) +[2023-10-08 18:33:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 142213120. Throughput: 0: 1736.8, 1: 1723.3. Samples: 35561366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:13,803][19739] Avg episode reward: [(0, '1046.450'), (1, '1025.520')] +[2023-10-08 18:33:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000069184_70844416.pth... +[2023-10-08 18:33:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000069696_71368704.pth... +[2023-10-08 18:33:13,846][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000067584_69206016.pth +[2023-10-08 18:33:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000068096_69730304.pth +[2023-10-08 18:33:15,153][21195] Updated weights for policy 0, policy_version 69700 (0.0007) +[2023-10-08 18:33:15,515][21195] Updated weights for policy 0, policy_version 69710 (0.0010) +[2023-10-08 18:33:15,888][21195] Updated weights for policy 0, policy_version 69720 (0.0009) +[2023-10-08 18:33:16,532][21194] Updated weights for policy 1, policy_version 69190 (0.0008) +[2023-10-08 18:33:16,909][21194] Updated weights for policy 1, policy_version 69200 (0.0008) +[2023-10-08 18:33:17,280][21194] Updated weights for policy 1, policy_version 69210 (0.0008) +[2023-10-08 18:33:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 142278656. Throughput: 0: 1758.5, 1: 1753.3. Samples: 35578020. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:18,803][19739] Avg episode reward: [(0, '1046.450'), (1, '1025.520')] +[2023-10-08 18:33:19,754][21195] Updated weights for policy 0, policy_version 69730 (0.0008) +[2023-10-08 18:33:20,135][21195] Updated weights for policy 0, policy_version 69740 (0.0009) +[2023-10-08 18:33:20,502][21195] Updated weights for policy 0, policy_version 69750 (0.0008) +[2023-10-08 18:33:20,869][21195] Updated weights for policy 0, policy_version 69760 (0.0009) +[2023-10-08 18:33:21,109][21194] Updated weights for policy 1, policy_version 69220 (0.0009) +[2023-10-08 18:33:21,478][21194] Updated weights for policy 1, policy_version 69230 (0.0008) +[2023-10-08 18:33:21,850][21194] Updated weights for policy 1, policy_version 69240 (0.0010) +[2023-10-08 18:33:23,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 142344192. Throughput: 0: 1728.2, 1: 1725.5. Samples: 35592294. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:23,804][19739] Avg episode reward: [(0, '1046.450'), (1, '1025.520')] +[2023-10-08 18:33:24,703][21195] Updated weights for policy 0, policy_version 69770 (0.0007) +[2023-10-08 18:33:25,079][21195] Updated weights for policy 0, policy_version 69780 (0.0009) +[2023-10-08 18:33:25,457][21195] Updated weights for policy 0, policy_version 69790 (0.0009) +[2023-10-08 18:33:25,752][21194] Updated weights for policy 1, policy_version 69250 (0.0007) +[2023-10-08 18:33:26,113][21194] Updated weights for policy 1, policy_version 69260 (0.0007) +[2023-10-08 18:33:26,483][21194] Updated weights for policy 1, policy_version 69270 (0.0009) +[2023-10-08 18:33:26,851][21194] Updated weights for policy 1, policy_version 69280 (0.0009) +[2023-10-08 18:33:28,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 142409728. Throughput: 0: 1750.7, 1: 1720.3. Samples: 35613970. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:28,804][19739] Avg episode reward: [(0, '1056.300'), (1, '1025.520')] +[2023-10-08 18:33:28,815][20740] Saving new best policy, reward=1056.300! +[2023-10-08 18:33:29,289][21195] Updated weights for policy 0, policy_version 69800 (0.0008) +[2023-10-08 18:33:29,662][21195] Updated weights for policy 0, policy_version 69810 (0.0010) +[2023-10-08 18:33:30,028][21195] Updated weights for policy 0, policy_version 69820 (0.0009) +[2023-10-08 18:33:30,609][21194] Updated weights for policy 1, policy_version 69290 (0.0009) +[2023-10-08 18:33:30,974][21194] Updated weights for policy 1, policy_version 69300 (0.0010) +[2023-10-08 18:33:31,341][21194] Updated weights for policy 1, policy_version 69310 (0.0009) +[2023-10-08 18:33:33,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 142475264. Throughput: 0: 1757.8, 1: 1731.4. Samples: 35629880. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:33,803][19739] Avg episode reward: [(0, '1056.230'), (1, '1025.520')] +[2023-10-08 18:33:33,943][21195] Updated weights for policy 0, policy_version 69830 (0.0008) +[2023-10-08 18:33:34,311][21195] Updated weights for policy 0, policy_version 69840 (0.0007) +[2023-10-08 18:33:34,682][21195] Updated weights for policy 0, policy_version 69850 (0.0009) +[2023-10-08 18:33:35,257][21194] Updated weights for policy 1, policy_version 69320 (0.0007) +[2023-10-08 18:33:35,622][21194] Updated weights for policy 1, policy_version 69330 (0.0009) +[2023-10-08 18:33:35,979][21194] Updated weights for policy 1, policy_version 69340 (0.0009) +[2023-10-08 18:33:38,570][21195] Updated weights for policy 0, policy_version 69860 (0.0010) +[2023-10-08 18:33:38,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 142540800. Throughput: 0: 1742.7, 1: 1719.5. Samples: 35645310. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:38,804][19739] Avg episode reward: [(0, '1056.230'), (1, '1025.520')] +[2023-10-08 18:33:38,933][21195] Updated weights for policy 0, policy_version 69870 (0.0010) +[2023-10-08 18:33:39,296][21195] Updated weights for policy 0, policy_version 69880 (0.0010) +[2023-10-08 18:33:39,892][21194] Updated weights for policy 1, policy_version 69350 (0.0008) +[2023-10-08 18:33:40,253][21194] Updated weights for policy 1, policy_version 69360 (0.0011) +[2023-10-08 18:33:40,622][21194] Updated weights for policy 1, policy_version 69370 (0.0009) +[2023-10-08 18:33:43,170][21195] Updated weights for policy 0, policy_version 69890 (0.0010) +[2023-10-08 18:33:43,551][21195] Updated weights for policy 0, policy_version 69900 (0.0008) +[2023-10-08 18:33:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 142606336. Throughput: 0: 1758.3, 1: 1747.1. Samples: 35666774. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:43,803][19739] Avg episode reward: [(0, '1058.600'), (1, '1040.640')] +[2023-10-08 18:33:43,928][21195] Updated weights for policy 0, policy_version 69910 (0.0010) +[2023-10-08 18:33:44,287][20740] Saving new best policy, reward=1058.600! +[2023-10-08 18:33:44,288][21195] Updated weights for policy 0, policy_version 69920 (0.0008) +[2023-10-08 18:33:44,608][21194] Updated weights for policy 1, policy_version 69380 (0.0007) +[2023-10-08 18:33:45,004][21194] Updated weights for policy 1, policy_version 69390 (0.0009) +[2023-10-08 18:33:45,361][21194] Updated weights for policy 1, policy_version 69400 (0.0009) +[2023-10-08 18:33:48,073][21195] Updated weights for policy 0, policy_version 69930 (0.0009) +[2023-10-08 18:33:48,446][21195] Updated weights for policy 0, policy_version 69940 (0.0007) +[2023-10-08 18:33:48,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 142671872. Throughput: 0: 1731.0, 1: 1723.2. Samples: 35681046. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:48,803][19739] Avg episode reward: [(0, '1058.600'), (1, '1047.680')] +[2023-10-08 18:33:48,807][21195] Updated weights for policy 0, policy_version 69950 (0.0009) +[2023-10-08 18:33:49,164][21194] Updated weights for policy 1, policy_version 69410 (0.0008) +[2023-10-08 18:33:49,538][21194] Updated weights for policy 1, policy_version 69420 (0.0010) +[2023-10-08 18:33:49,909][21194] Updated weights for policy 1, policy_version 69430 (0.0010) +[2023-10-08 18:33:50,272][21194] Updated weights for policy 1, policy_version 69440 (0.0008) +[2023-10-08 18:33:52,800][21195] Updated weights for policy 0, policy_version 69960 (0.0008) +[2023-10-08 18:33:53,162][21195] Updated weights for policy 0, policy_version 69970 (0.0008) +[2023-10-08 18:33:53,527][21195] Updated weights for policy 0, policy_version 69980 (0.0009) +[2023-10-08 18:33:53,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 142770176. Throughput: 0: 1758.0, 1: 1730.8. Samples: 35697622. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:53,804][19739] Avg episode reward: [(0, '1058.600'), (1, '1047.680')] +[2023-10-08 18:33:54,202][21194] Updated weights for policy 1, policy_version 69450 (0.0007) +[2023-10-08 18:33:54,574][21194] Updated weights for policy 1, policy_version 69460 (0.0008) +[2023-10-08 18:33:54,944][21194] Updated weights for policy 1, policy_version 69470 (0.0007) +[2023-10-08 18:33:57,531][21195] Updated weights for policy 0, policy_version 69990 (0.0009) +[2023-10-08 18:33:57,906][21195] Updated weights for policy 0, policy_version 70000 (0.0007) +[2023-10-08 18:33:58,279][21195] Updated weights for policy 0, policy_version 70010 (0.0007) +[2023-10-08 18:33:58,776][21194] Updated weights for policy 1, policy_version 69480 (0.0011) +[2023-10-08 18:33:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 142835712. Throughput: 0: 1741.4, 1: 1756.5. Samples: 35718770. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:33:58,803][19739] Avg episode reward: [(0, '1073.050'), (1, '1047.680')] +[2023-10-08 18:33:58,813][20740] Saving new best policy, reward=1073.050! +[2023-10-08 18:33:59,152][21194] Updated weights for policy 1, policy_version 69490 (0.0009) +[2023-10-08 18:33:59,516][21194] Updated weights for policy 1, policy_version 69500 (0.0007) +[2023-10-08 18:34:02,116][21195] Updated weights for policy 0, policy_version 70020 (0.0007) +[2023-10-08 18:34:02,487][21195] Updated weights for policy 0, policy_version 70030 (0.0009) +[2023-10-08 18:34:02,856][21195] Updated weights for policy 0, policy_version 70040 (0.0008) +[2023-10-08 18:34:03,367][21194] Updated weights for policy 1, policy_version 69510 (0.0008) +[2023-10-08 18:34:03,739][21194] Updated weights for policy 1, policy_version 69520 (0.0008) +[2023-10-08 18:34:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 142901248. Throughput: 0: 1730.7, 1: 1726.4. Samples: 35733590. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:34:03,803][19739] Avg episode reward: [(0, '1086.310'), (1, '1047.680')] +[2023-10-08 18:34:03,804][20740] Saving new best policy, reward=1086.310! +[2023-10-08 18:34:04,097][21194] Updated weights for policy 1, policy_version 69530 (0.0007) +[2023-10-08 18:34:06,879][21195] Updated weights for policy 0, policy_version 70050 (0.0009) +[2023-10-08 18:34:07,243][21195] Updated weights for policy 0, policy_version 70060 (0.0011) +[2023-10-08 18:34:07,610][21195] Updated weights for policy 0, policy_version 70070 (0.0009) +[2023-10-08 18:34:07,982][21195] Updated weights for policy 0, policy_version 70080 (0.0009) +[2023-10-08 18:34:08,269][21194] Updated weights for policy 1, policy_version 69540 (0.0010) +[2023-10-08 18:34:08,640][21194] Updated weights for policy 1, policy_version 69550 (0.0009) +[2023-10-08 18:34:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 142966784. Throughput: 0: 1756.3, 1: 1752.2. Samples: 35750174. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:34:08,803][19739] Avg episode reward: [(0, '1086.310'), (1, '1047.680')] +[2023-10-08 18:34:09,016][21194] Updated weights for policy 1, policy_version 69560 (0.0008) +[2023-10-08 18:34:11,823][21195] Updated weights for policy 0, policy_version 70090 (0.0009) +[2023-10-08 18:34:12,188][21195] Updated weights for policy 0, policy_version 70100 (0.0008) +[2023-10-08 18:34:12,559][21195] Updated weights for policy 0, policy_version 70110 (0.0009) +[2023-10-08 18:34:12,812][21194] Updated weights for policy 1, policy_version 69570 (0.0009) +[2023-10-08 18:34:13,182][21194] Updated weights for policy 1, policy_version 69580 (0.0007) +[2023-10-08 18:34:13,539][21194] Updated weights for policy 1, policy_version 69590 (0.0007) +[2023-10-08 18:34:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 143032320. Throughput: 0: 1722.8, 1: 1747.0. Samples: 35770110. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:34:13,803][19739] Avg episode reward: [(0, '1086.310'), (1, '1047.680')] +[2023-10-08 18:34:13,909][21194] Updated weights for policy 1, policy_version 69600 (0.0008) +[2023-10-08 18:34:16,416][21195] Updated weights for policy 0, policy_version 70120 (0.0010) +[2023-10-08 18:34:16,784][21195] Updated weights for policy 0, policy_version 70130 (0.0008) +[2023-10-08 18:34:17,157][21195] Updated weights for policy 0, policy_version 70140 (0.0008) +[2023-10-08 18:34:17,861][21194] Updated weights for policy 1, policy_version 69610 (0.0011) +[2023-10-08 18:34:18,229][21194] Updated weights for policy 1, policy_version 69620 (0.0008) +[2023-10-08 18:34:18,590][21194] Updated weights for policy 1, policy_version 69630 (0.0007) +[2023-10-08 18:34:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 143130624. Throughput: 0: 1719.7, 1: 1744.1. Samples: 35785750. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:34:18,803][19739] Avg episode reward: [(0, '1086.310'), (1, '1063.160')] +[2023-10-08 18:34:21,079][21195] Updated weights for policy 0, policy_version 70150 (0.0010) +[2023-10-08 18:34:21,441][21195] Updated weights for policy 0, policy_version 70160 (0.0007) +[2023-10-08 18:34:21,821][21195] Updated weights for policy 0, policy_version 70170 (0.0008) +[2023-10-08 18:34:22,564][21194] Updated weights for policy 1, policy_version 69640 (0.0009) +[2023-10-08 18:34:22,933][21194] Updated weights for policy 1, policy_version 69650 (0.0009) +[2023-10-08 18:34:23,306][21194] Updated weights for policy 1, policy_version 69660 (0.0008) +[2023-10-08 18:34:23,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 143196160. Throughput: 0: 1723.1, 1: 1745.6. Samples: 35801402. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:34:23,804][19739] Avg episode reward: [(0, '1085.390'), (1, '1063.160')] +[2023-10-08 18:34:25,744][21195] Updated weights for policy 0, policy_version 70180 (0.0009) +[2023-10-08 18:34:26,108][21195] Updated weights for policy 0, policy_version 70190 (0.0007) +[2023-10-08 18:34:26,481][21195] Updated weights for policy 0, policy_version 70200 (0.0009) +[2023-10-08 18:34:27,167][21194] Updated weights for policy 1, policy_version 69670 (0.0007) +[2023-10-08 18:34:27,546][21194] Updated weights for policy 1, policy_version 69680 (0.0009) +[2023-10-08 18:34:27,915][21194] Updated weights for policy 1, policy_version 69690 (0.0008) +[2023-10-08 18:34:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 143261696. Throughput: 0: 1715.7, 1: 1718.8. Samples: 35821330. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:28,803][19739] Avg episode reward: [(0, '1085.390'), (1, '1063.160')] +[2023-10-08 18:34:30,497][21195] Updated weights for policy 0, policy_version 70210 (0.0011) +[2023-10-08 18:34:30,895][21195] Updated weights for policy 0, policy_version 70220 (0.0009) +[2023-10-08 18:34:31,267][21195] Updated weights for policy 0, policy_version 70230 (0.0007) +[2023-10-08 18:34:31,635][21195] Updated weights for policy 0, policy_version 70240 (0.0009) +[2023-10-08 18:34:31,882][21194] Updated weights for policy 1, policy_version 69700 (0.0008) +[2023-10-08 18:34:32,266][21194] Updated weights for policy 1, policy_version 69710 (0.0008) +[2023-10-08 18:34:32,628][21194] Updated weights for policy 1, policy_version 69720 (0.0007) +[2023-10-08 18:34:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 143327232. Throughput: 0: 1735.9, 1: 1743.3. Samples: 35837610. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:33,804][19739] Avg episode reward: [(0, '1085.390'), (1, '1063.160')] +[2023-10-08 18:34:35,460][21195] Updated weights for policy 0, policy_version 70250 (0.0008) +[2023-10-08 18:34:35,818][21195] Updated weights for policy 0, policy_version 70260 (0.0007) +[2023-10-08 18:34:36,184][21195] Updated weights for policy 0, policy_version 70270 (0.0007) +[2023-10-08 18:34:36,650][21194] Updated weights for policy 1, policy_version 69730 (0.0007) +[2023-10-08 18:34:37,014][21194] Updated weights for policy 1, policy_version 69740 (0.0008) +[2023-10-08 18:34:37,378][21194] Updated weights for policy 1, policy_version 69750 (0.0007) +[2023-10-08 18:34:37,741][21194] Updated weights for policy 1, policy_version 69760 (0.0007) +[2023-10-08 18:34:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 143392768. Throughput: 0: 1710.3, 1: 1732.8. Samples: 35852562. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:38,803][19739] Avg episode reward: [(0, '1085.390'), (1, '1063.040')] +[2023-10-08 18:34:40,163][21195] Updated weights for policy 0, policy_version 70280 (0.0011) +[2023-10-08 18:34:40,527][21195] Updated weights for policy 0, policy_version 70290 (0.0009) +[2023-10-08 18:34:40,899][21195] Updated weights for policy 0, policy_version 70300 (0.0010) +[2023-10-08 18:34:41,751][21194] Updated weights for policy 1, policy_version 69770 (0.0009) +[2023-10-08 18:34:42,111][21194] Updated weights for policy 1, policy_version 69780 (0.0009) +[2023-10-08 18:34:42,481][21194] Updated weights for policy 1, policy_version 69790 (0.0009) +[2023-10-08 18:34:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 143458304. Throughput: 0: 1736.7, 1: 1708.6. Samples: 35873808. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:43,804][19739] Avg episode reward: [(0, '1085.390'), (1, '1063.040')] +[2023-10-08 18:34:44,780][21195] Updated weights for policy 0, policy_version 70310 (0.0008) +[2023-10-08 18:34:45,142][21195] Updated weights for policy 0, policy_version 70320 (0.0009) +[2023-10-08 18:34:45,512][21195] Updated weights for policy 0, policy_version 70330 (0.0010) +[2023-10-08 18:34:46,443][21194] Updated weights for policy 1, policy_version 69800 (0.0011) +[2023-10-08 18:34:46,817][21194] Updated weights for policy 1, policy_version 69810 (0.0010) +[2023-10-08 18:34:47,184][21194] Updated weights for policy 1, policy_version 69820 (0.0011) +[2023-10-08 18:34:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 143523840. Throughput: 0: 1755.1, 1: 1734.5. Samples: 35890624. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:48,803][19739] Avg episode reward: [(0, '1099.780'), (1, '1063.040')] +[2023-10-08 18:34:48,804][20740] Saving new best policy, reward=1099.780! +[2023-10-08 18:34:49,548][21195] Updated weights for policy 0, policy_version 70340 (0.0008) +[2023-10-08 18:34:49,914][21195] Updated weights for policy 0, policy_version 70350 (0.0007) +[2023-10-08 18:34:50,283][21195] Updated weights for policy 0, policy_version 70360 (0.0008) +[2023-10-08 18:34:51,273][21194] Updated weights for policy 1, policy_version 69830 (0.0008) +[2023-10-08 18:34:51,644][21194] Updated weights for policy 1, policy_version 69840 (0.0008) +[2023-10-08 18:34:52,013][21194] Updated weights for policy 1, policy_version 69850 (0.0009) +[2023-10-08 18:34:53,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 143589376. Throughput: 0: 1731.4, 1: 1698.7. Samples: 35904528. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:53,803][19739] Avg episode reward: [(0, '1090.590'), (1, '1063.690')] +[2023-10-08 18:34:54,017][21195] Updated weights for policy 0, policy_version 70370 (0.0009) +[2023-10-08 18:34:54,401][21195] Updated weights for policy 0, policy_version 70380 (0.0008) +[2023-10-08 18:34:54,761][21195] Updated weights for policy 0, policy_version 70390 (0.0007) +[2023-10-08 18:34:55,128][21195] Updated weights for policy 0, policy_version 70400 (0.0007) +[2023-10-08 18:34:55,936][21194] Updated weights for policy 1, policy_version 69860 (0.0008) +[2023-10-08 18:34:56,297][21194] Updated weights for policy 1, policy_version 69870 (0.0008) +[2023-10-08 18:34:56,658][21194] Updated weights for policy 1, policy_version 69880 (0.0008) +[2023-10-08 18:34:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 143654912. Throughput: 0: 1764.4, 1: 1699.0. Samples: 35925966. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:34:58,803][19739] Avg episode reward: [(0, '1090.590'), (1, '1063.690')] +[2023-10-08 18:34:58,872][21195] Updated weights for policy 0, policy_version 70410 (0.0008) +[2023-10-08 18:34:59,246][21195] Updated weights for policy 0, policy_version 70420 (0.0010) +[2023-10-08 18:34:59,614][21195] Updated weights for policy 0, policy_version 70430 (0.0009) +[2023-10-08 18:35:00,571][21194] Updated weights for policy 1, policy_version 69890 (0.0009) +[2023-10-08 18:35:00,937][21194] Updated weights for policy 1, policy_version 69900 (0.0010) +[2023-10-08 18:35:01,302][21194] Updated weights for policy 1, policy_version 69910 (0.0011) +[2023-10-08 18:35:01,669][21194] Updated weights for policy 1, policy_version 69920 (0.0011) +[2023-10-08 18:35:03,492][21195] Updated weights for policy 0, policy_version 70440 (0.0007) +[2023-10-08 18:35:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 143720448. Throughput: 0: 1755.0, 1: 1708.1. Samples: 35941590. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:35:03,803][19739] Avg episode reward: [(0, '1090.590'), (1, '1063.690')] +[2023-10-08 18:35:03,853][21195] Updated weights for policy 0, policy_version 70450 (0.0010) +[2023-10-08 18:35:04,220][21195] Updated weights for policy 0, policy_version 70460 (0.0009) +[2023-10-08 18:35:05,708][21194] Updated weights for policy 1, policy_version 69930 (0.0009) +[2023-10-08 18:35:06,075][21194] Updated weights for policy 1, policy_version 69940 (0.0008) +[2023-10-08 18:35:06,443][21194] Updated weights for policy 1, policy_version 69950 (0.0008) +[2023-10-08 18:35:08,231][21195] Updated weights for policy 0, policy_version 70470 (0.0009) +[2023-10-08 18:35:08,604][21195] Updated weights for policy 0, policy_version 70480 (0.0007) +[2023-10-08 18:35:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 143785984. Throughput: 0: 1758.4, 1: 1690.6. Samples: 35956608. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:35:08,803][19739] Avg episode reward: [(0, '1090.590'), (1, '1063.690')] +[2023-10-08 18:35:08,977][21195] Updated weights for policy 0, policy_version 70490 (0.0008) +[2023-10-08 18:35:10,429][21194] Updated weights for policy 1, policy_version 69960 (0.0008) +[2023-10-08 18:35:10,792][21194] Updated weights for policy 1, policy_version 69970 (0.0007) +[2023-10-08 18:35:11,170][21194] Updated weights for policy 1, policy_version 69980 (0.0009) +[2023-10-08 18:35:12,818][21195] Updated weights for policy 0, policy_version 70500 (0.0008) +[2023-10-08 18:35:13,181][21195] Updated weights for policy 0, policy_version 70510 (0.0010) +[2023-10-08 18:35:13,553][21195] Updated weights for policy 0, policy_version 70520 (0.0008) +[2023-10-08 18:35:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 143851520. Throughput: 0: 1765.4, 1: 1713.4. Samples: 35977876. Policy #0 lag: (min: 31.0, avg: 32.0, max: 52.0) +[2023-10-08 18:35:13,804][19739] Avg episode reward: [(0, '1090.590'), (1, '1063.690')] +[2023-10-08 18:35:13,815][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000069984_71663616.pth... +[2023-10-08 18:35:13,847][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000070528_72220672.pth... +[2023-10-08 18:35:13,850][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000068384_70025216.pth +[2023-10-08 18:35:13,876][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000068896_70549504.pth +[2023-10-08 18:35:15,152][21194] Updated weights for policy 1, policy_version 69990 (0.0008) +[2023-10-08 18:35:15,517][21194] Updated weights for policy 1, policy_version 70000 (0.0009) +[2023-10-08 18:35:15,885][21194] Updated weights for policy 1, policy_version 70010 (0.0008) +[2023-10-08 18:35:17,506][21195] Updated weights for policy 0, policy_version 70530 (0.0008) +[2023-10-08 18:35:17,916][21195] Updated weights for policy 0, policy_version 70540 (0.0007) +[2023-10-08 18:35:18,282][21195] Updated weights for policy 0, policy_version 70550 (0.0008) +[2023-10-08 18:35:18,647][21195] Updated weights for policy 0, policy_version 70560 (0.0007) +[2023-10-08 18:35:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 143949824. Throughput: 0: 1741.9, 1: 1693.9. Samples: 35992222. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:18,803][19739] Avg episode reward: [(0, '1090.590'), (1, '1063.690')] +[2023-10-08 18:35:19,670][21194] Updated weights for policy 1, policy_version 70020 (0.0008) +[2023-10-08 18:35:20,033][21194] Updated weights for policy 1, policy_version 70030 (0.0007) +[2023-10-08 18:35:20,403][21194] Updated weights for policy 1, policy_version 70040 (0.0007) +[2023-10-08 18:35:22,545][21195] Updated weights for policy 0, policy_version 70570 (0.0008) +[2023-10-08 18:35:22,911][21195] Updated weights for policy 0, policy_version 70580 (0.0009) +[2023-10-08 18:35:23,279][21195] Updated weights for policy 0, policy_version 70590 (0.0010) +[2023-10-08 18:35:23,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 144015360. Throughput: 0: 1770.9, 1: 1702.9. Samples: 36008884. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:23,803][19739] Avg episode reward: [(0, '1067.710'), (1, '1079.050')] +[2023-10-08 18:35:24,491][21194] Updated weights for policy 1, policy_version 70050 (0.0008) +[2023-10-08 18:35:24,884][21194] Updated weights for policy 1, policy_version 70060 (0.0008) +[2023-10-08 18:35:25,244][21194] Updated weights for policy 1, policy_version 70070 (0.0007) +[2023-10-08 18:35:25,612][21194] Updated weights for policy 1, policy_version 70080 (0.0009) +[2023-10-08 18:35:27,111][21195] Updated weights for policy 0, policy_version 70600 (0.0007) +[2023-10-08 18:35:27,478][21195] Updated weights for policy 0, policy_version 70610 (0.0008) +[2023-10-08 18:35:27,840][21195] Updated weights for policy 0, policy_version 70620 (0.0008) +[2023-10-08 18:35:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 144080896. Throughput: 0: 1734.5, 1: 1719.0. Samples: 36029214. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:28,803][19739] Avg episode reward: [(0, '1067.710'), (1, '1079.050')] +[2023-10-08 18:35:29,612][21194] Updated weights for policy 1, policy_version 70090 (0.0007) +[2023-10-08 18:35:29,969][21194] Updated weights for policy 1, policy_version 70100 (0.0008) +[2023-10-08 18:35:30,342][21194] Updated weights for policy 1, policy_version 70110 (0.0009) +[2023-10-08 18:35:31,792][21195] Updated weights for policy 0, policy_version 70630 (0.0009) +[2023-10-08 18:35:32,170][21195] Updated weights for policy 0, policy_version 70640 (0.0008) +[2023-10-08 18:35:32,532][21195] Updated weights for policy 0, policy_version 70650 (0.0008) +[2023-10-08 18:35:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 144146432. Throughput: 0: 1728.4, 1: 1691.3. Samples: 36044510. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:33,803][19739] Avg episode reward: [(0, '1067.710'), (1, '1079.050')] +[2023-10-08 18:35:34,214][21194] Updated weights for policy 1, policy_version 70120 (0.0009) +[2023-10-08 18:35:34,577][21194] Updated weights for policy 1, policy_version 70130 (0.0007) +[2023-10-08 18:35:34,949][21194] Updated weights for policy 1, policy_version 70140 (0.0008) +[2023-10-08 18:35:36,241][21195] Updated weights for policy 0, policy_version 70660 (0.0008) +[2023-10-08 18:35:36,603][21195] Updated weights for policy 0, policy_version 70670 (0.0009) +[2023-10-08 18:35:36,968][21195] Updated weights for policy 0, policy_version 70680 (0.0008) +[2023-10-08 18:35:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 144211968. Throughput: 0: 1743.9, 1: 1720.4. Samples: 36060422. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:38,803][19739] Avg episode reward: [(0, '1067.710'), (1, '1079.050')] +[2023-10-08 18:35:38,950][21194] Updated weights for policy 1, policy_version 70150 (0.0009) +[2023-10-08 18:35:39,316][21194] Updated weights for policy 1, policy_version 70160 (0.0008) +[2023-10-08 18:35:39,679][21194] Updated weights for policy 1, policy_version 70170 (0.0009) +[2023-10-08 18:35:40,746][21195] Updated weights for policy 0, policy_version 70690 (0.0007) +[2023-10-08 18:35:41,103][21195] Updated weights for policy 0, policy_version 70700 (0.0009) +[2023-10-08 18:35:41,481][21195] Updated weights for policy 0, policy_version 70710 (0.0007) +[2023-10-08 18:35:41,852][21195] Updated weights for policy 0, policy_version 70720 (0.0007) +[2023-10-08 18:35:43,691][21194] Updated weights for policy 1, policy_version 70180 (0.0008) +[2023-10-08 18:35:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 144277504. Throughput: 0: 1727.6, 1: 1727.2. Samples: 36081432. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:43,803][19739] Avg episode reward: [(0, '1067.710'), (1, '1106.100')] +[2023-10-08 18:35:44,056][21194] Updated weights for policy 1, policy_version 70190 (0.0009) +[2023-10-08 18:35:44,419][21194] Updated weights for policy 1, policy_version 70200 (0.0008) +[2023-10-08 18:35:44,706][20836] Saving new best policy, reward=1106.100! +[2023-10-08 18:35:45,657][21195] Updated weights for policy 0, policy_version 70730 (0.0008) +[2023-10-08 18:35:46,025][21195] Updated weights for policy 0, policy_version 70740 (0.0008) +[2023-10-08 18:35:46,397][21195] Updated weights for policy 0, policy_version 70750 (0.0008) +[2023-10-08 18:35:48,268][21194] Updated weights for policy 1, policy_version 70210 (0.0008) +[2023-10-08 18:35:48,634][21194] Updated weights for policy 1, policy_version 70220 (0.0008) +[2023-10-08 18:35:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 144343040. Throughput: 0: 1747.7, 1: 1710.4. Samples: 36097204. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:48,805][19739] Avg episode reward: [(0, '1067.710'), (1, '1106.100')] +[2023-10-08 18:35:48,991][21194] Updated weights for policy 1, policy_version 70230 (0.0008) +[2023-10-08 18:35:49,355][21194] Updated weights for policy 1, policy_version 70240 (0.0008) +[2023-10-08 18:35:50,281][21195] Updated weights for policy 0, policy_version 70760 (0.0009) +[2023-10-08 18:35:50,645][21195] Updated weights for policy 0, policy_version 70770 (0.0008) +[2023-10-08 18:35:51,011][21195] Updated weights for policy 0, policy_version 70780 (0.0007) +[2023-10-08 18:35:53,398][21194] Updated weights for policy 1, policy_version 70250 (0.0008) +[2023-10-08 18:35:53,756][21194] Updated weights for policy 1, policy_version 70260 (0.0007) +[2023-10-08 18:35:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 144408576. Throughput: 0: 1736.8, 1: 1728.1. Samples: 36112528. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:53,803][19739] Avg episode reward: [(0, '1067.710'), (1, '1106.100')] +[2023-10-08 18:35:54,132][21194] Updated weights for policy 1, policy_version 70270 (0.0009) +[2023-10-08 18:35:54,877][21195] Updated weights for policy 0, policy_version 70790 (0.0007) +[2023-10-08 18:35:55,241][21195] Updated weights for policy 0, policy_version 70800 (0.0009) +[2023-10-08 18:35:55,613][21195] Updated weights for policy 0, policy_version 70810 (0.0010) +[2023-10-08 18:35:58,189][21194] Updated weights for policy 1, policy_version 70280 (0.0009) +[2023-10-08 18:35:58,566][21194] Updated weights for policy 1, policy_version 70290 (0.0010) +[2023-10-08 18:35:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 144474112. Throughput: 0: 1745.9, 1: 1720.6. Samples: 36133868. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 18:35:58,804][19739] Avg episode reward: [(0, '1067.710'), (1, '1114.230')] +[2023-10-08 18:35:58,932][21194] Updated weights for policy 1, policy_version 70300 (0.0008) +[2023-10-08 18:35:59,076][20836] Saving new best policy, reward=1114.230! +[2023-10-08 18:35:59,436][21195] Updated weights for policy 0, policy_version 70820 (0.0008) +[2023-10-08 18:35:59,799][21195] Updated weights for policy 0, policy_version 70830 (0.0008) +[2023-10-08 18:36:00,162][21195] Updated weights for policy 0, policy_version 70840 (0.0008) +[2023-10-08 18:36:02,931][21194] Updated weights for policy 1, policy_version 70310 (0.0009) +[2023-10-08 18:36:03,298][21194] Updated weights for policy 1, policy_version 70320 (0.0009) +[2023-10-08 18:36:03,658][21194] Updated weights for policy 1, policy_version 70330 (0.0008) +[2023-10-08 18:36:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 144539648. Throughput: 0: 1775.5, 1: 1721.3. Samples: 36149576. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:03,803][19739] Avg episode reward: [(0, '1098.240'), (1, '1114.360')] +[2023-10-08 18:36:03,876][20836] Saving new best policy, reward=1114.360! +[2023-10-08 18:36:04,257][21195] Updated weights for policy 0, policy_version 70850 (0.0007) +[2023-10-08 18:36:04,652][21195] Updated weights for policy 0, policy_version 70860 (0.0007) +[2023-10-08 18:36:05,019][21195] Updated weights for policy 0, policy_version 70870 (0.0008) +[2023-10-08 18:36:05,384][21195] Updated weights for policy 0, policy_version 70880 (0.0011) +[2023-10-08 18:36:07,704][21194] Updated weights for policy 1, policy_version 70340 (0.0008) +[2023-10-08 18:36:08,077][21194] Updated weights for policy 1, policy_version 70350 (0.0007) +[2023-10-08 18:36:08,453][21194] Updated weights for policy 1, policy_version 70360 (0.0007) +[2023-10-08 18:36:08,802][19739] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 144637952. Throughput: 0: 1743.2, 1: 1725.3. Samples: 36164968. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:08,803][19739] Avg episode reward: [(0, '1098.240'), (1, '1114.240')] +[2023-10-08 18:36:09,073][21195] Updated weights for policy 0, policy_version 70890 (0.0008) +[2023-10-08 18:36:09,433][21195] Updated weights for policy 0, policy_version 70900 (0.0009) +[2023-10-08 18:36:09,807][21195] Updated weights for policy 0, policy_version 70910 (0.0009) +[2023-10-08 18:36:12,311][21194] Updated weights for policy 1, policy_version 70370 (0.0008) +[2023-10-08 18:36:12,720][21194] Updated weights for policy 1, policy_version 70380 (0.0007) +[2023-10-08 18:36:13,087][21194] Updated weights for policy 1, policy_version 70390 (0.0008) +[2023-10-08 18:36:13,454][21194] Updated weights for policy 1, policy_version 70400 (0.0007) +[2023-10-08 18:36:13,765][21195] Updated weights for policy 0, policy_version 70920 (0.0008) +[2023-10-08 18:36:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 144703488. Throughput: 0: 1766.0, 1: 1708.1. Samples: 36185546. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:13,803][19739] Avg episode reward: [(0, '1098.240'), (1, '1114.240')] +[2023-10-08 18:36:14,133][21195] Updated weights for policy 0, policy_version 70930 (0.0008) +[2023-10-08 18:36:14,497][21195] Updated weights for policy 0, policy_version 70940 (0.0007) +[2023-10-08 18:36:17,446][21194] Updated weights for policy 1, policy_version 70410 (0.0007) +[2023-10-08 18:36:17,814][21194] Updated weights for policy 1, policy_version 70420 (0.0009) +[2023-10-08 18:36:18,183][21194] Updated weights for policy 1, policy_version 70430 (0.0010) +[2023-10-08 18:36:18,370][21195] Updated weights for policy 0, policy_version 70950 (0.0007) +[2023-10-08 18:36:18,749][21195] Updated weights for policy 0, policy_version 70960 (0.0007) +[2023-10-08 18:36:18,802][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 144769024. Throughput: 0: 1757.5, 1: 1724.9. Samples: 36201218. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:18,803][19739] Avg episode reward: [(0, '1098.240'), (1, '1098.740')] +[2023-10-08 18:36:19,109][21195] Updated weights for policy 0, policy_version 70970 (0.0007) +[2023-10-08 18:36:21,952][21194] Updated weights for policy 1, policy_version 70440 (0.0009) +[2023-10-08 18:36:22,325][21194] Updated weights for policy 1, policy_version 70450 (0.0010) +[2023-10-08 18:36:22,695][21194] Updated weights for policy 1, policy_version 70460 (0.0008) +[2023-10-08 18:36:23,026][21195] Updated weights for policy 0, policy_version 70980 (0.0010) +[2023-10-08 18:36:23,384][21195] Updated weights for policy 0, policy_version 70990 (0.0009) +[2023-10-08 18:36:23,758][21195] Updated weights for policy 0, policy_version 71000 (0.0011) +[2023-10-08 18:36:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 144834560. Throughput: 0: 1757.6, 1: 1720.7. Samples: 36216944. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:23,804][19739] Avg episode reward: [(0, '1098.240'), (1, '1084.160')] +[2023-10-08 18:36:26,548][21194] Updated weights for policy 1, policy_version 70470 (0.0009) +[2023-10-08 18:36:26,902][21194] Updated weights for policy 1, policy_version 70480 (0.0007) +[2023-10-08 18:36:27,273][21194] Updated weights for policy 1, policy_version 70490 (0.0007) +[2023-10-08 18:36:27,677][21195] Updated weights for policy 0, policy_version 71010 (0.0009) +[2023-10-08 18:36:28,046][21195] Updated weights for policy 0, policy_version 71020 (0.0011) +[2023-10-08 18:36:28,414][21195] Updated weights for policy 0, policy_version 71030 (0.0010) +[2023-10-08 18:36:28,783][21195] Updated weights for policy 0, policy_version 71040 (0.0007) +[2023-10-08 18:36:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 144932864. Throughput: 0: 1763.5, 1: 1711.6. Samples: 36237812. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:28,803][19739] Avg episode reward: [(0, '1098.240'), (1, '1084.160')] +[2023-10-08 18:36:31,048][21194] Updated weights for policy 1, policy_version 70500 (0.0007) +[2023-10-08 18:36:31,403][21194] Updated weights for policy 1, policy_version 70510 (0.0007) +[2023-10-08 18:36:31,774][21194] Updated weights for policy 1, policy_version 70520 (0.0009) +[2023-10-08 18:36:32,645][21195] Updated weights for policy 0, policy_version 71050 (0.0010) +[2023-10-08 18:36:33,024][21195] Updated weights for policy 0, policy_version 71060 (0.0009) +[2023-10-08 18:36:33,388][21195] Updated weights for policy 0, policy_version 71070 (0.0008) +[2023-10-08 18:36:33,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 144998400. Throughput: 0: 1732.3, 1: 1736.5. Samples: 36253300. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:33,803][19739] Avg episode reward: [(0, '1098.240'), (1, '1099.400')] +[2023-10-08 18:36:35,782][21194] Updated weights for policy 1, policy_version 70530 (0.0007) +[2023-10-08 18:36:36,143][21194] Updated weights for policy 1, policy_version 70540 (0.0008) +[2023-10-08 18:36:36,504][21194] Updated weights for policy 1, policy_version 70550 (0.0009) +[2023-10-08 18:36:36,868][21194] Updated weights for policy 1, policy_version 70560 (0.0008) +[2023-10-08 18:36:37,217][21195] Updated weights for policy 0, policy_version 71080 (0.0008) +[2023-10-08 18:36:37,580][21195] Updated weights for policy 0, policy_version 71090 (0.0008) +[2023-10-08 18:36:37,952][21195] Updated weights for policy 0, policy_version 71100 (0.0007) +[2023-10-08 18:36:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 145063936. Throughput: 0: 1764.7, 1: 1712.4. Samples: 36268996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:38,803][19739] Avg episode reward: [(0, '1098.440'), (1, '1099.400')] +[2023-10-08 18:36:40,809][21194] Updated weights for policy 1, policy_version 70570 (0.0010) +[2023-10-08 18:36:41,173][21194] Updated weights for policy 1, policy_version 70580 (0.0007) +[2023-10-08 18:36:41,537][21194] Updated weights for policy 1, policy_version 70590 (0.0009) +[2023-10-08 18:36:41,762][21195] Updated weights for policy 0, policy_version 71110 (0.0007) +[2023-10-08 18:36:42,136][21195] Updated weights for policy 0, policy_version 71120 (0.0007) +[2023-10-08 18:36:42,499][21195] Updated weights for policy 0, policy_version 71130 (0.0008) +[2023-10-08 18:36:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 145129472. Throughput: 0: 1729.2, 1: 1724.8. Samples: 36289296. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:36:43,803][19739] Avg episode reward: [(0, '1098.440'), (1, '1099.400')] +[2023-10-08 18:36:45,383][21194] Updated weights for policy 1, policy_version 70600 (0.0008) +[2023-10-08 18:36:45,742][21194] Updated weights for policy 1, policy_version 70610 (0.0010) +[2023-10-08 18:36:46,101][21194] Updated weights for policy 1, policy_version 70620 (0.0007) +[2023-10-08 18:36:46,355][21195] Updated weights for policy 0, policy_version 71140 (0.0010) +[2023-10-08 18:36:46,727][21195] Updated weights for policy 0, policy_version 71150 (0.0008) +[2023-10-08 18:36:47,098][21195] Updated weights for policy 0, policy_version 71160 (0.0008) +[2023-10-08 18:36:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 145195008. Throughput: 0: 1728.2, 1: 1726.6. Samples: 36305042. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:36:48,803][19739] Avg episode reward: [(0, '1098.440'), (1, '1099.400')] +[2023-10-08 18:36:50,242][21194] Updated weights for policy 1, policy_version 70630 (0.0008) +[2023-10-08 18:36:50,602][21194] Updated weights for policy 1, policy_version 70640 (0.0009) +[2023-10-08 18:36:50,971][21194] Updated weights for policy 1, policy_version 70650 (0.0008) +[2023-10-08 18:36:51,060][21195] Updated weights for policy 0, policy_version 71170 (0.0009) +[2023-10-08 18:36:51,432][21195] Updated weights for policy 0, policy_version 71180 (0.0007) +[2023-10-08 18:36:51,799][21195] Updated weights for policy 0, policy_version 71190 (0.0007) +[2023-10-08 18:36:52,173][21195] Updated weights for policy 0, policy_version 71200 (0.0007) +[2023-10-08 18:36:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 145260544. Throughput: 0: 1740.5, 1: 1721.9. Samples: 36320778. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:36:53,804][19739] Avg episode reward: [(0, '1098.490'), (1, '1114.350')] +[2023-10-08 18:36:54,941][21194] Updated weights for policy 1, policy_version 70660 (0.0008) +[2023-10-08 18:36:55,309][21194] Updated weights for policy 1, policy_version 70670 (0.0009) +[2023-10-08 18:36:55,671][21194] Updated weights for policy 1, policy_version 70680 (0.0009) +[2023-10-08 18:36:56,169][21195] Updated weights for policy 0, policy_version 71210 (0.0007) +[2023-10-08 18:36:56,539][21195] Updated weights for policy 0, policy_version 71220 (0.0008) +[2023-10-08 18:36:56,912][21195] Updated weights for policy 0, policy_version 71230 (0.0008) +[2023-10-08 18:36:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 145326080. Throughput: 0: 1726.0, 1: 1739.2. Samples: 36341482. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:36:58,803][19739] Avg episode reward: [(0, '1098.490'), (1, '1114.350')] +[2023-10-08 18:36:59,577][21194] Updated weights for policy 1, policy_version 70690 (0.0007) +[2023-10-08 18:36:59,942][21194] Updated weights for policy 1, policy_version 70700 (0.0008) +[2023-10-08 18:37:00,313][21194] Updated weights for policy 1, policy_version 70710 (0.0009) +[2023-10-08 18:37:00,667][21194] Updated weights for policy 1, policy_version 70720 (0.0008) +[2023-10-08 18:37:00,780][21195] Updated weights for policy 0, policy_version 71240 (0.0009) +[2023-10-08 18:37:01,148][21195] Updated weights for policy 0, policy_version 71250 (0.0010) +[2023-10-08 18:37:01,526][21195] Updated weights for policy 0, policy_version 71260 (0.0008) +[2023-10-08 18:37:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 145391616. Throughput: 0: 1744.3, 1: 1721.6. Samples: 36357182. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:03,803][19739] Avg episode reward: [(0, '1098.490'), (1, '1114.350')] +[2023-10-08 18:37:04,599][21194] Updated weights for policy 1, policy_version 70730 (0.0009) +[2023-10-08 18:37:04,965][21194] Updated weights for policy 1, policy_version 70740 (0.0007) +[2023-10-08 18:37:05,338][21194] Updated weights for policy 1, policy_version 70750 (0.0008) +[2023-10-08 18:37:05,429][21195] Updated weights for policy 0, policy_version 71270 (0.0009) +[2023-10-08 18:37:05,794][21195] Updated weights for policy 0, policy_version 71280 (0.0009) +[2023-10-08 18:37:06,161][21195] Updated weights for policy 0, policy_version 71290 (0.0011) +[2023-10-08 18:37:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 145457152. Throughput: 0: 1725.9, 1: 1729.0. Samples: 36372412. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:08,803][19739] Avg episode reward: [(0, '1098.490'), (1, '1114.350')] +[2023-10-08 18:37:09,205][21194] Updated weights for policy 1, policy_version 70760 (0.0008) +[2023-10-08 18:37:09,576][21194] Updated weights for policy 1, policy_version 70770 (0.0007) +[2023-10-08 18:37:09,943][21194] Updated weights for policy 1, policy_version 70780 (0.0007) +[2023-10-08 18:37:10,166][21195] Updated weights for policy 0, policy_version 71300 (0.0009) +[2023-10-08 18:37:10,538][21195] Updated weights for policy 0, policy_version 71310 (0.0009) +[2023-10-08 18:37:10,903][21195] Updated weights for policy 0, policy_version 71320 (0.0009) +[2023-10-08 18:37:13,803][19739] Fps is (10 sec: 13106.6, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 145522688. Throughput: 0: 1730.2, 1: 1737.5. Samples: 36393858. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:13,804][19739] Avg episode reward: [(0, '1098.490'), (1, '1114.350')] +[2023-10-08 18:37:13,817][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000071328_73039872.pth... +[2023-10-08 18:37:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000069696_71368704.pth +[2023-10-08 18:37:13,893][21194] Updated weights for policy 1, policy_version 70790 (0.0010) +[2023-10-08 18:37:14,257][21194] Updated weights for policy 1, policy_version 70800 (0.0010) +[2023-10-08 18:37:14,637][21194] Updated weights for policy 1, policy_version 70810 (0.0009) +[2023-10-08 18:37:14,844][21195] Updated weights for policy 0, policy_version 71330 (0.0007) +[2023-10-08 18:37:14,853][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000070816_72515584.pth... +[2023-10-08 18:37:14,884][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000069184_70844416.pth +[2023-10-08 18:37:15,204][21195] Updated weights for policy 0, policy_version 71340 (0.0010) +[2023-10-08 18:37:15,569][21195] Updated weights for policy 0, policy_version 71350 (0.0010) +[2023-10-08 18:37:15,939][21195] Updated weights for policy 0, policy_version 71360 (0.0010) +[2023-10-08 18:37:18,666][21194] Updated weights for policy 1, policy_version 70820 (0.0010) +[2023-10-08 18:37:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 145588224. Throughput: 0: 1750.3, 1: 1709.8. Samples: 36409004. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:18,804][19739] Avg episode reward: [(0, '1098.490'), (1, '1118.120')] +[2023-10-08 18:37:19,035][21194] Updated weights for policy 1, policy_version 70830 (0.0011) +[2023-10-08 18:37:19,395][21194] Updated weights for policy 1, policy_version 70840 (0.0011) +[2023-10-08 18:37:19,685][20836] Saving new best policy, reward=1118.120! +[2023-10-08 18:37:19,898][21195] Updated weights for policy 0, policy_version 71370 (0.0008) +[2023-10-08 18:37:20,263][21195] Updated weights for policy 0, policy_version 71380 (0.0008) +[2023-10-08 18:37:20,637][21195] Updated weights for policy 0, policy_version 71390 (0.0009) +[2023-10-08 18:37:23,295][21194] Updated weights for policy 1, policy_version 70850 (0.0008) +[2023-10-08 18:37:23,654][21194] Updated weights for policy 1, policy_version 70860 (0.0007) +[2023-10-08 18:37:23,803][19739] Fps is (10 sec: 13107.7, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 145653760. Throughput: 0: 1716.9, 1: 1736.7. Samples: 36424408. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:23,803][19739] Avg episode reward: [(0, '1098.490'), (1, '1118.120')] +[2023-10-08 18:37:24,018][21194] Updated weights for policy 1, policy_version 70870 (0.0011) +[2023-10-08 18:37:24,375][21194] Updated weights for policy 1, policy_version 70880 (0.0008) +[2023-10-08 18:37:24,533][21195] Updated weights for policy 0, policy_version 71400 (0.0008) +[2023-10-08 18:37:24,895][21195] Updated weights for policy 0, policy_version 71410 (0.0007) +[2023-10-08 18:37:25,271][21195] Updated weights for policy 0, policy_version 71420 (0.0008) +[2023-10-08 18:37:28,253][21194] Updated weights for policy 1, policy_version 70890 (0.0009) +[2023-10-08 18:37:28,611][21194] Updated weights for policy 1, policy_version 70900 (0.0007) +[2023-10-08 18:37:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13884.7). Total num frames: 145719296. Throughput: 0: 1743.4, 1: 1734.0. Samples: 36445778. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:28,803][19739] Avg episode reward: [(0, '1098.490'), (1, '1118.120')] +[2023-10-08 18:37:28,980][21194] Updated weights for policy 1, policy_version 70910 (0.0009) +[2023-10-08 18:37:29,145][21195] Updated weights for policy 0, policy_version 71430 (0.0008) +[2023-10-08 18:37:29,512][21195] Updated weights for policy 0, policy_version 71440 (0.0008) +[2023-10-08 18:37:29,888][21195] Updated weights for policy 0, policy_version 71450 (0.0009) +[2023-10-08 18:37:32,947][21194] Updated weights for policy 1, policy_version 70920 (0.0010) +[2023-10-08 18:37:33,307][21194] Updated weights for policy 1, policy_version 70930 (0.0009) +[2023-10-08 18:37:33,673][21194] Updated weights for policy 1, policy_version 70940 (0.0009) +[2023-10-08 18:37:33,762][21195] Updated weights for policy 0, policy_version 71460 (0.0010) +[2023-10-08 18:37:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 145784832. Throughput: 0: 1739.0, 1: 1730.9. Samples: 36461190. Policy #0 lag: (min: 25.0, avg: 39.9, max: 57.0) +[2023-10-08 18:37:33,803][19739] Avg episode reward: [(0, '1098.490'), (1, '1118.120')] +[2023-10-08 18:37:34,132][21195] Updated weights for policy 0, policy_version 71470 (0.0010) +[2023-10-08 18:37:34,503][21195] Updated weights for policy 0, policy_version 71480 (0.0009) +[2023-10-08 18:37:37,814][21194] Updated weights for policy 1, policy_version 70950 (0.0009) +[2023-10-08 18:37:38,190][21194] Updated weights for policy 1, policy_version 70960 (0.0010) +[2023-10-08 18:37:38,199][21195] Updated weights for policy 0, policy_version 71490 (0.0008) +[2023-10-08 18:37:38,545][21194] Updated weights for policy 1, policy_version 70970 (0.0008) +[2023-10-08 18:37:38,564][21195] Updated weights for policy 0, policy_version 71500 (0.0007) +[2023-10-08 18:37:38,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 145883136. Throughput: 0: 1737.9, 1: 1733.9. Samples: 36477006. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:37:38,803][19739] Avg episode reward: [(0, '1106.770'), (1, '1118.120')] +[2023-10-08 18:37:38,920][21195] Updated weights for policy 0, policy_version 71510 (0.0011) +[2023-10-08 18:37:39,286][20740] Saving new best policy, reward=1106.770! +[2023-10-08 18:37:39,291][21195] Updated weights for policy 0, policy_version 71520 (0.0009) +[2023-10-08 18:37:42,456][21194] Updated weights for policy 1, policy_version 70980 (0.0007) +[2023-10-08 18:37:42,832][21194] Updated weights for policy 1, policy_version 70990 (0.0010) +[2023-10-08 18:37:43,186][21194] Updated weights for policy 1, policy_version 71000 (0.0008) +[2023-10-08 18:37:43,382][21195] Updated weights for policy 0, policy_version 71530 (0.0009) +[2023-10-08 18:37:43,745][21195] Updated weights for policy 0, policy_version 71540 (0.0008) +[2023-10-08 18:37:43,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 145948672. Throughput: 0: 1756.0, 1: 1721.2. Samples: 36497958. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:37:43,804][19739] Avg episode reward: [(0, '1122.260'), (1, '1118.120')] +[2023-10-08 18:37:44,124][21195] Updated weights for policy 0, policy_version 71550 (0.0009) +[2023-10-08 18:37:44,191][20740] Saving new best policy, reward=1122.260! +[2023-10-08 18:37:47,337][21194] Updated weights for policy 1, policy_version 71010 (0.0010) +[2023-10-08 18:37:47,732][21194] Updated weights for policy 1, policy_version 71020 (0.0008) +[2023-10-08 18:37:47,975][21195] Updated weights for policy 0, policy_version 71560 (0.0008) +[2023-10-08 18:37:48,090][21194] Updated weights for policy 1, policy_version 71030 (0.0008) +[2023-10-08 18:37:48,336][21195] Updated weights for policy 0, policy_version 71570 (0.0007) +[2023-10-08 18:37:48,450][21194] Updated weights for policy 1, policy_version 71040 (0.0008) +[2023-10-08 18:37:48,709][21195] Updated weights for policy 0, policy_version 71580 (0.0008) +[2023-10-08 18:37:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 146014208. Throughput: 0: 1719.1, 1: 1736.6. Samples: 36512686. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:37:48,803][19739] Avg episode reward: [(0, '1122.260'), (1, '1118.120')] +[2023-10-08 18:37:52,374][21194] Updated weights for policy 1, policy_version 71050 (0.0008) +[2023-10-08 18:37:52,636][21195] Updated weights for policy 0, policy_version 71590 (0.0007) +[2023-10-08 18:37:52,729][21194] Updated weights for policy 1, policy_version 71060 (0.0008) +[2023-10-08 18:37:52,994][21195] Updated weights for policy 0, policy_version 71600 (0.0008) +[2023-10-08 18:37:53,103][21194] Updated weights for policy 1, policy_version 71070 (0.0007) +[2023-10-08 18:37:53,364][21195] Updated weights for policy 0, policy_version 71610 (0.0009) +[2023-10-08 18:37:53,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 146112512. Throughput: 0: 1749.6, 1: 1729.3. Samples: 36528960. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:37:53,803][19739] Avg episode reward: [(0, '1122.260'), (1, '1118.120')] +[2023-10-08 18:37:57,070][21194] Updated weights for policy 1, policy_version 71080 (0.0009) +[2023-10-08 18:37:57,311][21195] Updated weights for policy 0, policy_version 71620 (0.0010) +[2023-10-08 18:37:57,430][21194] Updated weights for policy 1, policy_version 71090 (0.0008) +[2023-10-08 18:37:57,679][21195] Updated weights for policy 0, policy_version 71630 (0.0008) +[2023-10-08 18:37:57,792][21194] Updated weights for policy 1, policy_version 71100 (0.0008) +[2023-10-08 18:37:58,045][21195] Updated weights for policy 0, policy_version 71640 (0.0008) +[2023-10-08 18:37:58,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 146178048. Throughput: 0: 1734.9, 1: 1701.1. Samples: 36548476. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:37:58,803][19739] Avg episode reward: [(0, '1107.240'), (1, '1133.310')] +[2023-10-08 18:37:58,812][20836] Saving new best policy, reward=1133.310! +[2023-10-08 18:38:01,770][21194] Updated weights for policy 1, policy_version 71110 (0.0010) +[2023-10-08 18:38:01,920][21195] Updated weights for policy 0, policy_version 71650 (0.0008) +[2023-10-08 18:38:02,132][21194] Updated weights for policy 1, policy_version 71120 (0.0008) +[2023-10-08 18:38:02,297][21195] Updated weights for policy 0, policy_version 71660 (0.0009) +[2023-10-08 18:38:02,510][21194] Updated weights for policy 1, policy_version 71130 (0.0009) +[2023-10-08 18:38:02,663][21195] Updated weights for policy 0, policy_version 71670 (0.0008) +[2023-10-08 18:38:03,031][21195] Updated weights for policy 0, policy_version 71680 (0.0008) +[2023-10-08 18:38:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 146243584. Throughput: 0: 1725.2, 1: 1731.2. Samples: 36564542. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:38:03,803][19739] Avg episode reward: [(0, '1107.250'), (1, '1133.310')] +[2023-10-08 18:38:06,312][21194] Updated weights for policy 1, policy_version 71140 (0.0009) +[2023-10-08 18:38:06,682][21194] Updated weights for policy 1, policy_version 71150 (0.0009) +[2023-10-08 18:38:06,955][21195] Updated weights for policy 0, policy_version 71690 (0.0008) +[2023-10-08 18:38:07,056][21194] Updated weights for policy 1, policy_version 71160 (0.0008) +[2023-10-08 18:38:07,336][21195] Updated weights for policy 0, policy_version 71700 (0.0008) +[2023-10-08 18:38:07,713][21195] Updated weights for policy 0, policy_version 71710 (0.0007) +[2023-10-08 18:38:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 146309120. Throughput: 0: 1756.6, 1: 1713.5. Samples: 36580560. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:38:08,803][19739] Avg episode reward: [(0, '1107.250'), (1, '1133.310')] +[2023-10-08 18:38:11,121][21194] Updated weights for policy 1, policy_version 71170 (0.0009) +[2023-10-08 18:38:11,488][21194] Updated weights for policy 1, policy_version 71180 (0.0009) +[2023-10-08 18:38:11,628][21195] Updated weights for policy 0, policy_version 71720 (0.0008) +[2023-10-08 18:38:11,857][21194] Updated weights for policy 1, policy_version 71190 (0.0008) +[2023-10-08 18:38:11,999][21195] Updated weights for policy 0, policy_version 71730 (0.0007) +[2023-10-08 18:38:12,224][21194] Updated weights for policy 1, policy_version 71200 (0.0008) +[2023-10-08 18:38:12,376][21195] Updated weights for policy 0, policy_version 71740 (0.0007) +[2023-10-08 18:38:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.6, 300 sec: 13884.7). Total num frames: 146374656. Throughput: 0: 1730.6, 1: 1705.5. Samples: 36600402. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:38:13,803][19739] Avg episode reward: [(0, '1108.500'), (1, '1133.310')] +[2023-10-08 18:38:16,224][21195] Updated weights for policy 0, policy_version 71750 (0.0008) +[2023-10-08 18:38:16,281][21194] Updated weights for policy 1, policy_version 71210 (0.0007) +[2023-10-08 18:38:16,592][21195] Updated weights for policy 0, policy_version 71760 (0.0009) +[2023-10-08 18:38:16,640][21194] Updated weights for policy 1, policy_version 71220 (0.0008) +[2023-10-08 18:38:16,958][21195] Updated weights for policy 0, policy_version 71770 (0.0008) +[2023-10-08 18:38:16,997][21194] Updated weights for policy 1, policy_version 71230 (0.0007) +[2023-10-08 18:38:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 146440192. Throughput: 0: 1736.4, 1: 1723.7. Samples: 36616898. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 18:38:18,803][19739] Avg episode reward: [(0, '1108.650'), (1, '1133.310')] +[2023-10-08 18:38:20,875][21194] Updated weights for policy 1, policy_version 71240 (0.0008) +[2023-10-08 18:38:20,969][21195] Updated weights for policy 0, policy_version 71780 (0.0008) +[2023-10-08 18:38:21,235][21194] Updated weights for policy 1, policy_version 71250 (0.0009) +[2023-10-08 18:38:21,342][21195] Updated weights for policy 0, policy_version 71790 (0.0007) +[2023-10-08 18:38:21,601][21194] Updated weights for policy 1, policy_version 71260 (0.0007) +[2023-10-08 18:38:21,701][21195] Updated weights for policy 0, policy_version 71800 (0.0007) +[2023-10-08 18:38:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 146505728. Throughput: 0: 1734.0, 1: 1695.9. Samples: 36631354. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:23,804][19739] Avg episode reward: [(0, '1093.710'), (1, '1133.310')] +[2023-10-08 18:38:25,448][21195] Updated weights for policy 0, policy_version 71810 (0.0008) +[2023-10-08 18:38:25,516][21194] Updated weights for policy 1, policy_version 71270 (0.0008) +[2023-10-08 18:38:25,815][21195] Updated weights for policy 0, policy_version 71820 (0.0009) +[2023-10-08 18:38:25,887][21194] Updated weights for policy 1, policy_version 71280 (0.0007) +[2023-10-08 18:38:26,180][21195] Updated weights for policy 0, policy_version 71830 (0.0008) +[2023-10-08 18:38:26,257][21194] Updated weights for policy 1, policy_version 71290 (0.0008) +[2023-10-08 18:38:26,540][21195] Updated weights for policy 0, policy_version 71840 (0.0009) +[2023-10-08 18:38:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 146571264. Throughput: 0: 1726.7, 1: 1713.2. Samples: 36652752. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:28,803][19739] Avg episode reward: [(0, '1094.240'), (1, '1133.140')] +[2023-10-08 18:38:30,061][21194] Updated weights for policy 1, policy_version 71300 (0.0008) +[2023-10-08 18:38:30,423][21194] Updated weights for policy 1, policy_version 71310 (0.0008) +[2023-10-08 18:38:30,550][21195] Updated weights for policy 0, policy_version 71850 (0.0008) +[2023-10-08 18:38:30,787][21194] Updated weights for policy 1, policy_version 71320 (0.0007) +[2023-10-08 18:38:30,920][21195] Updated weights for policy 0, policy_version 71860 (0.0007) +[2023-10-08 18:38:31,287][21195] Updated weights for policy 0, policy_version 71870 (0.0009) +[2023-10-08 18:38:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 146636800. Throughput: 0: 1751.7, 1: 1703.1. Samples: 36668152. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:33,804][19739] Avg episode reward: [(0, '1079.120'), (1, '1133.140')] +[2023-10-08 18:38:34,846][21194] Updated weights for policy 1, policy_version 71330 (0.0009) +[2023-10-08 18:38:35,074][21195] Updated weights for policy 0, policy_version 71880 (0.0009) +[2023-10-08 18:38:35,229][21194] Updated weights for policy 1, policy_version 71340 (0.0009) +[2023-10-08 18:38:35,443][21195] Updated weights for policy 0, policy_version 71890 (0.0009) +[2023-10-08 18:38:35,593][21194] Updated weights for policy 1, policy_version 71350 (0.0007) +[2023-10-08 18:38:35,809][21195] Updated weights for policy 0, policy_version 71900 (0.0008) +[2023-10-08 18:38:35,955][21194] Updated weights for policy 1, policy_version 71360 (0.0009) +[2023-10-08 18:38:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 146702336. Throughput: 0: 1725.6, 1: 1701.3. Samples: 36683172. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:38,803][19739] Avg episode reward: [(0, '1079.120'), (1, '1133.140')] +[2023-10-08 18:38:39,811][21195] Updated weights for policy 0, policy_version 71910 (0.0008) +[2023-10-08 18:38:39,874][21194] Updated weights for policy 1, policy_version 71370 (0.0008) +[2023-10-08 18:38:40,181][21195] Updated weights for policy 0, policy_version 71920 (0.0009) +[2023-10-08 18:38:40,241][21194] Updated weights for policy 1, policy_version 71380 (0.0008) +[2023-10-08 18:38:40,547][21195] Updated weights for policy 0, policy_version 71930 (0.0008) +[2023-10-08 18:38:40,596][21194] Updated weights for policy 1, policy_version 71390 (0.0009) +[2023-10-08 18:38:43,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 146767872. Throughput: 0: 1738.4, 1: 1729.3. Samples: 36704522. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:43,803][19739] Avg episode reward: [(0, '1079.120'), (1, '1133.140')] +[2023-10-08 18:38:44,478][21195] Updated weights for policy 0, policy_version 71940 (0.0009) +[2023-10-08 18:38:44,676][21194] Updated weights for policy 1, policy_version 71400 (0.0009) +[2023-10-08 18:38:44,850][21195] Updated weights for policy 0, policy_version 71950 (0.0008) +[2023-10-08 18:38:45,035][21194] Updated weights for policy 1, policy_version 71410 (0.0007) +[2023-10-08 18:38:45,229][21195] Updated weights for policy 0, policy_version 71960 (0.0008) +[2023-10-08 18:38:45,392][21194] Updated weights for policy 1, policy_version 71420 (0.0008) +[2023-10-08 18:38:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 146833408. Throughput: 0: 1750.4, 1: 1702.1. Samples: 36719908. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:48,803][19739] Avg episode reward: [(0, '1092.710'), (1, '1147.050')] +[2023-10-08 18:38:48,804][20836] Saving new best policy, reward=1147.050! +[2023-10-08 18:38:49,237][21195] Updated weights for policy 0, policy_version 71970 (0.0011) +[2023-10-08 18:38:49,612][21195] Updated weights for policy 0, policy_version 71980 (0.0008) +[2023-10-08 18:38:49,644][21194] Updated weights for policy 1, policy_version 71430 (0.0008) +[2023-10-08 18:38:49,976][21195] Updated weights for policy 0, policy_version 71990 (0.0007) +[2023-10-08 18:38:50,008][21194] Updated weights for policy 1, policy_version 71440 (0.0008) +[2023-10-08 18:38:50,336][21195] Updated weights for policy 0, policy_version 72000 (0.0008) +[2023-10-08 18:38:50,378][21194] Updated weights for policy 1, policy_version 71450 (0.0007) +[2023-10-08 18:38:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 146898944. Throughput: 0: 1719.9, 1: 1710.4. Samples: 36734922. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:53,804][19739] Avg episode reward: [(0, '1092.710'), (1, '1131.950')] +[2023-10-08 18:38:54,168][21194] Updated weights for policy 1, policy_version 71460 (0.0008) +[2023-10-08 18:38:54,280][21195] Updated weights for policy 0, policy_version 72010 (0.0007) +[2023-10-08 18:38:54,536][21194] Updated weights for policy 1, policy_version 71470 (0.0008) +[2023-10-08 18:38:54,654][21195] Updated weights for policy 0, policy_version 72020 (0.0007) +[2023-10-08 18:38:54,898][21194] Updated weights for policy 1, policy_version 71480 (0.0007) +[2023-10-08 18:38:55,018][21195] Updated weights for policy 0, policy_version 72030 (0.0007) +[2023-10-08 18:38:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 146964480. Throughput: 0: 1746.6, 1: 1719.5. Samples: 36756376. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:38:58,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1131.950')] +[2023-10-08 18:38:58,846][21195] Updated weights for policy 0, policy_version 72040 (0.0008) +[2023-10-08 18:38:58,856][21194] Updated weights for policy 1, policy_version 71490 (0.0008) +[2023-10-08 18:38:59,216][21195] Updated weights for policy 0, policy_version 72050 (0.0008) +[2023-10-08 18:38:59,226][21194] Updated weights for policy 1, policy_version 71500 (0.0009) +[2023-10-08 18:38:59,579][21195] Updated weights for policy 0, policy_version 72060 (0.0008) +[2023-10-08 18:38:59,586][21194] Updated weights for policy 1, policy_version 71510 (0.0008) +[2023-10-08 18:38:59,952][21194] Updated weights for policy 1, policy_version 71520 (0.0010) +[2023-10-08 18:39:03,403][21195] Updated weights for policy 0, policy_version 72070 (0.0009) +[2023-10-08 18:39:03,767][21195] Updated weights for policy 0, policy_version 72080 (0.0008) +[2023-10-08 18:39:03,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 147030016. Throughput: 0: 1733.6, 1: 1694.9. Samples: 36771182. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:39:03,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1131.950')] +[2023-10-08 18:39:04,025][21194] Updated weights for policy 1, policy_version 71530 (0.0009) +[2023-10-08 18:39:04,140][21195] Updated weights for policy 0, policy_version 72090 (0.0007) +[2023-10-08 18:39:04,391][21194] Updated weights for policy 1, policy_version 71540 (0.0008) +[2023-10-08 18:39:04,755][21194] Updated weights for policy 1, policy_version 71550 (0.0009) +[2023-10-08 18:39:08,052][21195] Updated weights for policy 0, policy_version 72100 (0.0008) +[2023-10-08 18:39:08,419][21195] Updated weights for policy 0, policy_version 72110 (0.0007) +[2023-10-08 18:39:08,692][21194] Updated weights for policy 1, policy_version 71560 (0.0008) +[2023-10-08 18:39:08,795][21195] Updated weights for policy 0, policy_version 72120 (0.0008) +[2023-10-08 18:39:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 147095552. Throughput: 0: 1746.0, 1: 1720.5. Samples: 36787344. Policy #0 lag: (min: 29.0, avg: 31.7, max: 61.0) +[2023-10-08 18:39:08,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1131.950')] +[2023-10-08 18:39:09,059][21194] Updated weights for policy 1, policy_version 71570 (0.0008) +[2023-10-08 18:39:09,419][21194] Updated weights for policy 1, policy_version 71580 (0.0008) +[2023-10-08 18:39:12,589][21195] Updated weights for policy 0, policy_version 72130 (0.0008) +[2023-10-08 18:39:12,957][21195] Updated weights for policy 0, policy_version 72140 (0.0007) +[2023-10-08 18:39:13,331][21195] Updated weights for policy 0, policy_version 72150 (0.0008) +[2023-10-08 18:39:13,418][21194] Updated weights for policy 1, policy_version 71590 (0.0007) +[2023-10-08 18:39:13,699][21195] Updated weights for policy 0, policy_version 72160 (0.0009) +[2023-10-08 18:39:13,776][21194] Updated weights for policy 1, policy_version 71600 (0.0008) +[2023-10-08 18:39:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 147193856. Throughput: 0: 1744.5, 1: 1719.6. Samples: 36808638. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:13,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1131.950')] +[2023-10-08 18:39:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000072160_73891840.pth... +[2023-10-08 18:39:13,840][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000070528_72220672.pth +[2023-10-08 18:39:14,150][21194] Updated weights for policy 1, policy_version 71610 (0.0008) +[2023-10-08 18:39:14,361][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000071616_73334784.pth... +[2023-10-08 18:39:14,390][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000069984_71663616.pth +[2023-10-08 18:39:17,772][21195] Updated weights for policy 0, policy_version 72170 (0.0007) +[2023-10-08 18:39:18,106][21194] Updated weights for policy 1, policy_version 71620 (0.0008) +[2023-10-08 18:39:18,139][21195] Updated weights for policy 0, policy_version 72180 (0.0008) +[2023-10-08 18:39:18,472][21194] Updated weights for policy 1, policy_version 71630 (0.0009) +[2023-10-08 18:39:18,512][21195] Updated weights for policy 0, policy_version 72190 (0.0007) +[2023-10-08 18:39:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 147259392. Throughput: 0: 1723.6, 1: 1714.0. Samples: 36822840. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:18,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1131.950')] +[2023-10-08 18:39:18,836][21194] Updated weights for policy 1, policy_version 71640 (0.0009) +[2023-10-08 18:39:22,371][21195] Updated weights for policy 0, policy_version 72200 (0.0008) +[2023-10-08 18:39:22,750][21195] Updated weights for policy 0, policy_version 72210 (0.0008) +[2023-10-08 18:39:22,969][21194] Updated weights for policy 1, policy_version 71650 (0.0008) +[2023-10-08 18:39:23,119][21195] Updated weights for policy 0, policy_version 72220 (0.0009) +[2023-10-08 18:39:23,381][21194] Updated weights for policy 1, policy_version 71660 (0.0007) +[2023-10-08 18:39:23,752][21194] Updated weights for policy 1, policy_version 71670 (0.0008) +[2023-10-08 18:39:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 147324928. Throughput: 0: 1754.4, 1: 1722.4. Samples: 36839630. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:23,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1116.110')] +[2023-10-08 18:39:24,117][21194] Updated weights for policy 1, policy_version 71680 (0.0009) +[2023-10-08 18:39:26,939][21195] Updated weights for policy 0, policy_version 72230 (0.0007) +[2023-10-08 18:39:27,302][21195] Updated weights for policy 0, policy_version 72240 (0.0009) +[2023-10-08 18:39:27,678][21195] Updated weights for policy 0, policy_version 72250 (0.0008) +[2023-10-08 18:39:27,923][21194] Updated weights for policy 1, policy_version 71690 (0.0007) +[2023-10-08 18:39:28,284][21194] Updated weights for policy 1, policy_version 71700 (0.0008) +[2023-10-08 18:39:28,655][21194] Updated weights for policy 1, policy_version 71710 (0.0011) +[2023-10-08 18:39:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 147423232. Throughput: 0: 1729.6, 1: 1714.5. Samples: 36859508. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:28,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1101.150')] +[2023-10-08 18:39:31,531][21195] Updated weights for policy 0, policy_version 72260 (0.0007) +[2023-10-08 18:39:31,890][21195] Updated weights for policy 0, policy_version 72270 (0.0008) +[2023-10-08 18:39:32,266][21195] Updated weights for policy 0, policy_version 72280 (0.0007) +[2023-10-08 18:39:32,710][21194] Updated weights for policy 1, policy_version 71720 (0.0008) +[2023-10-08 18:39:33,085][21194] Updated weights for policy 1, policy_version 71730 (0.0008) +[2023-10-08 18:39:33,439][21194] Updated weights for policy 1, policy_version 71740 (0.0009) +[2023-10-08 18:39:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 147488768. Throughput: 0: 1729.6, 1: 1721.5. Samples: 36875210. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:33,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1101.150')] +[2023-10-08 18:39:36,268][21195] Updated weights for policy 0, policy_version 72290 (0.0008) +[2023-10-08 18:39:36,632][21195] Updated weights for policy 0, policy_version 72300 (0.0009) +[2023-10-08 18:39:37,000][21195] Updated weights for policy 0, policy_version 72310 (0.0009) +[2023-10-08 18:39:37,288][21194] Updated weights for policy 1, policy_version 71750 (0.0008) +[2023-10-08 18:39:37,369][21195] Updated weights for policy 0, policy_version 72320 (0.0009) +[2023-10-08 18:39:37,663][21194] Updated weights for policy 1, policy_version 71760 (0.0009) +[2023-10-08 18:39:38,029][21194] Updated weights for policy 1, policy_version 71770 (0.0009) +[2023-10-08 18:39:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 147554304. Throughput: 0: 1743.3, 1: 1732.7. Samples: 36891342. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:38,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1116.140')] +[2023-10-08 18:39:41,266][21195] Updated weights for policy 0, policy_version 72330 (0.0011) +[2023-10-08 18:39:41,638][21195] Updated weights for policy 0, policy_version 72340 (0.0010) +[2023-10-08 18:39:41,924][21194] Updated weights for policy 1, policy_version 71780 (0.0008) +[2023-10-08 18:39:42,010][21195] Updated weights for policy 0, policy_version 72350 (0.0008) +[2023-10-08 18:39:42,288][21194] Updated weights for policy 1, policy_version 71790 (0.0008) +[2023-10-08 18:39:42,666][21194] Updated weights for policy 1, policy_version 71800 (0.0008) +[2023-10-08 18:39:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 147619840. Throughput: 0: 1730.1, 1: 1702.8. Samples: 36910854. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:43,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1116.140')] +[2023-10-08 18:39:45,886][21195] Updated weights for policy 0, policy_version 72360 (0.0009) +[2023-10-08 18:39:46,257][21195] Updated weights for policy 0, policy_version 72370 (0.0008) +[2023-10-08 18:39:46,620][21195] Updated weights for policy 0, policy_version 72380 (0.0009) +[2023-10-08 18:39:46,664][21194] Updated weights for policy 1, policy_version 71810 (0.0007) +[2023-10-08 18:39:47,032][21194] Updated weights for policy 1, policy_version 71820 (0.0009) +[2023-10-08 18:39:47,399][21194] Updated weights for policy 1, policy_version 71830 (0.0009) +[2023-10-08 18:39:47,755][21194] Updated weights for policy 1, policy_version 71840 (0.0010) +[2023-10-08 18:39:48,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 147685376. Throughput: 0: 1738.9, 1: 1733.9. Samples: 36927456. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:48,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1101.430')] +[2023-10-08 18:39:50,564][21195] Updated weights for policy 0, policy_version 72390 (0.0010) +[2023-10-08 18:39:50,920][21195] Updated weights for policy 0, policy_version 72400 (0.0009) +[2023-10-08 18:39:51,291][21195] Updated weights for policy 0, policy_version 72410 (0.0008) +[2023-10-08 18:39:51,655][21194] Updated weights for policy 1, policy_version 71850 (0.0010) +[2023-10-08 18:39:52,008][21194] Updated weights for policy 1, policy_version 71860 (0.0009) +[2023-10-08 18:39:52,371][21194] Updated weights for policy 1, policy_version 71870 (0.0008) +[2023-10-08 18:39:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 147750912. Throughput: 0: 1718.3, 1: 1721.9. Samples: 36942150. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 18:39:53,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1100.590')] +[2023-10-08 18:39:55,193][21195] Updated weights for policy 0, policy_version 72420 (0.0007) +[2023-10-08 18:39:55,569][21195] Updated weights for policy 0, policy_version 72430 (0.0007) +[2023-10-08 18:39:55,935][21195] Updated weights for policy 0, policy_version 72440 (0.0010) +[2023-10-08 18:39:56,303][21194] Updated weights for policy 1, policy_version 71880 (0.0009) +[2023-10-08 18:39:56,657][21194] Updated weights for policy 1, policy_version 71890 (0.0010) +[2023-10-08 18:39:57,031][21194] Updated weights for policy 1, policy_version 71900 (0.0009) +[2023-10-08 18:39:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 147816448. Throughput: 0: 1728.4, 1: 1705.2. Samples: 36963146. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:39:58,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1085.780')] +[2023-10-08 18:39:59,630][21195] Updated weights for policy 0, policy_version 72450 (0.0007) +[2023-10-08 18:40:00,012][21195] Updated weights for policy 0, policy_version 72460 (0.0008) +[2023-10-08 18:40:00,375][21195] Updated weights for policy 0, policy_version 72470 (0.0008) +[2023-10-08 18:40:00,741][21195] Updated weights for policy 0, policy_version 72480 (0.0010) +[2023-10-08 18:40:00,902][21194] Updated weights for policy 1, policy_version 71910 (0.0009) +[2023-10-08 18:40:01,260][21194] Updated weights for policy 1, policy_version 71920 (0.0008) +[2023-10-08 18:40:01,624][21194] Updated weights for policy 1, policy_version 71930 (0.0008) +[2023-10-08 18:40:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 147881984. Throughput: 0: 1757.5, 1: 1728.2. Samples: 36979696. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:03,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1108.960')] +[2023-10-08 18:40:04,693][21195] Updated weights for policy 0, policy_version 72490 (0.0008) +[2023-10-08 18:40:05,070][21195] Updated weights for policy 0, policy_version 72500 (0.0008) +[2023-10-08 18:40:05,441][21195] Updated weights for policy 0, policy_version 72510 (0.0010) +[2023-10-08 18:40:05,658][21194] Updated weights for policy 1, policy_version 71940 (0.0008) +[2023-10-08 18:40:06,033][21194] Updated weights for policy 1, policy_version 71950 (0.0007) +[2023-10-08 18:40:06,401][21194] Updated weights for policy 1, policy_version 71960 (0.0008) +[2023-10-08 18:40:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 147947520. Throughput: 0: 1726.2, 1: 1706.6. Samples: 36994106. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:08,803][19739] Avg episode reward: [(0, '1106.540'), (1, '1092.900')] +[2023-10-08 18:40:09,312][21195] Updated weights for policy 0, policy_version 72520 (0.0007) +[2023-10-08 18:40:09,679][21195] Updated weights for policy 0, policy_version 72530 (0.0007) +[2023-10-08 18:40:10,056][21195] Updated weights for policy 0, policy_version 72540 (0.0009) +[2023-10-08 18:40:10,372][21194] Updated weights for policy 1, policy_version 71970 (0.0008) +[2023-10-08 18:40:10,783][21194] Updated weights for policy 1, policy_version 71980 (0.0007) +[2023-10-08 18:40:11,155][21194] Updated weights for policy 1, policy_version 71990 (0.0008) +[2023-10-08 18:40:11,519][21194] Updated weights for policy 1, policy_version 72000 (0.0007) +[2023-10-08 18:40:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 148013056. Throughput: 0: 1752.0, 1: 1709.0. Samples: 37015254. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:13,803][19739] Avg episode reward: [(0, '1106.320'), (1, '1092.900')] +[2023-10-08 18:40:13,954][21195] Updated weights for policy 0, policy_version 72550 (0.0009) +[2023-10-08 18:40:14,325][21195] Updated weights for policy 0, policy_version 72560 (0.0008) +[2023-10-08 18:40:14,691][21195] Updated weights for policy 0, policy_version 72570 (0.0008) +[2023-10-08 18:40:15,563][21194] Updated weights for policy 1, policy_version 72010 (0.0011) +[2023-10-08 18:40:15,927][21194] Updated weights for policy 1, policy_version 72020 (0.0009) +[2023-10-08 18:40:16,286][21194] Updated weights for policy 1, policy_version 72030 (0.0009) +[2023-10-08 18:40:18,636][21195] Updated weights for policy 0, policy_version 72580 (0.0007) +[2023-10-08 18:40:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 148078592. Throughput: 0: 1747.2, 1: 1707.7. Samples: 37030684. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:18,803][19739] Avg episode reward: [(0, '1106.630'), (1, '1078.200')] +[2023-10-08 18:40:19,003][21195] Updated weights for policy 0, policy_version 72590 (0.0007) +[2023-10-08 18:40:19,368][21195] Updated weights for policy 0, policy_version 72600 (0.0010) +[2023-10-08 18:40:20,315][21194] Updated weights for policy 1, policy_version 72040 (0.0009) +[2023-10-08 18:40:20,681][21194] Updated weights for policy 1, policy_version 72050 (0.0008) +[2023-10-08 18:40:21,055][21194] Updated weights for policy 1, policy_version 72060 (0.0009) +[2023-10-08 18:40:23,286][21195] Updated weights for policy 0, policy_version 72610 (0.0011) +[2023-10-08 18:40:23,649][21195] Updated weights for policy 0, policy_version 72620 (0.0007) +[2023-10-08 18:40:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 148144128. Throughput: 0: 1742.2, 1: 1695.4. Samples: 37046032. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:23,803][19739] Avg episode reward: [(0, '1106.630'), (1, '1063.340')] +[2023-10-08 18:40:24,013][21195] Updated weights for policy 0, policy_version 72630 (0.0008) +[2023-10-08 18:40:24,382][21195] Updated weights for policy 0, policy_version 72640 (0.0007) +[2023-10-08 18:40:24,975][21194] Updated weights for policy 1, policy_version 72070 (0.0008) +[2023-10-08 18:40:25,345][21194] Updated weights for policy 1, policy_version 72080 (0.0008) +[2023-10-08 18:40:25,709][21194] Updated weights for policy 1, policy_version 72090 (0.0009) +[2023-10-08 18:40:28,334][21195] Updated weights for policy 0, policy_version 72650 (0.0007) +[2023-10-08 18:40:28,715][21195] Updated weights for policy 0, policy_version 72660 (0.0008) +[2023-10-08 18:40:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 148209664. Throughput: 0: 1759.6, 1: 1720.8. Samples: 37067472. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:28,803][19739] Avg episode reward: [(0, '1106.630'), (1, '1066.150')] +[2023-10-08 18:40:29,077][21195] Updated weights for policy 0, policy_version 72670 (0.0008) +[2023-10-08 18:40:29,785][21194] Updated weights for policy 1, policy_version 72100 (0.0007) +[2023-10-08 18:40:30,155][21194] Updated weights for policy 1, policy_version 72110 (0.0007) +[2023-10-08 18:40:30,523][21194] Updated weights for policy 1, policy_version 72120 (0.0007) +[2023-10-08 18:40:32,972][21195] Updated weights for policy 0, policy_version 72680 (0.0007) +[2023-10-08 18:40:33,349][21195] Updated weights for policy 0, policy_version 72690 (0.0008) +[2023-10-08 18:40:33,718][21195] Updated weights for policy 0, policy_version 72700 (0.0007) +[2023-10-08 18:40:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 148275200. Throughput: 0: 1736.4, 1: 1692.9. Samples: 37081772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:33,803][19739] Avg episode reward: [(0, '1106.630'), (1, '1050.850')] +[2023-10-08 18:40:34,511][21194] Updated weights for policy 1, policy_version 72130 (0.0008) +[2023-10-08 18:40:34,877][21194] Updated weights for policy 1, policy_version 72140 (0.0011) +[2023-10-08 18:40:35,256][21194] Updated weights for policy 1, policy_version 72150 (0.0009) +[2023-10-08 18:40:35,620][21194] Updated weights for policy 1, policy_version 72160 (0.0011) +[2023-10-08 18:40:37,528][21195] Updated weights for policy 0, policy_version 72710 (0.0007) +[2023-10-08 18:40:37,906][21195] Updated weights for policy 0, policy_version 72720 (0.0009) +[2023-10-08 18:40:38,270][21195] Updated weights for policy 0, policy_version 72730 (0.0007) +[2023-10-08 18:40:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 148373504. Throughput: 0: 1769.4, 1: 1702.5. Samples: 37098388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:40:38,803][19739] Avg episode reward: [(0, '1106.630'), (1, '1050.850')] +[2023-10-08 18:40:39,660][21194] Updated weights for policy 1, policy_version 72170 (0.0012) +[2023-10-08 18:40:40,024][21194] Updated weights for policy 1, policy_version 72180 (0.0010) +[2023-10-08 18:40:40,392][21194] Updated weights for policy 1, policy_version 72190 (0.0008) +[2023-10-08 18:40:42,170][21195] Updated weights for policy 0, policy_version 72740 (0.0010) +[2023-10-08 18:40:42,540][21195] Updated weights for policy 0, policy_version 72750 (0.0010) +[2023-10-08 18:40:42,905][21195] Updated weights for policy 0, policy_version 72760 (0.0008) +[2023-10-08 18:40:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 148439040. Throughput: 0: 1741.9, 1: 1715.5. Samples: 37118730. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:40:43,803][19739] Avg episode reward: [(0, '1107.010'), (1, '1065.040')] +[2023-10-08 18:40:44,421][21194] Updated weights for policy 1, policy_version 72200 (0.0008) +[2023-10-08 18:40:44,793][21194] Updated weights for policy 1, policy_version 72210 (0.0008) +[2023-10-08 18:40:45,152][21194] Updated weights for policy 1, policy_version 72220 (0.0008) +[2023-10-08 18:40:46,812][21195] Updated weights for policy 0, policy_version 72770 (0.0008) +[2023-10-08 18:40:47,189][21195] Updated weights for policy 0, policy_version 72780 (0.0008) +[2023-10-08 18:40:47,557][21195] Updated weights for policy 0, policy_version 72790 (0.0008) +[2023-10-08 18:40:47,919][21195] Updated weights for policy 0, policy_version 72800 (0.0010) +[2023-10-08 18:40:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 148504576. Throughput: 0: 1730.4, 1: 1692.6. Samples: 37133734. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:40:48,803][19739] Avg episode reward: [(0, '1107.010'), (1, '1065.040')] +[2023-10-08 18:40:49,051][21194] Updated weights for policy 1, policy_version 72230 (0.0008) +[2023-10-08 18:40:49,413][21194] Updated weights for policy 1, policy_version 72240 (0.0007) +[2023-10-08 18:40:49,782][21194] Updated weights for policy 1, policy_version 72250 (0.0007) +[2023-10-08 18:40:52,060][21195] Updated weights for policy 0, policy_version 72810 (0.0008) +[2023-10-08 18:40:52,432][21195] Updated weights for policy 0, policy_version 72820 (0.0007) +[2023-10-08 18:40:52,804][21195] Updated weights for policy 0, policy_version 72830 (0.0007) +[2023-10-08 18:40:53,722][21194] Updated weights for policy 1, policy_version 72260 (0.0009) +[2023-10-08 18:40:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 148570112. Throughput: 0: 1753.0, 1: 1718.7. Samples: 37150334. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:40:53,803][19739] Avg episode reward: [(0, '1114.810'), (1, '1065.040')] +[2023-10-08 18:40:54,093][21194] Updated weights for policy 1, policy_version 72270 (0.0011) +[2023-10-08 18:40:54,455][21194] Updated weights for policy 1, policy_version 72280 (0.0009) +[2023-10-08 18:40:56,633][21195] Updated weights for policy 0, policy_version 72840 (0.0008) +[2023-10-08 18:40:56,995][21195] Updated weights for policy 0, policy_version 72850 (0.0009) +[2023-10-08 18:40:57,353][21195] Updated weights for policy 0, policy_version 72860 (0.0007) +[2023-10-08 18:40:58,399][21194] Updated weights for policy 1, policy_version 72290 (0.0008) +[2023-10-08 18:40:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 148635648. Throughput: 0: 1725.3, 1: 1726.0. Samples: 37170564. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:40:58,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1065.040')] +[2023-10-08 18:40:58,811][21194] Updated weights for policy 1, policy_version 72300 (0.0011) +[2023-10-08 18:40:59,184][21194] Updated weights for policy 1, policy_version 72310 (0.0010) +[2023-10-08 18:40:59,549][21194] Updated weights for policy 1, policy_version 72320 (0.0011) +[2023-10-08 18:41:01,135][21195] Updated weights for policy 0, policy_version 72870 (0.0007) +[2023-10-08 18:41:01,511][21195] Updated weights for policy 0, policy_version 72880 (0.0009) +[2023-10-08 18:41:01,885][21195] Updated weights for policy 0, policy_version 72890 (0.0008) +[2023-10-08 18:41:03,417][21194] Updated weights for policy 1, policy_version 72330 (0.0007) +[2023-10-08 18:41:03,780][21194] Updated weights for policy 1, policy_version 72340 (0.0009) +[2023-10-08 18:41:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 148701184. Throughput: 0: 1734.9, 1: 1714.4. Samples: 37185904. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:41:03,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1065.040')] +[2023-10-08 18:41:04,135][21194] Updated weights for policy 1, policy_version 72350 (0.0009) +[2023-10-08 18:41:05,776][21195] Updated weights for policy 0, policy_version 72900 (0.0008) +[2023-10-08 18:41:06,138][21195] Updated weights for policy 0, policy_version 72910 (0.0007) +[2023-10-08 18:41:06,513][21195] Updated weights for policy 0, policy_version 72920 (0.0009) +[2023-10-08 18:41:08,259][21194] Updated weights for policy 1, policy_version 72360 (0.0010) +[2023-10-08 18:41:08,615][21194] Updated weights for policy 1, policy_version 72370 (0.0009) +[2023-10-08 18:41:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 148766720. Throughput: 0: 1728.1, 1: 1720.8. Samples: 37201232. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:41:08,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.910')] +[2023-10-08 18:41:08,989][21194] Updated weights for policy 1, policy_version 72380 (0.0008) +[2023-10-08 18:41:10,337][21195] Updated weights for policy 0, policy_version 72930 (0.0008) +[2023-10-08 18:41:10,718][21195] Updated weights for policy 0, policy_version 72940 (0.0009) +[2023-10-08 18:41:11,088][21195] Updated weights for policy 0, policy_version 72950 (0.0008) +[2023-10-08 18:41:11,453][21195] Updated weights for policy 0, policy_version 72960 (0.0007) +[2023-10-08 18:41:13,006][21194] Updated weights for policy 1, policy_version 72390 (0.0007) +[2023-10-08 18:41:13,375][21194] Updated weights for policy 1, policy_version 72400 (0.0009) +[2023-10-08 18:41:13,741][21194] Updated weights for policy 1, policy_version 72410 (0.0009) +[2023-10-08 18:41:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 148832256. Throughput: 0: 1723.2, 1: 1718.8. Samples: 37222362. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:41:13,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.910')] +[2023-10-08 18:41:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000072960_74711040.pth... +[2023-10-08 18:41:13,847][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000071328_73039872.pth +[2023-10-08 18:41:13,851][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000072960_74711040.pth +[2023-10-08 18:41:13,960][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000072416_74153984.pth... +[2023-10-08 18:41:14,002][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000070816_72515584.pth +[2023-10-08 18:41:14,008][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000072416_74153984.pth +[2023-10-08 18:41:15,351][21195] Updated weights for policy 0, policy_version 72970 (0.0009) +[2023-10-08 18:41:15,726][21195] Updated weights for policy 0, policy_version 72980 (0.0010) +[2023-10-08 18:41:16,095][21195] Updated weights for policy 0, policy_version 72990 (0.0008) +[2023-10-08 18:41:17,497][21194] Updated weights for policy 1, policy_version 72420 (0.0008) +[2023-10-08 18:41:17,857][21194] Updated weights for policy 1, policy_version 72430 (0.0010) +[2023-10-08 18:41:18,221][21194] Updated weights for policy 1, policy_version 72440 (0.0009) +[2023-10-08 18:41:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 148930560. Throughput: 0: 1744.7, 1: 1725.6. Samples: 37237934. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:41:18,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.910')] +[2023-10-08 18:41:20,172][21195] Updated weights for policy 0, policy_version 73000 (0.0007) +[2023-10-08 18:41:20,532][21195] Updated weights for policy 0, policy_version 73010 (0.0008) +[2023-10-08 18:41:20,909][21195] Updated weights for policy 0, policy_version 73020 (0.0010) +[2023-10-08 18:41:22,357][21194] Updated weights for policy 1, policy_version 72450 (0.0007) +[2023-10-08 18:41:22,720][21194] Updated weights for policy 1, policy_version 72460 (0.0008) +[2023-10-08 18:41:23,083][21194] Updated weights for policy 1, policy_version 72470 (0.0007) +[2023-10-08 18:41:23,449][21194] Updated weights for policy 1, policy_version 72480 (0.0008) +[2023-10-08 18:41:23,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 148996096. Throughput: 0: 1711.2, 1: 1730.4. Samples: 37253262. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:41:23,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.910')] +[2023-10-08 18:41:24,744][21195] Updated weights for policy 0, policy_version 73030 (0.0010) +[2023-10-08 18:41:25,114][21195] Updated weights for policy 0, policy_version 73040 (0.0008) +[2023-10-08 18:41:25,497][21195] Updated weights for policy 0, policy_version 73050 (0.0010) +[2023-10-08 18:41:27,364][21194] Updated weights for policy 1, policy_version 72490 (0.0009) +[2023-10-08 18:41:27,727][21194] Updated weights for policy 1, policy_version 72500 (0.0008) +[2023-10-08 18:41:28,094][21194] Updated weights for policy 1, policy_version 72510 (0.0007) +[2023-10-08 18:41:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 149061632. Throughput: 0: 1735.6, 1: 1707.6. Samples: 37273674. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 18:41:28,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.930')] +[2023-10-08 18:41:29,399][21195] Updated weights for policy 0, policy_version 73060 (0.0007) +[2023-10-08 18:41:29,774][21195] Updated weights for policy 0, policy_version 73070 (0.0007) +[2023-10-08 18:41:30,139][21195] Updated weights for policy 0, policy_version 73080 (0.0007) +[2023-10-08 18:41:32,150][21194] Updated weights for policy 1, policy_version 72520 (0.0010) +[2023-10-08 18:41:32,508][21194] Updated weights for policy 1, policy_version 72530 (0.0011) +[2023-10-08 18:41:32,869][21194] Updated weights for policy 1, policy_version 72540 (0.0007) +[2023-10-08 18:41:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 149127168. Throughput: 0: 1746.9, 1: 1733.5. Samples: 37290352. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:41:33,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.930')] +[2023-10-08 18:41:33,999][21195] Updated weights for policy 0, policy_version 73090 (0.0012) +[2023-10-08 18:41:34,372][21195] Updated weights for policy 0, policy_version 73100 (0.0008) +[2023-10-08 18:41:34,738][21195] Updated weights for policy 0, policy_version 73110 (0.0008) +[2023-10-08 18:41:35,093][21195] Updated weights for policy 0, policy_version 73120 (0.0008) +[2023-10-08 18:41:36,797][21194] Updated weights for policy 1, policy_version 72550 (0.0008) +[2023-10-08 18:41:37,168][21194] Updated weights for policy 1, policy_version 72560 (0.0008) +[2023-10-08 18:41:37,531][21194] Updated weights for policy 1, policy_version 72570 (0.0010) +[2023-10-08 18:41:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 149192704. Throughput: 0: 1726.0, 1: 1714.6. Samples: 37305162. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:41:38,803][19739] Avg episode reward: [(0, '1114.770'), (1, '1070.930')] +[2023-10-08 18:41:39,269][21195] Updated weights for policy 0, policy_version 73130 (0.0008) +[2023-10-08 18:41:39,627][21195] Updated weights for policy 0, policy_version 73140 (0.0007) +[2023-10-08 18:41:39,995][21195] Updated weights for policy 0, policy_version 73150 (0.0008) +[2023-10-08 18:41:41,625][21194] Updated weights for policy 1, policy_version 72580 (0.0008) +[2023-10-08 18:41:41,988][21194] Updated weights for policy 1, policy_version 72590 (0.0009) +[2023-10-08 18:41:42,368][21194] Updated weights for policy 1, policy_version 72600 (0.0009) +[2023-10-08 18:41:43,712][21195] Updated weights for policy 0, policy_version 73160 (0.0008) +[2023-10-08 18:41:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 149258240. Throughput: 0: 1753.3, 1: 1690.7. Samples: 37325544. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:41:43,803][19739] Avg episode reward: [(0, '1110.980'), (1, '1070.930')] +[2023-10-08 18:41:44,085][21195] Updated weights for policy 0, policy_version 73170 (0.0009) +[2023-10-08 18:41:44,446][21195] Updated weights for policy 0, policy_version 73180 (0.0007) +[2023-10-08 18:41:46,389][21194] Updated weights for policy 1, policy_version 72610 (0.0009) +[2023-10-08 18:41:46,785][21194] Updated weights for policy 1, policy_version 72620 (0.0010) +[2023-10-08 18:41:47,140][21194] Updated weights for policy 1, policy_version 72630 (0.0007) +[2023-10-08 18:41:47,502][21194] Updated weights for policy 1, policy_version 72640 (0.0009) +[2023-10-08 18:41:48,359][21195] Updated weights for policy 0, policy_version 73190 (0.0009) +[2023-10-08 18:41:48,724][21195] Updated weights for policy 0, policy_version 73200 (0.0010) +[2023-10-08 18:41:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 149323776. Throughput: 0: 1736.8, 1: 1723.1. Samples: 37341598. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:41:48,803][19739] Avg episode reward: [(0, '1066.880'), (1, '1070.930')] +[2023-10-08 18:41:49,091][21195] Updated weights for policy 0, policy_version 73210 (0.0008) +[2023-10-08 18:41:51,353][21194] Updated weights for policy 1, policy_version 72650 (0.0007) +[2023-10-08 18:41:51,714][21194] Updated weights for policy 1, policy_version 72660 (0.0008) +[2023-10-08 18:41:52,083][21194] Updated weights for policy 1, policy_version 72670 (0.0009) +[2023-10-08 18:41:53,041][21195] Updated weights for policy 0, policy_version 73220 (0.0009) +[2023-10-08 18:41:53,410][21195] Updated weights for policy 0, policy_version 73230 (0.0007) +[2023-10-08 18:41:53,783][21195] Updated weights for policy 0, policy_version 73240 (0.0010) +[2023-10-08 18:41:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 149389312. Throughput: 0: 1750.0, 1: 1698.7. Samples: 37356424. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:41:53,803][19739] Avg episode reward: [(0, '1081.620'), (1, '1057.460')] +[2023-10-08 18:41:55,946][21194] Updated weights for policy 1, policy_version 72680 (0.0010) +[2023-10-08 18:41:56,304][21194] Updated weights for policy 1, policy_version 72690 (0.0009) +[2023-10-08 18:41:56,663][21194] Updated weights for policy 1, policy_version 72700 (0.0010) +[2023-10-08 18:41:57,561][21195] Updated weights for policy 0, policy_version 73250 (0.0008) +[2023-10-08 18:41:57,933][21195] Updated weights for policy 0, policy_version 73260 (0.0008) +[2023-10-08 18:41:58,293][21195] Updated weights for policy 0, policy_version 73270 (0.0008) +[2023-10-08 18:41:58,666][21195] Updated weights for policy 0, policy_version 73280 (0.0007) +[2023-10-08 18:41:58,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 149487616. Throughput: 0: 1750.7, 1: 1700.4. Samples: 37377662. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:41:58,803][19739] Avg episode reward: [(0, '1066.420'), (1, '1057.460')] +[2023-10-08 18:42:00,583][21194] Updated weights for policy 1, policy_version 72710 (0.0009) +[2023-10-08 18:42:00,945][21194] Updated weights for policy 1, policy_version 72720 (0.0008) +[2023-10-08 18:42:01,309][21194] Updated weights for policy 1, policy_version 72730 (0.0007) +[2023-10-08 18:42:02,484][21195] Updated weights for policy 0, policy_version 73290 (0.0008) +[2023-10-08 18:42:02,842][21195] Updated weights for policy 0, policy_version 73300 (0.0008) +[2023-10-08 18:42:03,212][21195] Updated weights for policy 0, policy_version 73310 (0.0010) +[2023-10-08 18:42:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 149553152. Throughput: 0: 1734.3, 1: 1707.3. Samples: 37392806. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:42:03,803][19739] Avg episode reward: [(0, '1052.140'), (1, '1057.460')] +[2023-10-08 18:42:05,387][21194] Updated weights for policy 1, policy_version 72740 (0.0007) +[2023-10-08 18:42:05,748][21194] Updated weights for policy 1, policy_version 72750 (0.0008) +[2023-10-08 18:42:06,125][21194] Updated weights for policy 1, policy_version 72760 (0.0010) +[2023-10-08 18:42:07,198][21195] Updated weights for policy 0, policy_version 73320 (0.0008) +[2023-10-08 18:42:07,571][21195] Updated weights for policy 0, policy_version 73330 (0.0007) +[2023-10-08 18:42:07,944][21195] Updated weights for policy 0, policy_version 73340 (0.0008) +[2023-10-08 18:42:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 149618688. Throughput: 0: 1763.6, 1: 1698.3. Samples: 37409050. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:42:08,803][19739] Avg episode reward: [(0, '1051.680'), (1, '1057.460')] +[2023-10-08 18:42:09,944][21194] Updated weights for policy 1, policy_version 72770 (0.0009) +[2023-10-08 18:42:10,303][21194] Updated weights for policy 1, policy_version 72780 (0.0008) +[2023-10-08 18:42:10,672][21194] Updated weights for policy 1, policy_version 72790 (0.0011) +[2023-10-08 18:42:11,033][21194] Updated weights for policy 1, policy_version 72800 (0.0008) +[2023-10-08 18:42:11,869][21195] Updated weights for policy 0, policy_version 73350 (0.0009) +[2023-10-08 18:42:12,243][21195] Updated weights for policy 0, policy_version 73360 (0.0007) +[2023-10-08 18:42:12,607][21195] Updated weights for policy 0, policy_version 73370 (0.0010) +[2023-10-08 18:42:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 149684224. Throughput: 0: 1732.8, 1: 1729.2. Samples: 37429468. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 18:42:13,803][19739] Avg episode reward: [(0, '1051.680'), (1, '1057.480')] +[2023-10-08 18:42:14,969][21194] Updated weights for policy 1, policy_version 72810 (0.0007) +[2023-10-08 18:42:15,333][21194] Updated weights for policy 1, policy_version 72820 (0.0009) +[2023-10-08 18:42:15,703][21194] Updated weights for policy 1, policy_version 72830 (0.0010) +[2023-10-08 18:42:16,468][21195] Updated weights for policy 0, policy_version 73380 (0.0008) +[2023-10-08 18:42:16,837][21195] Updated weights for policy 0, policy_version 73390 (0.0008) +[2023-10-08 18:42:17,193][21195] Updated weights for policy 0, policy_version 73400 (0.0007) +[2023-10-08 18:42:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 149749760. Throughput: 0: 1725.6, 1: 1705.1. Samples: 37444734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:18,803][19739] Avg episode reward: [(0, '1051.680'), (1, '1057.480')] +[2023-10-08 18:42:19,681][21194] Updated weights for policy 1, policy_version 72840 (0.0010) +[2023-10-08 18:42:20,038][21194] Updated weights for policy 1, policy_version 72850 (0.0010) +[2023-10-08 18:42:20,402][21194] Updated weights for policy 1, policy_version 72860 (0.0008) +[2023-10-08 18:42:21,174][21195] Updated weights for policy 0, policy_version 73410 (0.0008) +[2023-10-08 18:42:21,539][21195] Updated weights for policy 0, policy_version 73420 (0.0008) +[2023-10-08 18:42:21,908][21195] Updated weights for policy 0, policy_version 73430 (0.0010) +[2023-10-08 18:42:22,276][21195] Updated weights for policy 0, policy_version 73440 (0.0007) +[2023-10-08 18:42:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 149815296. Throughput: 0: 1736.7, 1: 1720.5. Samples: 37460734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:23,803][19739] Avg episode reward: [(0, '1051.680'), (1, '1057.480')] +[2023-10-08 18:42:24,262][21194] Updated weights for policy 1, policy_version 72870 (0.0010) +[2023-10-08 18:42:24,634][21194] Updated weights for policy 1, policy_version 72880 (0.0008) +[2023-10-08 18:42:24,998][21194] Updated weights for policy 1, policy_version 72890 (0.0007) +[2023-10-08 18:42:26,027][21195] Updated weights for policy 0, policy_version 73450 (0.0009) +[2023-10-08 18:42:26,398][21195] Updated weights for policy 0, policy_version 73460 (0.0007) +[2023-10-08 18:42:26,766][21195] Updated weights for policy 0, policy_version 73470 (0.0007) +[2023-10-08 18:42:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 149880832. Throughput: 0: 1726.3, 1: 1744.9. Samples: 37481746. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:28,803][19739] Avg episode reward: [(0, '1067.260'), (1, '1057.480')] +[2023-10-08 18:42:28,974][21194] Updated weights for policy 1, policy_version 72900 (0.0007) +[2023-10-08 18:42:29,346][21194] Updated weights for policy 1, policy_version 72910 (0.0008) +[2023-10-08 18:42:29,717][21194] Updated weights for policy 1, policy_version 72920 (0.0008) +[2023-10-08 18:42:30,711][21195] Updated weights for policy 0, policy_version 73480 (0.0008) +[2023-10-08 18:42:31,074][21195] Updated weights for policy 0, policy_version 73490 (0.0010) +[2023-10-08 18:42:31,443][21195] Updated weights for policy 0, policy_version 73500 (0.0008) +[2023-10-08 18:42:33,604][21194] Updated weights for policy 1, policy_version 72930 (0.0009) +[2023-10-08 18:42:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 149946368. Throughput: 0: 1737.1, 1: 1717.7. Samples: 37497062. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:33,803][19739] Avg episode reward: [(0, '1067.240'), (1, '1057.480')] +[2023-10-08 18:42:34,001][21194] Updated weights for policy 1, policy_version 72940 (0.0009) +[2023-10-08 18:42:34,359][21194] Updated weights for policy 1, policy_version 72950 (0.0007) +[2023-10-08 18:42:34,738][21194] Updated weights for policy 1, policy_version 72960 (0.0008) +[2023-10-08 18:42:35,330][21195] Updated weights for policy 0, policy_version 73510 (0.0011) +[2023-10-08 18:42:35,705][21195] Updated weights for policy 0, policy_version 73520 (0.0010) +[2023-10-08 18:42:36,083][21195] Updated weights for policy 0, policy_version 73530 (0.0010) +[2023-10-08 18:42:38,678][21194] Updated weights for policy 1, policy_version 72970 (0.0007) +[2023-10-08 18:42:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 150011904. Throughput: 0: 1722.6, 1: 1746.8. Samples: 37512550. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:38,803][19739] Avg episode reward: [(0, '1009.390'), (1, '1057.480')] +[2023-10-08 18:42:39,044][21194] Updated weights for policy 1, policy_version 72980 (0.0008) +[2023-10-08 18:42:39,401][21194] Updated weights for policy 1, policy_version 72990 (0.0009) +[2023-10-08 18:42:39,699][21195] Updated weights for policy 0, policy_version 73540 (0.0009) +[2023-10-08 18:42:40,070][21195] Updated weights for policy 0, policy_version 73550 (0.0008) +[2023-10-08 18:42:40,437][21195] Updated weights for policy 0, policy_version 73560 (0.0008) +[2023-10-08 18:42:43,186][21194] Updated weights for policy 1, policy_version 73000 (0.0007) +[2023-10-08 18:42:43,544][21194] Updated weights for policy 1, policy_version 73010 (0.0008) +[2023-10-08 18:42:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 150077440. Throughput: 0: 1729.0, 1: 1751.7. Samples: 37534294. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:43,803][19739] Avg episode reward: [(0, '993.940'), (1, '1072.590')] +[2023-10-08 18:42:43,912][21194] Updated weights for policy 1, policy_version 73020 (0.0009) +[2023-10-08 18:42:44,258][21195] Updated weights for policy 0, policy_version 73570 (0.0007) +[2023-10-08 18:42:44,616][21195] Updated weights for policy 0, policy_version 73580 (0.0008) +[2023-10-08 18:42:44,985][21195] Updated weights for policy 0, policy_version 73590 (0.0009) +[2023-10-08 18:42:45,352][21195] Updated weights for policy 0, policy_version 73600 (0.0008) +[2023-10-08 18:42:47,940][21194] Updated weights for policy 1, policy_version 73030 (0.0008) +[2023-10-08 18:42:48,302][21194] Updated weights for policy 1, policy_version 73040 (0.0010) +[2023-10-08 18:42:48,670][21194] Updated weights for policy 1, policy_version 73050 (0.0009) +[2023-10-08 18:42:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 150142976. Throughput: 0: 1753.7, 1: 1741.0. Samples: 37550066. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:48,803][19739] Avg episode reward: [(0, '993.940'), (1, '1072.590')] +[2023-10-08 18:42:49,386][21195] Updated weights for policy 0, policy_version 73610 (0.0009) +[2023-10-08 18:42:49,748][21195] Updated weights for policy 0, policy_version 73620 (0.0008) +[2023-10-08 18:42:50,117][21195] Updated weights for policy 0, policy_version 73630 (0.0010) +[2023-10-08 18:42:52,569][21194] Updated weights for policy 1, policy_version 73060 (0.0009) +[2023-10-08 18:42:52,939][21194] Updated weights for policy 1, policy_version 73070 (0.0011) +[2023-10-08 18:42:53,306][21194] Updated weights for policy 1, policy_version 73080 (0.0009) +[2023-10-08 18:42:53,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 150241280. Throughput: 0: 1724.9, 1: 1751.4. Samples: 37565484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:53,803][19739] Avg episode reward: [(0, '909.290'), (1, '1072.590')] +[2023-10-08 18:42:53,952][21195] Updated weights for policy 0, policy_version 73640 (0.0009) +[2023-10-08 18:42:54,321][21195] Updated weights for policy 0, policy_version 73650 (0.0008) +[2023-10-08 18:42:54,691][21195] Updated weights for policy 0, policy_version 73660 (0.0008) +[2023-10-08 18:42:57,176][21194] Updated weights for policy 1, policy_version 73090 (0.0008) +[2023-10-08 18:42:57,540][21194] Updated weights for policy 1, policy_version 73100 (0.0008) +[2023-10-08 18:42:57,905][21194] Updated weights for policy 1, policy_version 73110 (0.0011) +[2023-10-08 18:42:58,273][21194] Updated weights for policy 1, policy_version 73120 (0.0008) +[2023-10-08 18:42:58,611][21195] Updated weights for policy 0, policy_version 73670 (0.0008) +[2023-10-08 18:42:58,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 150306816. Throughput: 0: 1760.5, 1: 1721.4. Samples: 37586152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:42:58,804][19739] Avg episode reward: [(0, '909.290'), (1, '1072.330')] +[2023-10-08 18:42:58,981][21195] Updated weights for policy 0, policy_version 73680 (0.0009) +[2023-10-08 18:42:59,349][21195] Updated weights for policy 0, policy_version 73690 (0.0007) +[2023-10-08 18:43:02,244][21194] Updated weights for policy 1, policy_version 73130 (0.0008) +[2023-10-08 18:43:02,617][21194] Updated weights for policy 1, policy_version 73140 (0.0007) +[2023-10-08 18:43:02,986][21194] Updated weights for policy 1, policy_version 73150 (0.0007) +[2023-10-08 18:43:03,349][21195] Updated weights for policy 0, policy_version 73700 (0.0008) +[2023-10-08 18:43:03,715][21195] Updated weights for policy 0, policy_version 73710 (0.0007) +[2023-10-08 18:43:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 150372352. Throughput: 0: 1751.7, 1: 1741.8. Samples: 37601940. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:43:03,803][19739] Avg episode reward: [(0, '894.460'), (1, '1072.330')] +[2023-10-08 18:43:04,083][21195] Updated weights for policy 0, policy_version 73720 (0.0008) +[2023-10-08 18:43:06,821][21194] Updated weights for policy 1, policy_version 73160 (0.0008) +[2023-10-08 18:43:07,189][21194] Updated weights for policy 1, policy_version 73170 (0.0007) +[2023-10-08 18:43:07,554][21194] Updated weights for policy 1, policy_version 73180 (0.0008) +[2023-10-08 18:43:07,818][21195] Updated weights for policy 0, policy_version 73730 (0.0009) +[2023-10-08 18:43:08,187][21195] Updated weights for policy 0, policy_version 73740 (0.0010) +[2023-10-08 18:43:08,564][21195] Updated weights for policy 0, policy_version 73750 (0.0008) +[2023-10-08 18:43:08,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 150437888. Throughput: 0: 1757.0, 1: 1734.4. Samples: 37617846. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:08,803][19739] Avg episode reward: [(0, '894.460'), (1, '1072.330')] +[2023-10-08 18:43:08,936][21195] Updated weights for policy 0, policy_version 73760 (0.0008) +[2023-10-08 18:43:11,483][21194] Updated weights for policy 1, policy_version 73190 (0.0008) +[2023-10-08 18:43:11,840][21194] Updated weights for policy 1, policy_version 73200 (0.0010) +[2023-10-08 18:43:12,203][21194] Updated weights for policy 1, policy_version 73210 (0.0011) +[2023-10-08 18:43:13,026][21195] Updated weights for policy 0, policy_version 73770 (0.0009) +[2023-10-08 18:43:13,397][21195] Updated weights for policy 0, policy_version 73780 (0.0007) +[2023-10-08 18:43:13,768][21195] Updated weights for policy 0, policy_version 73790 (0.0007) +[2023-10-08 18:43:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 150503424. Throughput: 0: 1763.7, 1: 1717.1. Samples: 37638382. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:13,803][19739] Avg episode reward: [(0, '889.600'), (1, '1072.330')] +[2023-10-08 18:43:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000073216_74973184.pth... +[2023-10-08 18:43:13,833][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000073792_75563008.pth... +[2023-10-08 18:43:13,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000071616_73334784.pth +[2023-10-08 18:43:13,872][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000072160_73891840.pth +[2023-10-08 18:43:16,175][21194] Updated weights for policy 1, policy_version 73220 (0.0009) +[2023-10-08 18:43:16,533][21194] Updated weights for policy 1, policy_version 73230 (0.0008) +[2023-10-08 18:43:16,896][21194] Updated weights for policy 1, policy_version 73240 (0.0007) +[2023-10-08 18:43:17,769][21195] Updated weights for policy 0, policy_version 73800 (0.0008) +[2023-10-08 18:43:18,142][21195] Updated weights for policy 0, policy_version 73810 (0.0008) +[2023-10-08 18:43:18,501][21195] Updated weights for policy 0, policy_version 73820 (0.0007) +[2023-10-08 18:43:18,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 150601728. Throughput: 0: 1737.7, 1: 1748.5. Samples: 37653944. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:18,804][19739] Avg episode reward: [(0, '889.600'), (1, '1072.330')] +[2023-10-08 18:43:20,872][21194] Updated weights for policy 1, policy_version 73250 (0.0008) +[2023-10-08 18:43:21,245][21194] Updated weights for policy 1, policy_version 73260 (0.0009) +[2023-10-08 18:43:21,607][21194] Updated weights for policy 1, policy_version 73270 (0.0010) +[2023-10-08 18:43:21,969][21194] Updated weights for policy 1, policy_version 73280 (0.0009) +[2023-10-08 18:43:22,465][21195] Updated weights for policy 0, policy_version 73830 (0.0008) +[2023-10-08 18:43:22,832][21195] Updated weights for policy 0, policy_version 73840 (0.0009) +[2023-10-08 18:43:23,206][21195] Updated weights for policy 0, policy_version 73850 (0.0009) +[2023-10-08 18:43:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 150667264. Throughput: 0: 1768.6, 1: 1716.9. Samples: 37669398. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:23,803][19739] Avg episode reward: [(0, '889.600'), (1, '1072.330')] +[2023-10-08 18:43:26,069][21194] Updated weights for policy 1, policy_version 73290 (0.0007) +[2023-10-08 18:43:26,447][21194] Updated weights for policy 1, policy_version 73300 (0.0009) +[2023-10-08 18:43:26,817][21194] Updated weights for policy 1, policy_version 73310 (0.0008) +[2023-10-08 18:43:26,901][21195] Updated weights for policy 0, policy_version 73860 (0.0009) +[2023-10-08 18:43:27,278][21195] Updated weights for policy 0, policy_version 73870 (0.0007) +[2023-10-08 18:43:27,653][21195] Updated weights for policy 0, policy_version 73880 (0.0009) +[2023-10-08 18:43:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 150732800. Throughput: 0: 1741.6, 1: 1711.8. Samples: 37689698. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:28,803][19739] Avg episode reward: [(0, '889.600'), (1, '1072.330')] +[2023-10-08 18:43:30,829][21194] Updated weights for policy 1, policy_version 73320 (0.0008) +[2023-10-08 18:43:31,204][21194] Updated weights for policy 1, policy_version 73330 (0.0008) +[2023-10-08 18:43:31,562][21194] Updated weights for policy 1, policy_version 73340 (0.0008) +[2023-10-08 18:43:31,570][21195] Updated weights for policy 0, policy_version 73890 (0.0009) +[2023-10-08 18:43:31,935][21195] Updated weights for policy 0, policy_version 73900 (0.0008) +[2023-10-08 18:43:32,306][21195] Updated weights for policy 0, policy_version 73910 (0.0009) +[2023-10-08 18:43:32,673][21195] Updated weights for policy 0, policy_version 73920 (0.0011) +[2023-10-08 18:43:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 150798336. Throughput: 0: 1731.7, 1: 1722.8. Samples: 37705516. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:33,803][19739] Avg episode reward: [(0, '865.610'), (1, '1072.330')] +[2023-10-08 18:43:35,552][21194] Updated weights for policy 1, policy_version 73350 (0.0008) +[2023-10-08 18:43:35,927][21194] Updated weights for policy 1, policy_version 73360 (0.0009) +[2023-10-08 18:43:36,291][21194] Updated weights for policy 1, policy_version 73370 (0.0008) +[2023-10-08 18:43:36,593][21195] Updated weights for policy 0, policy_version 73930 (0.0009) +[2023-10-08 18:43:36,962][21195] Updated weights for policy 0, policy_version 73940 (0.0009) +[2023-10-08 18:43:37,326][21195] Updated weights for policy 0, policy_version 73950 (0.0007) +[2023-10-08 18:43:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 150863872. Throughput: 0: 1749.6, 1: 1704.0. Samples: 37720896. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:38,803][19739] Avg episode reward: [(0, '865.610'), (1, '1071.710')] +[2023-10-08 18:43:40,183][21194] Updated weights for policy 1, policy_version 73380 (0.0007) +[2023-10-08 18:43:40,559][21194] Updated weights for policy 1, policy_version 73390 (0.0007) +[2023-10-08 18:43:40,923][21194] Updated weights for policy 1, policy_version 73400 (0.0009) +[2023-10-08 18:43:41,214][21195] Updated weights for policy 0, policy_version 73960 (0.0007) +[2023-10-08 18:43:41,579][21195] Updated weights for policy 0, policy_version 73970 (0.0007) +[2023-10-08 18:43:41,953][21195] Updated weights for policy 0, policy_version 73980 (0.0008) +[2023-10-08 18:43:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 150929408. Throughput: 0: 1727.1, 1: 1731.0. Samples: 37741766. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:43,803][19739] Avg episode reward: [(0, '865.610'), (1, '1071.710')] +[2023-10-08 18:43:44,795][21194] Updated weights for policy 1, policy_version 73410 (0.0007) +[2023-10-08 18:43:45,157][21194] Updated weights for policy 1, policy_version 73420 (0.0007) +[2023-10-08 18:43:45,516][21194] Updated weights for policy 1, policy_version 73430 (0.0011) +[2023-10-08 18:43:45,806][21195] Updated weights for policy 0, policy_version 73990 (0.0008) +[2023-10-08 18:43:45,881][21194] Updated weights for policy 1, policy_version 73440 (0.0008) +[2023-10-08 18:43:46,182][21195] Updated weights for policy 0, policy_version 74000 (0.0008) +[2023-10-08 18:43:46,554][21195] Updated weights for policy 0, policy_version 74010 (0.0010) +[2023-10-08 18:43:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 150994944. Throughput: 0: 1736.1, 1: 1709.6. Samples: 37756994. Policy #0 lag: (min: 3.0, avg: 8.3, max: 35.0) +[2023-10-08 18:43:48,803][19739] Avg episode reward: [(0, '865.610'), (1, '1071.680')] +[2023-10-08 18:43:49,750][21194] Updated weights for policy 1, policy_version 73450 (0.0011) +[2023-10-08 18:43:50,120][21194] Updated weights for policy 1, policy_version 73460 (0.0009) +[2023-10-08 18:43:50,480][21194] Updated weights for policy 1, policy_version 73470 (0.0009) +[2023-10-08 18:43:50,487][21195] Updated weights for policy 0, policy_version 74020 (0.0010) +[2023-10-08 18:43:50,853][21195] Updated weights for policy 0, policy_version 74030 (0.0009) +[2023-10-08 18:43:51,220][21195] Updated weights for policy 0, policy_version 74040 (0.0010) +[2023-10-08 18:43:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 151060480. Throughput: 0: 1717.6, 1: 1719.1. Samples: 37772498. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:43:53,804][19739] Avg episode reward: [(0, '865.610'), (1, '1071.680')] +[2023-10-08 18:43:54,398][21194] Updated weights for policy 1, policy_version 73480 (0.0008) +[2023-10-08 18:43:54,769][21194] Updated weights for policy 1, policy_version 73490 (0.0007) +[2023-10-08 18:43:55,136][21194] Updated weights for policy 1, policy_version 73500 (0.0008) +[2023-10-08 18:43:55,337][21195] Updated weights for policy 0, policy_version 74050 (0.0009) +[2023-10-08 18:43:55,705][21195] Updated weights for policy 0, policy_version 74060 (0.0007) +[2023-10-08 18:43:56,077][21195] Updated weights for policy 0, policy_version 74070 (0.0009) +[2023-10-08 18:43:56,443][21195] Updated weights for policy 0, policy_version 74080 (0.0009) +[2023-10-08 18:43:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 151126016. Throughput: 0: 1719.6, 1: 1736.0. Samples: 37793884. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:43:58,804][19739] Avg episode reward: [(0, '852.920'), (1, '1071.680')] +[2023-10-08 18:43:59,193][21194] Updated weights for policy 1, policy_version 73510 (0.0010) +[2023-10-08 18:43:59,560][21194] Updated weights for policy 1, policy_version 73520 (0.0010) +[2023-10-08 18:43:59,926][21194] Updated weights for policy 1, policy_version 73530 (0.0007) +[2023-10-08 18:44:00,280][21195] Updated weights for policy 0, policy_version 74090 (0.0010) +[2023-10-08 18:44:00,646][21195] Updated weights for policy 0, policy_version 74100 (0.0010) +[2023-10-08 18:44:01,012][21195] Updated weights for policy 0, policy_version 74110 (0.0009) +[2023-10-08 18:44:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 151191552. Throughput: 0: 1748.9, 1: 1701.4. Samples: 37809204. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:03,803][19739] Avg episode reward: [(0, '852.920'), (1, '1071.680')] +[2023-10-08 18:44:03,884][21194] Updated weights for policy 1, policy_version 73540 (0.0007) +[2023-10-08 18:44:04,257][21194] Updated weights for policy 1, policy_version 73550 (0.0009) +[2023-10-08 18:44:04,632][21194] Updated weights for policy 1, policy_version 73560 (0.0007) +[2023-10-08 18:44:05,016][21195] Updated weights for policy 0, policy_version 74120 (0.0007) +[2023-10-08 18:44:05,393][21195] Updated weights for policy 0, policy_version 74130 (0.0010) +[2023-10-08 18:44:05,750][21195] Updated weights for policy 0, policy_version 74140 (0.0009) +[2023-10-08 18:44:08,474][21194] Updated weights for policy 1, policy_version 73570 (0.0007) +[2023-10-08 18:44:08,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 151257088. Throughput: 0: 1716.9, 1: 1726.7. Samples: 37824360. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:08,803][19739] Avg episode reward: [(0, '852.920'), (1, '1071.680')] +[2023-10-08 18:44:08,850][21194] Updated weights for policy 1, policy_version 73580 (0.0009) +[2023-10-08 18:44:09,205][21194] Updated weights for policy 1, policy_version 73590 (0.0008) +[2023-10-08 18:44:09,576][21194] Updated weights for policy 1, policy_version 73600 (0.0008) +[2023-10-08 18:44:09,583][21195] Updated weights for policy 0, policy_version 74150 (0.0009) +[2023-10-08 18:44:09,956][21195] Updated weights for policy 0, policy_version 74160 (0.0009) +[2023-10-08 18:44:10,327][21195] Updated weights for policy 0, policy_version 74170 (0.0008) +[2023-10-08 18:44:13,633][21194] Updated weights for policy 1, policy_version 73610 (0.0011) +[2023-10-08 18:44:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 151322624. Throughput: 0: 1739.5, 1: 1737.6. Samples: 37846166. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:13,803][19739] Avg episode reward: [(0, '852.920'), (1, '1076.150')] +[2023-10-08 18:44:14,002][21194] Updated weights for policy 1, policy_version 73620 (0.0009) +[2023-10-08 18:44:14,324][21195] Updated weights for policy 0, policy_version 74180 (0.0008) +[2023-10-08 18:44:14,355][21194] Updated weights for policy 1, policy_version 73630 (0.0009) +[2023-10-08 18:44:14,706][21195] Updated weights for policy 0, policy_version 74190 (0.0008) +[2023-10-08 18:44:15,083][21195] Updated weights for policy 0, policy_version 74200 (0.0007) +[2023-10-08 18:44:18,239][21194] Updated weights for policy 1, policy_version 73640 (0.0009) +[2023-10-08 18:44:18,605][21194] Updated weights for policy 1, policy_version 73650 (0.0007) +[2023-10-08 18:44:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 151388160. Throughput: 0: 1744.1, 1: 1720.1. Samples: 37861404. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:18,803][19739] Avg episode reward: [(0, '852.990'), (1, '1076.150')] +[2023-10-08 18:44:18,972][21194] Updated weights for policy 1, policy_version 73660 (0.0008) +[2023-10-08 18:44:19,008][21195] Updated weights for policy 0, policy_version 74210 (0.0007) +[2023-10-08 18:44:19,382][21195] Updated weights for policy 0, policy_version 74220 (0.0008) +[2023-10-08 18:44:19,750][21195] Updated weights for policy 0, policy_version 74230 (0.0008) +[2023-10-08 18:44:20,125][21195] Updated weights for policy 0, policy_version 74240 (0.0007) +[2023-10-08 18:44:22,933][21194] Updated weights for policy 1, policy_version 73670 (0.0007) +[2023-10-08 18:44:23,305][21194] Updated weights for policy 1, policy_version 73680 (0.0007) +[2023-10-08 18:44:23,675][21194] Updated weights for policy 1, policy_version 73690 (0.0007) +[2023-10-08 18:44:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 151453696. Throughput: 0: 1726.2, 1: 1741.4. Samples: 37876938. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:23,803][19739] Avg episode reward: [(0, '852.990'), (1, '1075.480')] +[2023-10-08 18:44:24,048][21195] Updated weights for policy 0, policy_version 74250 (0.0007) +[2023-10-08 18:44:24,414][21195] Updated weights for policy 0, policy_version 74260 (0.0007) +[2023-10-08 18:44:24,792][21195] Updated weights for policy 0, policy_version 74270 (0.0007) +[2023-10-08 18:44:27,655][21194] Updated weights for policy 1, policy_version 73700 (0.0009) +[2023-10-08 18:44:28,022][21194] Updated weights for policy 1, policy_version 73710 (0.0007) +[2023-10-08 18:44:28,391][21194] Updated weights for policy 1, policy_version 73720 (0.0007) +[2023-10-08 18:44:28,529][21195] Updated weights for policy 0, policy_version 74280 (0.0009) +[2023-10-08 18:44:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 151552000. Throughput: 0: 1749.8, 1: 1723.2. Samples: 37898054. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:28,803][19739] Avg episode reward: [(0, '853.000'), (1, '1075.480')] +[2023-10-08 18:44:28,898][21195] Updated weights for policy 0, policy_version 74290 (0.0008) +[2023-10-08 18:44:29,267][21195] Updated weights for policy 0, policy_version 74300 (0.0007) +[2023-10-08 18:44:32,504][21194] Updated weights for policy 1, policy_version 73730 (0.0008) +[2023-10-08 18:44:32,872][21194] Updated weights for policy 1, policy_version 73740 (0.0007) +[2023-10-08 18:44:33,178][21195] Updated weights for policy 0, policy_version 74310 (0.0009) +[2023-10-08 18:44:33,233][21194] Updated weights for policy 1, policy_version 73750 (0.0007) +[2023-10-08 18:44:33,535][21195] Updated weights for policy 0, policy_version 74320 (0.0008) +[2023-10-08 18:44:33,598][21194] Updated weights for policy 1, policy_version 73760 (0.0009) +[2023-10-08 18:44:33,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 151617536. Throughput: 0: 1730.4, 1: 1737.1. Samples: 37913032. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:33,803][19739] Avg episode reward: [(0, '853.000'), (1, '1086.390')] +[2023-10-08 18:44:33,908][21195] Updated weights for policy 0, policy_version 74330 (0.0008) +[2023-10-08 18:44:37,547][21194] Updated weights for policy 1, policy_version 73770 (0.0009) +[2023-10-08 18:44:37,786][21195] Updated weights for policy 0, policy_version 74340 (0.0008) +[2023-10-08 18:44:37,900][21194] Updated weights for policy 1, policy_version 73780 (0.0007) +[2023-10-08 18:44:38,153][21195] Updated weights for policy 0, policy_version 74350 (0.0009) +[2023-10-08 18:44:38,263][21194] Updated weights for policy 1, policy_version 73790 (0.0009) +[2023-10-08 18:44:38,517][21195] Updated weights for policy 0, policy_version 74360 (0.0009) +[2023-10-08 18:44:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 151683072. Throughput: 0: 1750.6, 1: 1735.6. Samples: 37929378. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 18:44:38,803][19739] Avg episode reward: [(0, '853.000'), (1, '1086.390')] +[2023-10-08 18:44:42,329][21194] Updated weights for policy 1, policy_version 73800 (0.0007) +[2023-10-08 18:44:42,655][21195] Updated weights for policy 0, policy_version 74370 (0.0010) +[2023-10-08 18:44:42,692][21194] Updated weights for policy 1, policy_version 73810 (0.0008) +[2023-10-08 18:44:43,018][21195] Updated weights for policy 0, policy_version 74380 (0.0009) +[2023-10-08 18:44:43,056][21194] Updated weights for policy 1, policy_version 73820 (0.0007) +[2023-10-08 18:44:43,397][21195] Updated weights for policy 0, policy_version 74390 (0.0009) +[2023-10-08 18:44:43,763][21195] Updated weights for policy 0, policy_version 74400 (0.0009) +[2023-10-08 18:44:43,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 151781376. Throughput: 0: 1744.5, 1: 1705.6. Samples: 37949140. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:44:43,804][19739] Avg episode reward: [(0, '822.880'), (1, '1086.440')] +[2023-10-08 18:44:46,817][21194] Updated weights for policy 1, policy_version 73830 (0.0008) +[2023-10-08 18:44:47,187][21194] Updated weights for policy 1, policy_version 73840 (0.0008) +[2023-10-08 18:44:47,558][21194] Updated weights for policy 1, policy_version 73850 (0.0009) +[2023-10-08 18:44:47,806][21195] Updated weights for policy 0, policy_version 74410 (0.0008) +[2023-10-08 18:44:48,176][21195] Updated weights for policy 0, policy_version 74420 (0.0009) +[2023-10-08 18:44:48,545][21195] Updated weights for policy 0, policy_version 74430 (0.0009) +[2023-10-08 18:44:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 151846912. Throughput: 0: 1710.8, 1: 1733.4. Samples: 37964194. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:44:48,803][19739] Avg episode reward: [(0, '822.880'), (1, '1071.500')] +[2023-10-08 18:44:51,711][21194] Updated weights for policy 1, policy_version 73860 (0.0007) +[2023-10-08 18:44:52,074][21194] Updated weights for policy 1, policy_version 73870 (0.0009) +[2023-10-08 18:44:52,426][21195] Updated weights for policy 0, policy_version 74440 (0.0008) +[2023-10-08 18:44:52,447][21194] Updated weights for policy 1, policy_version 73880 (0.0007) +[2023-10-08 18:44:52,796][21195] Updated weights for policy 0, policy_version 74450 (0.0007) +[2023-10-08 18:44:53,161][21195] Updated weights for policy 0, policy_version 74460 (0.0010) +[2023-10-08 18:44:53,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 151912448. Throughput: 0: 1741.1, 1: 1729.8. Samples: 37980550. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:44:53,803][19739] Avg episode reward: [(0, '822.920'), (1, '1071.600')] +[2023-10-08 18:44:56,387][21194] Updated weights for policy 1, policy_version 73890 (0.0007) +[2023-10-08 18:44:56,754][21194] Updated weights for policy 1, policy_version 73900 (0.0007) +[2023-10-08 18:44:57,090][21195] Updated weights for policy 0, policy_version 74470 (0.0010) +[2023-10-08 18:44:57,112][21194] Updated weights for policy 1, policy_version 73910 (0.0007) +[2023-10-08 18:44:57,454][21195] Updated weights for policy 0, policy_version 74480 (0.0008) +[2023-10-08 18:44:57,481][21194] Updated weights for policy 1, policy_version 73920 (0.0008) +[2023-10-08 18:44:57,818][21195] Updated weights for policy 0, policy_version 74490 (0.0011) +[2023-10-08 18:44:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 151977984. Throughput: 0: 1715.6, 1: 1702.4. Samples: 37999976. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:44:58,803][19739] Avg episode reward: [(0, '822.920'), (1, '1071.600')] +[2023-10-08 18:45:01,433][21194] Updated weights for policy 1, policy_version 73930 (0.0009) +[2023-10-08 18:45:01,795][21194] Updated weights for policy 1, policy_version 73940 (0.0009) +[2023-10-08 18:45:01,820][21195] Updated weights for policy 0, policy_version 74500 (0.0008) +[2023-10-08 18:45:02,165][21194] Updated weights for policy 1, policy_version 73950 (0.0008) +[2023-10-08 18:45:02,187][21195] Updated weights for policy 0, policy_version 74510 (0.0007) +[2023-10-08 18:45:02,559][21195] Updated weights for policy 0, policy_version 74520 (0.0008) +[2023-10-08 18:45:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 152043520. Throughput: 0: 1705.7, 1: 1736.0. Samples: 38016278. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:45:03,803][19739] Avg episode reward: [(0, '837.600'), (1, '1071.600')] +[2023-10-08 18:45:05,953][21194] Updated weights for policy 1, policy_version 73960 (0.0010) +[2023-10-08 18:45:06,319][21194] Updated weights for policy 1, policy_version 73970 (0.0011) +[2023-10-08 18:45:06,542][21195] Updated weights for policy 0, policy_version 74530 (0.0009) +[2023-10-08 18:45:06,683][21194] Updated weights for policy 1, policy_version 73980 (0.0009) +[2023-10-08 18:45:06,914][21195] Updated weights for policy 0, policy_version 74540 (0.0008) +[2023-10-08 18:45:07,275][21195] Updated weights for policy 0, policy_version 74550 (0.0009) +[2023-10-08 18:45:07,649][21195] Updated weights for policy 0, policy_version 74560 (0.0010) +[2023-10-08 18:45:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 152109056. Throughput: 0: 1727.1, 1: 1700.1. Samples: 38031162. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:45:08,803][19739] Avg episode reward: [(0, '837.600'), (1, '1071.600')] +[2023-10-08 18:45:10,731][21194] Updated weights for policy 1, policy_version 73990 (0.0007) +[2023-10-08 18:45:11,100][21194] Updated weights for policy 1, policy_version 74000 (0.0011) +[2023-10-08 18:45:11,462][21194] Updated weights for policy 1, policy_version 74010 (0.0007) +[2023-10-08 18:45:11,609][21195] Updated weights for policy 0, policy_version 74570 (0.0007) +[2023-10-08 18:45:11,979][21195] Updated weights for policy 0, policy_version 74580 (0.0008) +[2023-10-08 18:45:12,343][21195] Updated weights for policy 0, policy_version 74590 (0.0009) +[2023-10-08 18:45:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 152174592. Throughput: 0: 1694.6, 1: 1714.7. Samples: 38051474. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:45:13,803][19739] Avg episode reward: [(0, '837.600'), (1, '1071.600')] +[2023-10-08 18:45:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000074016_75792384.pth... +[2023-10-08 18:45:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000074592_76382208.pth... +[2023-10-08 18:45:13,849][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000072416_74153984.pth +[2023-10-08 18:45:13,857][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000072960_74711040.pth +[2023-10-08 18:45:15,318][21194] Updated weights for policy 1, policy_version 74020 (0.0010) +[2023-10-08 18:45:15,695][21194] Updated weights for policy 1, policy_version 74030 (0.0009) +[2023-10-08 18:45:16,060][21194] Updated weights for policy 1, policy_version 74040 (0.0008) +[2023-10-08 18:45:16,276][21195] Updated weights for policy 0, policy_version 74600 (0.0007) +[2023-10-08 18:45:16,645][21195] Updated weights for policy 0, policy_version 74610 (0.0007) +[2023-10-08 18:45:17,024][21195] Updated weights for policy 0, policy_version 74620 (0.0009) +[2023-10-08 18:45:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 152240128. Throughput: 0: 1713.7, 1: 1711.3. Samples: 38067158. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:45:18,803][19739] Avg episode reward: [(0, '837.600'), (1, '1071.530')] +[2023-10-08 18:45:20,109][21194] Updated weights for policy 1, policy_version 74050 (0.0007) +[2023-10-08 18:45:20,476][21194] Updated weights for policy 1, policy_version 74060 (0.0008) +[2023-10-08 18:45:20,840][21194] Updated weights for policy 1, policy_version 74070 (0.0008) +[2023-10-08 18:45:21,051][21195] Updated weights for policy 0, policy_version 74630 (0.0009) +[2023-10-08 18:45:21,207][21194] Updated weights for policy 1, policy_version 74080 (0.0008) +[2023-10-08 18:45:21,416][21195] Updated weights for policy 0, policy_version 74640 (0.0008) +[2023-10-08 18:45:21,796][21195] Updated weights for policy 0, policy_version 74650 (0.0008) +[2023-10-08 18:45:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 152305664. Throughput: 0: 1701.4, 1: 1699.2. Samples: 38082404. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 18:45:23,803][19739] Avg episode reward: [(0, '837.600'), (1, '1071.530')] +[2023-10-08 18:45:25,173][21194] Updated weights for policy 1, policy_version 74090 (0.0007) +[2023-10-08 18:45:25,438][21195] Updated weights for policy 0, policy_version 74660 (0.0007) +[2023-10-08 18:45:25,542][21194] Updated weights for policy 1, policy_version 74100 (0.0008) +[2023-10-08 18:45:25,810][21195] Updated weights for policy 0, policy_version 74670 (0.0007) +[2023-10-08 18:45:25,905][21194] Updated weights for policy 1, policy_version 74110 (0.0007) +[2023-10-08 18:45:26,172][21195] Updated weights for policy 0, policy_version 74680 (0.0007) +[2023-10-08 18:45:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 152371200. Throughput: 0: 1711.4, 1: 1726.7. Samples: 38103854. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:28,803][19739] Avg episode reward: [(0, '837.600'), (1, '1071.530')] +[2023-10-08 18:45:29,818][21194] Updated weights for policy 1, policy_version 74120 (0.0008) +[2023-10-08 18:45:30,187][21195] Updated weights for policy 0, policy_version 74690 (0.0009) +[2023-10-08 18:45:30,188][21194] Updated weights for policy 1, policy_version 74130 (0.0007) +[2023-10-08 18:45:30,553][21194] Updated weights for policy 1, policy_version 74140 (0.0008) +[2023-10-08 18:45:30,554][21195] Updated weights for policy 0, policy_version 74700 (0.0007) +[2023-10-08 18:45:30,925][21195] Updated weights for policy 0, policy_version 74710 (0.0008) +[2023-10-08 18:45:31,288][21195] Updated weights for policy 0, policy_version 74720 (0.0007) +[2023-10-08 18:45:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 152436736. Throughput: 0: 1744.6, 1: 1703.2. Samples: 38119344. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:33,804][19739] Avg episode reward: [(0, '837.600'), (1, '1071.530')] +[2023-10-08 18:45:34,456][21194] Updated weights for policy 1, policy_version 74150 (0.0009) +[2023-10-08 18:45:34,821][21194] Updated weights for policy 1, policy_version 74160 (0.0008) +[2023-10-08 18:45:35,192][21194] Updated weights for policy 1, policy_version 74170 (0.0008) +[2023-10-08 18:45:35,210][21195] Updated weights for policy 0, policy_version 74730 (0.0008) +[2023-10-08 18:45:35,573][21195] Updated weights for policy 0, policy_version 74740 (0.0008) +[2023-10-08 18:45:35,954][21195] Updated weights for policy 0, policy_version 74750 (0.0010) +[2023-10-08 18:45:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 152502272. Throughput: 0: 1711.0, 1: 1712.4. Samples: 38134604. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:38,803][19739] Avg episode reward: [(0, '837.600'), (1, '1085.350')] +[2023-10-08 18:45:39,166][21194] Updated weights for policy 1, policy_version 74180 (0.0009) +[2023-10-08 18:45:39,530][21194] Updated weights for policy 1, policy_version 74190 (0.0009) +[2023-10-08 18:45:39,855][21195] Updated weights for policy 0, policy_version 74760 (0.0009) +[2023-10-08 18:45:39,900][21194] Updated weights for policy 1, policy_version 74200 (0.0008) +[2023-10-08 18:45:40,224][21195] Updated weights for policy 0, policy_version 74770 (0.0008) +[2023-10-08 18:45:40,585][21195] Updated weights for policy 0, policy_version 74780 (0.0008) +[2023-10-08 18:45:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 152567808. Throughput: 0: 1734.7, 1: 1729.4. Samples: 38155862. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:43,803][19739] Avg episode reward: [(0, '811.790'), (1, '1085.350')] +[2023-10-08 18:45:43,906][21194] Updated weights for policy 1, policy_version 74210 (0.0008) +[2023-10-08 18:45:44,264][21194] Updated weights for policy 1, policy_version 74220 (0.0008) +[2023-10-08 18:45:44,467][21195] Updated weights for policy 0, policy_version 74790 (0.0009) +[2023-10-08 18:45:44,630][21194] Updated weights for policy 1, policy_version 74230 (0.0007) +[2023-10-08 18:45:44,829][21195] Updated weights for policy 0, policy_version 74800 (0.0008) +[2023-10-08 18:45:44,994][21194] Updated weights for policy 1, policy_version 74240 (0.0008) +[2023-10-08 18:45:45,198][21195] Updated weights for policy 0, policy_version 74810 (0.0010) +[2023-10-08 18:45:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 152633344. Throughput: 0: 1744.1, 1: 1699.4. Samples: 38171236. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:48,803][19739] Avg episode reward: [(0, '734.500'), (1, '1085.350')] +[2023-10-08 18:45:48,929][21194] Updated weights for policy 1, policy_version 74250 (0.0010) +[2023-10-08 18:45:49,251][21195] Updated weights for policy 0, policy_version 74820 (0.0009) +[2023-10-08 18:45:49,301][21194] Updated weights for policy 1, policy_version 74260 (0.0008) +[2023-10-08 18:45:49,627][21195] Updated weights for policy 0, policy_version 74830 (0.0009) +[2023-10-08 18:45:49,657][21194] Updated weights for policy 1, policy_version 74270 (0.0007) +[2023-10-08 18:45:50,003][21195] Updated weights for policy 0, policy_version 74840 (0.0009) +[2023-10-08 18:45:53,634][21194] Updated weights for policy 1, policy_version 74280 (0.0009) +[2023-10-08 18:45:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 152698880. Throughput: 0: 1721.8, 1: 1730.0. Samples: 38186494. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:53,803][19739] Avg episode reward: [(0, '734.500'), (1, '1085.350')] +[2023-10-08 18:45:53,942][21195] Updated weights for policy 0, policy_version 74850 (0.0008) +[2023-10-08 18:45:54,000][21194] Updated weights for policy 1, policy_version 74290 (0.0007) +[2023-10-08 18:45:54,317][21195] Updated weights for policy 0, policy_version 74860 (0.0007) +[2023-10-08 18:45:54,368][21194] Updated weights for policy 1, policy_version 74300 (0.0007) +[2023-10-08 18:45:54,694][21195] Updated weights for policy 0, policy_version 74870 (0.0007) +[2023-10-08 18:45:55,069][21195] Updated weights for policy 0, policy_version 74880 (0.0007) +[2023-10-08 18:45:58,155][21194] Updated weights for policy 1, policy_version 74310 (0.0008) +[2023-10-08 18:45:58,519][21194] Updated weights for policy 1, policy_version 74320 (0.0008) +[2023-10-08 18:45:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 152764416. Throughput: 0: 1749.2, 1: 1733.2. Samples: 38208184. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:45:58,803][19739] Avg episode reward: [(0, '734.260'), (1, '1085.350')] +[2023-10-08 18:45:58,880][21194] Updated weights for policy 1, policy_version 74330 (0.0009) +[2023-10-08 18:45:58,948][21195] Updated weights for policy 0, policy_version 74890 (0.0009) +[2023-10-08 18:45:59,323][21195] Updated weights for policy 0, policy_version 74900 (0.0009) +[2023-10-08 18:45:59,689][21195] Updated weights for policy 0, policy_version 74910 (0.0009) +[2023-10-08 18:46:02,837][21194] Updated weights for policy 1, policy_version 74340 (0.0009) +[2023-10-08 18:46:03,209][21194] Updated weights for policy 1, policy_version 74350 (0.0008) +[2023-10-08 18:46:03,537][21195] Updated weights for policy 0, policy_version 74920 (0.0009) +[2023-10-08 18:46:03,563][21194] Updated weights for policy 1, policy_version 74360 (0.0009) +[2023-10-08 18:46:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 152829952. Throughput: 0: 1741.2, 1: 1725.7. Samples: 38223166. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:46:03,803][19739] Avg episode reward: [(0, '728.580'), (1, '1085.350')] +[2023-10-08 18:46:03,907][21195] Updated weights for policy 0, policy_version 74930 (0.0009) +[2023-10-08 18:46:04,276][21195] Updated weights for policy 0, policy_version 74940 (0.0008) +[2023-10-08 18:46:07,492][21194] Updated weights for policy 1, policy_version 74370 (0.0008) +[2023-10-08 18:46:07,856][21194] Updated weights for policy 1, policy_version 74380 (0.0008) +[2023-10-08 18:46:08,202][21195] Updated weights for policy 0, policy_version 74950 (0.0008) +[2023-10-08 18:46:08,215][21194] Updated weights for policy 1, policy_version 74390 (0.0009) +[2023-10-08 18:46:08,569][21195] Updated weights for policy 0, policy_version 74960 (0.0009) +[2023-10-08 18:46:08,575][21194] Updated weights for policy 1, policy_version 74400 (0.0008) +[2023-10-08 18:46:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 152928256. Throughput: 0: 1747.7, 1: 1738.5. Samples: 38239284. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:46:08,803][19739] Avg episode reward: [(0, '728.580'), (1, '1085.350')] +[2023-10-08 18:46:08,932][21195] Updated weights for policy 0, policy_version 74970 (0.0009) +[2023-10-08 18:46:12,601][21194] Updated weights for policy 1, policy_version 74410 (0.0007) +[2023-10-08 18:46:12,795][21195] Updated weights for policy 0, policy_version 74980 (0.0007) +[2023-10-08 18:46:12,965][21194] Updated weights for policy 1, policy_version 74420 (0.0007) +[2023-10-08 18:46:13,159][21195] Updated weights for policy 0, policy_version 74990 (0.0007) +[2023-10-08 18:46:13,329][21194] Updated weights for policy 1, policy_version 74430 (0.0007) +[2023-10-08 18:46:13,526][21195] Updated weights for policy 0, policy_version 75000 (0.0010) +[2023-10-08 18:46:13,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 152993792. Throughput: 0: 1740.3, 1: 1714.9. Samples: 38259336. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 18:46:13,803][19739] Avg episode reward: [(0, '697.930'), (1, '1085.350')] +[2023-10-08 18:46:17,287][21195] Updated weights for policy 0, policy_version 75010 (0.0010) +[2023-10-08 18:46:17,444][21194] Updated weights for policy 1, policy_version 74440 (0.0009) +[2023-10-08 18:46:17,661][21195] Updated weights for policy 0, policy_version 75020 (0.0007) +[2023-10-08 18:46:17,810][21194] Updated weights for policy 1, policy_version 74450 (0.0008) +[2023-10-08 18:46:18,020][21195] Updated weights for policy 0, policy_version 75030 (0.0008) +[2023-10-08 18:46:18,182][21194] Updated weights for policy 1, policy_version 74460 (0.0009) +[2023-10-08 18:46:18,397][21195] Updated weights for policy 0, policy_version 75040 (0.0009) +[2023-10-08 18:46:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 153092096. Throughput: 0: 1716.8, 1: 1733.7. Samples: 38274614. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:18,803][19739] Avg episode reward: [(0, '697.930'), (1, '1085.350')] +[2023-10-08 18:46:22,255][21194] Updated weights for policy 1, policy_version 74470 (0.0009) +[2023-10-08 18:46:22,524][21195] Updated weights for policy 0, policy_version 75050 (0.0008) +[2023-10-08 18:46:22,623][21194] Updated weights for policy 1, policy_version 74480 (0.0007) +[2023-10-08 18:46:22,886][21195] Updated weights for policy 0, policy_version 75060 (0.0007) +[2023-10-08 18:46:22,985][21194] Updated weights for policy 1, policy_version 74490 (0.0007) +[2023-10-08 18:46:23,251][21195] Updated weights for policy 0, policy_version 75070 (0.0008) +[2023-10-08 18:46:23,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 153157632. Throughput: 0: 1746.5, 1: 1726.0. Samples: 38290866. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:23,803][19739] Avg episode reward: [(0, '697.930'), (1, '1100.600')] +[2023-10-08 18:46:27,007][21194] Updated weights for policy 1, policy_version 74500 (0.0009) +[2023-10-08 18:46:27,140][21195] Updated weights for policy 0, policy_version 75080 (0.0007) +[2023-10-08 18:46:27,379][21194] Updated weights for policy 1, policy_version 74510 (0.0007) +[2023-10-08 18:46:27,512][21195] Updated weights for policy 0, policy_version 75090 (0.0007) +[2023-10-08 18:46:27,735][21194] Updated weights for policy 1, policy_version 74520 (0.0007) +[2023-10-08 18:46:27,877][21195] Updated weights for policy 0, policy_version 75100 (0.0007) +[2023-10-08 18:46:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 153223168. Throughput: 0: 1722.3, 1: 1698.9. Samples: 38309816. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:28,803][19739] Avg episode reward: [(0, '697.930'), (1, '1100.600')] +[2023-10-08 18:46:31,730][21194] Updated weights for policy 1, policy_version 74530 (0.0008) +[2023-10-08 18:46:31,885][21195] Updated weights for policy 0, policy_version 75110 (0.0008) +[2023-10-08 18:46:32,095][21194] Updated weights for policy 1, policy_version 74540 (0.0007) +[2023-10-08 18:46:32,262][21195] Updated weights for policy 0, policy_version 75120 (0.0008) +[2023-10-08 18:46:32,463][21194] Updated weights for policy 1, policy_version 74550 (0.0007) +[2023-10-08 18:46:32,621][21195] Updated weights for policy 0, policy_version 75130 (0.0009) +[2023-10-08 18:46:32,830][21194] Updated weights for policy 1, policy_version 74560 (0.0007) +[2023-10-08 18:46:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 153288704. Throughput: 0: 1714.8, 1: 1723.6. Samples: 38325964. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:33,803][19739] Avg episode reward: [(0, '697.930'), (1, '1100.600')] +[2023-10-08 18:46:36,569][21195] Updated weights for policy 0, policy_version 75140 (0.0009) +[2023-10-08 18:46:36,918][21194] Updated weights for policy 1, policy_version 74570 (0.0007) +[2023-10-08 18:46:36,936][21195] Updated weights for policy 0, policy_version 75150 (0.0008) +[2023-10-08 18:46:37,283][21194] Updated weights for policy 1, policy_version 74580 (0.0007) +[2023-10-08 18:46:37,309][21195] Updated weights for policy 0, policy_version 75160 (0.0007) +[2023-10-08 18:46:37,649][21194] Updated weights for policy 1, policy_version 74590 (0.0007) +[2023-10-08 18:46:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 153354240. Throughput: 0: 1737.8, 1: 1711.5. Samples: 38341712. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:38,803][19739] Avg episode reward: [(0, '697.930'), (1, '1100.600')] +[2023-10-08 18:46:41,218][21195] Updated weights for policy 0, policy_version 75170 (0.0008) +[2023-10-08 18:46:41,559][21194] Updated weights for policy 1, policy_version 74600 (0.0008) +[2023-10-08 18:46:41,587][21195] Updated weights for policy 0, policy_version 75180 (0.0007) +[2023-10-08 18:46:41,928][21194] Updated weights for policy 1, policy_version 74610 (0.0008) +[2023-10-08 18:46:41,966][21195] Updated weights for policy 0, policy_version 75190 (0.0010) +[2023-10-08 18:46:42,291][21194] Updated weights for policy 1, policy_version 74620 (0.0007) +[2023-10-08 18:46:42,330][21195] Updated weights for policy 0, policy_version 75200 (0.0007) +[2023-10-08 18:46:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 153419776. Throughput: 0: 1713.0, 1: 1693.6. Samples: 38361484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:43,803][19739] Avg episode reward: [(0, '714.230'), (1, '1100.600')] +[2023-10-08 18:46:46,140][21194] Updated weights for policy 1, policy_version 74630 (0.0008) +[2023-10-08 18:46:46,206][21195] Updated weights for policy 0, policy_version 75210 (0.0007) +[2023-10-08 18:46:46,502][21194] Updated weights for policy 1, policy_version 74640 (0.0007) +[2023-10-08 18:46:46,565][21195] Updated weights for policy 0, policy_version 75220 (0.0010) +[2023-10-08 18:46:46,866][21194] Updated weights for policy 1, policy_version 74650 (0.0007) +[2023-10-08 18:46:46,927][21195] Updated weights for policy 0, policy_version 75230 (0.0009) +[2023-10-08 18:46:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 153485312. Throughput: 0: 1720.4, 1: 1714.1. Samples: 38377720. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:48,803][19739] Avg episode reward: [(0, '661.810'), (1, '1100.600')] +[2023-10-08 18:46:50,909][21194] Updated weights for policy 1, policy_version 74660 (0.0009) +[2023-10-08 18:46:50,921][21195] Updated weights for policy 0, policy_version 75240 (0.0008) +[2023-10-08 18:46:51,277][21194] Updated weights for policy 1, policy_version 74670 (0.0008) +[2023-10-08 18:46:51,288][21195] Updated weights for policy 0, policy_version 75250 (0.0007) +[2023-10-08 18:46:51,644][21195] Updated weights for policy 0, policy_version 75260 (0.0007) +[2023-10-08 18:46:51,646][21194] Updated weights for policy 1, policy_version 74680 (0.0008) +[2023-10-08 18:46:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 153550848. Throughput: 0: 1708.8, 1: 1685.2. Samples: 38392014. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:53,803][19739] Avg episode reward: [(0, '677.330'), (1, '1115.910')] +[2023-10-08 18:46:55,540][21194] Updated weights for policy 1, policy_version 74690 (0.0009) +[2023-10-08 18:46:55,626][21195] Updated weights for policy 0, policy_version 75270 (0.0008) +[2023-10-08 18:46:55,904][21194] Updated weights for policy 1, policy_version 74700 (0.0009) +[2023-10-08 18:46:55,988][21195] Updated weights for policy 0, policy_version 75280 (0.0009) +[2023-10-08 18:46:56,272][21194] Updated weights for policy 1, policy_version 74710 (0.0008) +[2023-10-08 18:46:56,351][21195] Updated weights for policy 0, policy_version 75290 (0.0010) +[2023-10-08 18:46:56,630][21194] Updated weights for policy 1, policy_version 74720 (0.0007) +[2023-10-08 18:46:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 153616384. Throughput: 0: 1713.1, 1: 1710.3. Samples: 38413388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:46:58,804][19739] Avg episode reward: [(0, '677.330'), (1, '1100.890')] +[2023-10-08 18:47:00,437][21195] Updated weights for policy 0, policy_version 75300 (0.0008) +[2023-10-08 18:47:00,693][21194] Updated weights for policy 1, policy_version 74730 (0.0008) +[2023-10-08 18:47:00,797][21195] Updated weights for policy 0, policy_version 75310 (0.0008) +[2023-10-08 18:47:01,064][21194] Updated weights for policy 1, policy_version 74740 (0.0008) +[2023-10-08 18:47:01,172][21195] Updated weights for policy 0, policy_version 75320 (0.0009) +[2023-10-08 18:47:01,438][21194] Updated weights for policy 1, policy_version 74750 (0.0008) +[2023-10-08 18:47:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 153681920. Throughput: 0: 1734.5, 1: 1703.5. Samples: 38429328. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:03,804][19739] Avg episode reward: [(0, '677.250'), (1, '1100.890')] +[2023-10-08 18:47:05,088][21195] Updated weights for policy 0, policy_version 75330 (0.0008) +[2023-10-08 18:47:05,283][21194] Updated weights for policy 1, policy_version 74760 (0.0008) +[2023-10-08 18:47:05,462][21195] Updated weights for policy 0, policy_version 75340 (0.0008) +[2023-10-08 18:47:05,641][21194] Updated weights for policy 1, policy_version 74770 (0.0008) +[2023-10-08 18:47:05,826][21195] Updated weights for policy 0, policy_version 75350 (0.0008) +[2023-10-08 18:47:06,010][21194] Updated weights for policy 1, policy_version 74780 (0.0009) +[2023-10-08 18:47:06,189][21195] Updated weights for policy 0, policy_version 75360 (0.0008) +[2023-10-08 18:47:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 153747456. Throughput: 0: 1706.2, 1: 1700.7. Samples: 38444178. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:08,804][19739] Avg episode reward: [(0, '570.270'), (1, '1085.500')] +[2023-10-08 18:47:10,023][21194] Updated weights for policy 1, policy_version 74790 (0.0009) +[2023-10-08 18:47:10,238][21195] Updated weights for policy 0, policy_version 75370 (0.0009) +[2023-10-08 18:47:10,384][21194] Updated weights for policy 1, policy_version 74800 (0.0008) +[2023-10-08 18:47:10,615][21195] Updated weights for policy 0, policy_version 75380 (0.0010) +[2023-10-08 18:47:10,750][21194] Updated weights for policy 1, policy_version 74810 (0.0008) +[2023-10-08 18:47:10,983][21195] Updated weights for policy 0, policy_version 75390 (0.0009) +[2023-10-08 18:47:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 153812992. Throughput: 0: 1726.0, 1: 1729.3. Samples: 38465306. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:13,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.360')] +[2023-10-08 18:47:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000075392_77201408.pth... +[2023-10-08 18:47:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000074816_76611584.pth... +[2023-10-08 18:47:13,852][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000073792_75563008.pth +[2023-10-08 18:47:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000073216_74973184.pth +[2023-10-08 18:47:14,793][21194] Updated weights for policy 1, policy_version 74820 (0.0008) +[2023-10-08 18:47:14,878][21195] Updated weights for policy 0, policy_version 75400 (0.0007) +[2023-10-08 18:47:15,163][21194] Updated weights for policy 1, policy_version 74830 (0.0007) +[2023-10-08 18:47:15,249][21195] Updated weights for policy 0, policy_version 75410 (0.0008) +[2023-10-08 18:47:15,530][21194] Updated weights for policy 1, policy_version 74840 (0.0008) +[2023-10-08 18:47:15,610][21195] Updated weights for policy 0, policy_version 75420 (0.0008) +[2023-10-08 18:47:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 153878528. Throughput: 0: 1736.8, 1: 1704.8. Samples: 38480836. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:18,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.360')] +[2023-10-08 18:47:19,358][21194] Updated weights for policy 1, policy_version 74850 (0.0008) +[2023-10-08 18:47:19,581][21195] Updated weights for policy 0, policy_version 75430 (0.0008) +[2023-10-08 18:47:19,735][21194] Updated weights for policy 1, policy_version 74860 (0.0008) +[2023-10-08 18:47:19,956][21195] Updated weights for policy 0, policy_version 75440 (0.0007) +[2023-10-08 18:47:20,093][21194] Updated weights for policy 1, policy_version 74870 (0.0010) +[2023-10-08 18:47:20,318][21195] Updated weights for policy 0, policy_version 75450 (0.0007) +[2023-10-08 18:47:20,455][21194] Updated weights for policy 1, policy_version 74880 (0.0008) +[2023-10-08 18:47:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 153944064. Throughput: 0: 1715.3, 1: 1715.4. Samples: 38496096. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:23,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.360')] +[2023-10-08 18:47:24,182][21195] Updated weights for policy 0, policy_version 75460 (0.0008) +[2023-10-08 18:47:24,547][21195] Updated weights for policy 0, policy_version 75470 (0.0008) +[2023-10-08 18:47:24,648][21194] Updated weights for policy 1, policy_version 74890 (0.0007) +[2023-10-08 18:47:24,916][21195] Updated weights for policy 0, policy_version 75480 (0.0007) +[2023-10-08 18:47:25,018][21194] Updated weights for policy 1, policy_version 74900 (0.0008) +[2023-10-08 18:47:25,374][21194] Updated weights for policy 1, policy_version 74910 (0.0008) +[2023-10-08 18:47:28,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 154009600. Throughput: 0: 1738.9, 1: 1728.7. Samples: 38517528. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:28,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.360')] +[2023-10-08 18:47:28,868][21195] Updated weights for policy 0, policy_version 75490 (0.0009) +[2023-10-08 18:47:29,222][21195] Updated weights for policy 0, policy_version 75500 (0.0008) +[2023-10-08 18:47:29,284][21194] Updated weights for policy 1, policy_version 74920 (0.0007) +[2023-10-08 18:47:29,599][21195] Updated weights for policy 0, policy_version 75510 (0.0007) +[2023-10-08 18:47:29,653][21194] Updated weights for policy 1, policy_version 74930 (0.0008) +[2023-10-08 18:47:29,965][21195] Updated weights for policy 0, policy_version 75520 (0.0008) +[2023-10-08 18:47:30,014][21194] Updated weights for policy 1, policy_version 74940 (0.0007) +[2023-10-08 18:47:33,774][21195] Updated weights for policy 0, policy_version 75530 (0.0009) +[2023-10-08 18:47:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 154075136. Throughput: 0: 1736.3, 1: 1705.3. Samples: 38532592. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:33,804][19739] Avg episode reward: [(0, '539.780'), (1, '1070.360')] +[2023-10-08 18:47:34,010][21194] Updated weights for policy 1, policy_version 74950 (0.0009) +[2023-10-08 18:47:34,127][21195] Updated weights for policy 0, policy_version 75540 (0.0008) +[2023-10-08 18:47:34,374][21194] Updated weights for policy 1, policy_version 74960 (0.0008) +[2023-10-08 18:47:34,500][21195] Updated weights for policy 0, policy_version 75550 (0.0009) +[2023-10-08 18:47:34,744][21194] Updated weights for policy 1, policy_version 74970 (0.0008) +[2023-10-08 18:47:38,383][21195] Updated weights for policy 0, policy_version 75560 (0.0008) +[2023-10-08 18:47:38,541][21194] Updated weights for policy 1, policy_version 74980 (0.0007) +[2023-10-08 18:47:38,747][21195] Updated weights for policy 0, policy_version 75570 (0.0008) +[2023-10-08 18:47:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 154140672. Throughput: 0: 1742.2, 1: 1735.9. Samples: 38548528. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:38,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.360')] +[2023-10-08 18:47:38,902][21194] Updated weights for policy 1, policy_version 74990 (0.0008) +[2023-10-08 18:47:39,113][21195] Updated weights for policy 0, policy_version 75580 (0.0009) +[2023-10-08 18:47:39,267][21194] Updated weights for policy 1, policy_version 75000 (0.0007) +[2023-10-08 18:47:43,051][21195] Updated weights for policy 0, policy_version 75590 (0.0009) +[2023-10-08 18:47:43,271][21194] Updated weights for policy 1, policy_version 75010 (0.0010) +[2023-10-08 18:47:43,417][21195] Updated weights for policy 0, policy_version 75600 (0.0009) +[2023-10-08 18:47:43,637][21194] Updated weights for policy 1, policy_version 75020 (0.0009) +[2023-10-08 18:47:43,787][21195] Updated weights for policy 0, policy_version 75610 (0.0008) +[2023-10-08 18:47:43,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 154206208. Throughput: 0: 1743.2, 1: 1736.0. Samples: 38569950. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 18:47:43,803][19739] Avg episode reward: [(0, '539.780'), (1, '1085.310')] +[2023-10-08 18:47:43,994][21194] Updated weights for policy 1, policy_version 75030 (0.0008) +[2023-10-08 18:47:44,360][21194] Updated weights for policy 1, policy_version 75040 (0.0009) +[2023-10-08 18:47:47,709][21195] Updated weights for policy 0, policy_version 75620 (0.0007) +[2023-10-08 18:47:48,047][21194] Updated weights for policy 1, policy_version 75050 (0.0008) +[2023-10-08 18:47:48,076][21195] Updated weights for policy 0, policy_version 75630 (0.0007) +[2023-10-08 18:47:48,414][21194] Updated weights for policy 1, policy_version 75060 (0.0007) +[2023-10-08 18:47:48,457][21195] Updated weights for policy 0, policy_version 75640 (0.0009) +[2023-10-08 18:47:48,779][21194] Updated weights for policy 1, policy_version 75070 (0.0007) +[2023-10-08 18:47:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 154304512. Throughput: 0: 1715.6, 1: 1723.6. Samples: 38584092. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:47:48,803][19739] Avg episode reward: [(0, '539.780'), (1, '1085.500')] +[2023-10-08 18:47:52,395][21195] Updated weights for policy 0, policy_version 75650 (0.0007) +[2023-10-08 18:47:52,766][21195] Updated weights for policy 0, policy_version 75660 (0.0008) +[2023-10-08 18:47:52,830][21194] Updated weights for policy 1, policy_version 75080 (0.0008) +[2023-10-08 18:47:53,128][21195] Updated weights for policy 0, policy_version 75670 (0.0009) +[2023-10-08 18:47:53,196][21194] Updated weights for policy 1, policy_version 75090 (0.0008) +[2023-10-08 18:47:53,496][21195] Updated weights for policy 0, policy_version 75680 (0.0007) +[2023-10-08 18:47:53,568][21194] Updated weights for policy 1, policy_version 75100 (0.0007) +[2023-10-08 18:47:53,802][19739] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 154402816. Throughput: 0: 1747.5, 1: 1731.1. Samples: 38600716. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:47:53,803][19739] Avg episode reward: [(0, '539.780'), (1, '1085.500')] +[2023-10-08 18:47:57,433][21195] Updated weights for policy 0, policy_version 75690 (0.0009) +[2023-10-08 18:47:57,570][21194] Updated weights for policy 1, policy_version 75110 (0.0008) +[2023-10-08 18:47:57,798][21195] Updated weights for policy 0, policy_version 75700 (0.0009) +[2023-10-08 18:47:57,934][21194] Updated weights for policy 1, policy_version 75120 (0.0007) +[2023-10-08 18:47:58,163][21195] Updated weights for policy 0, policy_version 75710 (0.0007) +[2023-10-08 18:47:58,302][21194] Updated weights for policy 1, policy_version 75130 (0.0007) +[2023-10-08 18:47:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 154468352. Throughput: 0: 1732.3, 1: 1714.1. Samples: 38620396. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:47:58,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.640')] +[2023-10-08 18:48:02,053][21194] Updated weights for policy 1, policy_version 75140 (0.0007) +[2023-10-08 18:48:02,059][21195] Updated weights for policy 0, policy_version 75720 (0.0008) +[2023-10-08 18:48:02,412][21194] Updated weights for policy 1, policy_version 75150 (0.0007) +[2023-10-08 18:48:02,428][21195] Updated weights for policy 0, policy_version 75730 (0.0007) +[2023-10-08 18:48:02,780][21194] Updated weights for policy 1, policy_version 75160 (0.0007) +[2023-10-08 18:48:02,790][21195] Updated weights for policy 0, policy_version 75740 (0.0007) +[2023-10-08 18:48:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 154533888. Throughput: 0: 1718.1, 1: 1732.8. Samples: 38636126. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:03,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.350')] +[2023-10-08 18:48:06,616][21195] Updated weights for policy 0, policy_version 75750 (0.0008) +[2023-10-08 18:48:06,943][21194] Updated weights for policy 1, policy_version 75170 (0.0007) +[2023-10-08 18:48:06,985][21195] Updated weights for policy 0, policy_version 75760 (0.0009) +[2023-10-08 18:48:07,311][21194] Updated weights for policy 1, policy_version 75180 (0.0008) +[2023-10-08 18:48:07,361][21195] Updated weights for policy 0, policy_version 75770 (0.0008) +[2023-10-08 18:48:07,671][21194] Updated weights for policy 1, policy_version 75190 (0.0008) +[2023-10-08 18:48:08,036][21194] Updated weights for policy 1, policy_version 75200 (0.0007) +[2023-10-08 18:48:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 154599424. Throughput: 0: 1740.6, 1: 1729.6. Samples: 38652258. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:08,803][19739] Avg episode reward: [(0, '539.780'), (1, '1070.350')] +[2023-10-08 18:48:11,449][21195] Updated weights for policy 0, policy_version 75780 (0.0007) +[2023-10-08 18:48:11,821][21195] Updated weights for policy 0, policy_version 75790 (0.0007) +[2023-10-08 18:48:12,196][21195] Updated weights for policy 0, policy_version 75800 (0.0009) +[2023-10-08 18:48:12,205][21194] Updated weights for policy 1, policy_version 75210 (0.0008) +[2023-10-08 18:48:12,572][21194] Updated weights for policy 1, policy_version 75220 (0.0008) +[2023-10-08 18:48:12,932][21194] Updated weights for policy 1, policy_version 75230 (0.0008) +[2023-10-08 18:48:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 154664960. Throughput: 0: 1717.7, 1: 1698.2. Samples: 38671242. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:13,804][19739] Avg episode reward: [(0, '539.780'), (1, '1040.330')] +[2023-10-08 18:48:16,131][21195] Updated weights for policy 0, policy_version 75810 (0.0010) +[2023-10-08 18:48:16,504][21195] Updated weights for policy 0, policy_version 75820 (0.0010) +[2023-10-08 18:48:16,743][21194] Updated weights for policy 1, policy_version 75240 (0.0007) +[2023-10-08 18:48:16,867][21195] Updated weights for policy 0, policy_version 75830 (0.0011) +[2023-10-08 18:48:17,115][21194] Updated weights for policy 1, policy_version 75250 (0.0007) +[2023-10-08 18:48:17,230][21195] Updated weights for policy 0, policy_version 75840 (0.0008) +[2023-10-08 18:48:17,481][21194] Updated weights for policy 1, policy_version 75260 (0.0008) +[2023-10-08 18:48:18,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 154730496. Throughput: 0: 1726.1, 1: 1724.7. Samples: 38687878. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:18,804][19739] Avg episode reward: [(0, '539.780'), (1, '1040.370')] +[2023-10-08 18:48:21,078][21195] Updated weights for policy 0, policy_version 75850 (0.0010) +[2023-10-08 18:48:21,436][21195] Updated weights for policy 0, policy_version 75860 (0.0010) +[2023-10-08 18:48:21,600][21194] Updated weights for policy 1, policy_version 75270 (0.0008) +[2023-10-08 18:48:21,800][21195] Updated weights for policy 0, policy_version 75870 (0.0008) +[2023-10-08 18:48:21,963][21194] Updated weights for policy 1, policy_version 75280 (0.0009) +[2023-10-08 18:48:22,328][21194] Updated weights for policy 1, policy_version 75290 (0.0009) +[2023-10-08 18:48:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 154796032. Throughput: 0: 1719.6, 1: 1706.3. Samples: 38702694. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:23,804][19739] Avg episode reward: [(0, '539.780'), (1, '1040.370')] +[2023-10-08 18:48:25,792][21195] Updated weights for policy 0, policy_version 75880 (0.0007) +[2023-10-08 18:48:26,164][21195] Updated weights for policy 0, policy_version 75890 (0.0007) +[2023-10-08 18:48:26,412][21194] Updated weights for policy 1, policy_version 75300 (0.0009) +[2023-10-08 18:48:26,528][21195] Updated weights for policy 0, policy_version 75900 (0.0007) +[2023-10-08 18:48:26,787][21194] Updated weights for policy 1, policy_version 75310 (0.0008) +[2023-10-08 18:48:27,149][21194] Updated weights for policy 1, policy_version 75320 (0.0007) +[2023-10-08 18:48:28,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 154861568. Throughput: 0: 1718.6, 1: 1688.7. Samples: 38723276. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:28,803][19739] Avg episode reward: [(0, '539.780'), (1, '1007.460')] +[2023-10-08 18:48:30,433][21195] Updated weights for policy 0, policy_version 75910 (0.0009) +[2023-10-08 18:48:30,804][21195] Updated weights for policy 0, policy_version 75920 (0.0008) +[2023-10-08 18:48:31,065][21194] Updated weights for policy 1, policy_version 75330 (0.0009) +[2023-10-08 18:48:31,170][21195] Updated weights for policy 0, policy_version 75930 (0.0008) +[2023-10-08 18:48:31,434][21194] Updated weights for policy 1, policy_version 75340 (0.0007) +[2023-10-08 18:48:31,808][21194] Updated weights for policy 1, policy_version 75350 (0.0009) +[2023-10-08 18:48:32,176][21194] Updated weights for policy 1, policy_version 75360 (0.0009) +[2023-10-08 18:48:33,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 154927104. Throughput: 0: 1747.2, 1: 1715.7. Samples: 38739922. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 18:48:33,803][19739] Avg episode reward: [(0, '555.190'), (1, '992.760')] +[2023-10-08 18:48:35,010][21195] Updated weights for policy 0, policy_version 75940 (0.0008) +[2023-10-08 18:48:35,381][21195] Updated weights for policy 0, policy_version 75950 (0.0007) +[2023-10-08 18:48:35,741][21195] Updated weights for policy 0, policy_version 75960 (0.0009) +[2023-10-08 18:48:36,170][21194] Updated weights for policy 1, policy_version 75370 (0.0008) +[2023-10-08 18:48:36,534][21194] Updated weights for policy 1, policy_version 75380 (0.0010) +[2023-10-08 18:48:36,897][21194] Updated weights for policy 1, policy_version 75390 (0.0009) +[2023-10-08 18:48:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 154992640. Throughput: 0: 1721.2, 1: 1686.9. Samples: 38754078. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:48:38,803][19739] Avg episode reward: [(0, '493.960'), (1, '992.760')] +[2023-10-08 18:48:39,491][21195] Updated weights for policy 0, policy_version 75970 (0.0008) +[2023-10-08 18:48:39,845][21195] Updated weights for policy 0, policy_version 75980 (0.0010) +[2023-10-08 18:48:40,222][21195] Updated weights for policy 0, policy_version 75990 (0.0009) +[2023-10-08 18:48:40,585][21195] Updated weights for policy 0, policy_version 76000 (0.0008) +[2023-10-08 18:48:40,939][21194] Updated weights for policy 1, policy_version 75400 (0.0010) +[2023-10-08 18:48:41,296][21194] Updated weights for policy 1, policy_version 75410 (0.0011) +[2023-10-08 18:48:41,662][21194] Updated weights for policy 1, policy_version 75420 (0.0007) +[2023-10-08 18:48:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 155058176. Throughput: 0: 1743.0, 1: 1708.3. Samples: 38775706. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:48:43,804][19739] Avg episode reward: [(0, '493.960'), (1, '992.520')] +[2023-10-08 18:48:44,686][21195] Updated weights for policy 0, policy_version 76010 (0.0009) +[2023-10-08 18:48:45,046][21195] Updated weights for policy 0, policy_version 76020 (0.0009) +[2023-10-08 18:48:45,425][21195] Updated weights for policy 0, policy_version 76030 (0.0009) +[2023-10-08 18:48:45,489][21194] Updated weights for policy 1, policy_version 75430 (0.0008) +[2023-10-08 18:48:45,845][21194] Updated weights for policy 1, policy_version 75440 (0.0007) +[2023-10-08 18:48:46,223][21194] Updated weights for policy 1, policy_version 75450 (0.0011) +[2023-10-08 18:48:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 155123712. Throughput: 0: 1755.7, 1: 1705.0. Samples: 38791856. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:48:48,803][19739] Avg episode reward: [(0, '493.960'), (1, '992.520')] +[2023-10-08 18:48:49,210][21195] Updated weights for policy 0, policy_version 76040 (0.0009) +[2023-10-08 18:48:49,576][21195] Updated weights for policy 0, policy_version 76050 (0.0011) +[2023-10-08 18:48:49,953][21195] Updated weights for policy 0, policy_version 76060 (0.0010) +[2023-10-08 18:48:50,106][21194] Updated weights for policy 1, policy_version 75460 (0.0009) +[2023-10-08 18:48:50,476][21194] Updated weights for policy 1, policy_version 75470 (0.0010) +[2023-10-08 18:48:50,841][21194] Updated weights for policy 1, policy_version 75480 (0.0010) +[2023-10-08 18:48:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 155189248. Throughput: 0: 1729.0, 1: 1696.8. Samples: 38806418. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:48:53,804][19739] Avg episode reward: [(0, '493.960'), (1, '964.030')] +[2023-10-08 18:48:53,885][21195] Updated weights for policy 0, policy_version 76070 (0.0008) +[2023-10-08 18:48:54,265][21195] Updated weights for policy 0, policy_version 76080 (0.0010) +[2023-10-08 18:48:54,632][21195] Updated weights for policy 0, policy_version 76090 (0.0008) +[2023-10-08 18:48:54,767][21194] Updated weights for policy 1, policy_version 75490 (0.0010) +[2023-10-08 18:48:55,130][21194] Updated weights for policy 1, policy_version 75500 (0.0007) +[2023-10-08 18:48:55,493][21194] Updated weights for policy 1, policy_version 75510 (0.0009) +[2023-10-08 18:48:55,855][21194] Updated weights for policy 1, policy_version 75520 (0.0011) +[2023-10-08 18:48:58,659][21195] Updated weights for policy 0, policy_version 76100 (0.0010) +[2023-10-08 18:48:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 155254784. Throughput: 0: 1753.0, 1: 1739.3. Samples: 38828396. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:48:58,803][19739] Avg episode reward: [(0, '474.040'), (1, '978.910')] +[2023-10-08 18:48:59,017][21195] Updated weights for policy 0, policy_version 76110 (0.0007) +[2023-10-08 18:48:59,386][21195] Updated weights for policy 0, policy_version 76120 (0.0007) +[2023-10-08 18:48:59,742][21194] Updated weights for policy 1, policy_version 75530 (0.0008) +[2023-10-08 18:49:00,101][21194] Updated weights for policy 1, policy_version 75540 (0.0008) +[2023-10-08 18:49:00,474][21194] Updated weights for policy 1, policy_version 75550 (0.0008) +[2023-10-08 18:49:03,269][21195] Updated weights for policy 0, policy_version 76130 (0.0009) +[2023-10-08 18:49:03,637][21195] Updated weights for policy 0, policy_version 76140 (0.0007) +[2023-10-08 18:49:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 155320320. Throughput: 0: 1736.7, 1: 1709.1. Samples: 38842938. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:49:03,804][19739] Avg episode reward: [(0, '474.110'), (1, '978.860')] +[2023-10-08 18:49:04,007][21195] Updated weights for policy 0, policy_version 76150 (0.0007) +[2023-10-08 18:49:04,373][21195] Updated weights for policy 0, policy_version 76160 (0.0007) +[2023-10-08 18:49:04,407][21194] Updated weights for policy 1, policy_version 75560 (0.0009) +[2023-10-08 18:49:04,776][21194] Updated weights for policy 1, policy_version 75570 (0.0008) +[2023-10-08 18:49:05,143][21194] Updated weights for policy 1, policy_version 75580 (0.0010) +[2023-10-08 18:49:08,317][21195] Updated weights for policy 0, policy_version 76170 (0.0010) +[2023-10-08 18:49:08,694][21195] Updated weights for policy 0, policy_version 76180 (0.0010) +[2023-10-08 18:49:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 155385856. Throughput: 0: 1751.9, 1: 1726.9. Samples: 38859238. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:49:08,803][19739] Avg episode reward: [(0, '462.380'), (1, '978.860')] +[2023-10-08 18:49:08,994][21194] Updated weights for policy 1, policy_version 75590 (0.0008) +[2023-10-08 18:49:09,059][21195] Updated weights for policy 0, policy_version 76190 (0.0008) +[2023-10-08 18:49:09,358][21194] Updated weights for policy 1, policy_version 75600 (0.0008) +[2023-10-08 18:49:09,733][21194] Updated weights for policy 1, policy_version 75610 (0.0010) +[2023-10-08 18:49:12,939][21195] Updated weights for policy 0, policy_version 76200 (0.0008) +[2023-10-08 18:49:13,314][21195] Updated weights for policy 0, policy_version 76210 (0.0009) +[2023-10-08 18:49:13,687][21195] Updated weights for policy 0, policy_version 76220 (0.0009) +[2023-10-08 18:49:13,707][21194] Updated weights for policy 1, policy_version 75620 (0.0008) +[2023-10-08 18:49:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 155451392. Throughput: 0: 1751.0, 1: 1745.2. Samples: 38880602. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:49:13,803][19739] Avg episode reward: [(0, '447.050'), (1, '966.250')] +[2023-10-08 18:49:13,825][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000076224_78053376.pth... +[2023-10-08 18:49:13,854][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000074592_76382208.pth +[2023-10-08 18:49:14,067][21194] Updated weights for policy 1, policy_version 75630 (0.0009) +[2023-10-08 18:49:14,438][21194] Updated weights for policy 1, policy_version 75640 (0.0009) +[2023-10-08 18:49:14,721][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000075648_77463552.pth... +[2023-10-08 18:49:14,750][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000074016_75792384.pth +[2023-10-08 18:49:17,388][21195] Updated weights for policy 0, policy_version 76230 (0.0010) +[2023-10-08 18:49:17,762][21195] Updated weights for policy 0, policy_version 76240 (0.0007) +[2023-10-08 18:49:18,125][21195] Updated weights for policy 0, policy_version 76250 (0.0010) +[2023-10-08 18:49:18,466][21194] Updated weights for policy 1, policy_version 75650 (0.0008) +[2023-10-08 18:49:18,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 155549696. Throughput: 0: 1729.6, 1: 1713.3. Samples: 38894856. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:49:18,803][19739] Avg episode reward: [(0, '447.050'), (1, '966.250')] +[2023-10-08 18:49:18,845][21194] Updated weights for policy 1, policy_version 75660 (0.0008) +[2023-10-08 18:49:19,203][21194] Updated weights for policy 1, policy_version 75670 (0.0009) +[2023-10-08 18:49:19,571][21194] Updated weights for policy 1, policy_version 75680 (0.0010) +[2023-10-08 18:49:22,018][21195] Updated weights for policy 0, policy_version 76260 (0.0009) +[2023-10-08 18:49:22,385][21195] Updated weights for policy 0, policy_version 76270 (0.0007) +[2023-10-08 18:49:22,747][21195] Updated weights for policy 0, policy_version 76280 (0.0007) +[2023-10-08 18:49:23,674][21194] Updated weights for policy 1, policy_version 75690 (0.0008) +[2023-10-08 18:49:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 155615232. Throughput: 0: 1755.6, 1: 1739.3. Samples: 38911352. Policy #0 lag: (min: 24.0, avg: 52.7, max: 56.0) +[2023-10-08 18:49:23,803][19739] Avg episode reward: [(0, '447.050'), (1, '966.250')] +[2023-10-08 18:49:24,034][21194] Updated weights for policy 1, policy_version 75700 (0.0007) +[2023-10-08 18:49:24,401][21194] Updated weights for policy 1, policy_version 75710 (0.0009) +[2023-10-08 18:49:26,713][21195] Updated weights for policy 0, policy_version 76290 (0.0007) +[2023-10-08 18:49:27,086][21195] Updated weights for policy 0, policy_version 76300 (0.0009) +[2023-10-08 18:49:27,461][21195] Updated weights for policy 0, policy_version 76310 (0.0008) +[2023-10-08 18:49:27,835][21195] Updated weights for policy 0, policy_version 76320 (0.0007) +[2023-10-08 18:49:28,272][21194] Updated weights for policy 1, policy_version 75720 (0.0009) +[2023-10-08 18:49:28,641][21194] Updated weights for policy 1, policy_version 75730 (0.0009) +[2023-10-08 18:49:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 155680768. Throughput: 0: 1726.6, 1: 1739.0. Samples: 38931656. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:28,803][19739] Avg episode reward: [(0, '447.050'), (1, '954.110')] +[2023-10-08 18:49:28,998][21194] Updated weights for policy 1, policy_version 75740 (0.0010) +[2023-10-08 18:49:31,848][21195] Updated weights for policy 0, policy_version 76330 (0.0008) +[2023-10-08 18:49:32,210][21195] Updated weights for policy 0, policy_version 76340 (0.0008) +[2023-10-08 18:49:32,579][21195] Updated weights for policy 0, policy_version 76350 (0.0008) +[2023-10-08 18:49:32,831][21194] Updated weights for policy 1, policy_version 75750 (0.0009) +[2023-10-08 18:49:33,196][21194] Updated weights for policy 1, policy_version 75760 (0.0009) +[2023-10-08 18:49:33,558][21194] Updated weights for policy 1, policy_version 75770 (0.0010) +[2023-10-08 18:49:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 155779072. Throughput: 0: 1727.3, 1: 1724.3. Samples: 38947176. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:33,803][19739] Avg episode reward: [(0, '447.050'), (1, '954.220')] +[2023-10-08 18:49:36,363][21195] Updated weights for policy 0, policy_version 76360 (0.0008) +[2023-10-08 18:49:36,730][21195] Updated weights for policy 0, policy_version 76370 (0.0010) +[2023-10-08 18:49:37,107][21195] Updated weights for policy 0, policy_version 76380 (0.0009) +[2023-10-08 18:49:37,601][21194] Updated weights for policy 1, policy_version 75780 (0.0010) +[2023-10-08 18:49:37,983][21194] Updated weights for policy 1, policy_version 75790 (0.0008) +[2023-10-08 18:49:38,343][21194] Updated weights for policy 1, policy_version 75800 (0.0009) +[2023-10-08 18:49:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 155844608. Throughput: 0: 1740.5, 1: 1736.7. Samples: 38962892. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:38,803][19739] Avg episode reward: [(0, '447.050'), (1, '905.250')] +[2023-10-08 18:49:40,911][21195] Updated weights for policy 0, policy_version 76390 (0.0010) +[2023-10-08 18:49:41,277][21195] Updated weights for policy 0, policy_version 76400 (0.0010) +[2023-10-08 18:49:41,643][21195] Updated weights for policy 0, policy_version 76410 (0.0010) +[2023-10-08 18:49:42,315][21194] Updated weights for policy 1, policy_version 75810 (0.0009) +[2023-10-08 18:49:42,678][21194] Updated weights for policy 1, policy_version 75820 (0.0010) +[2023-10-08 18:49:43,050][21194] Updated weights for policy 1, policy_version 75830 (0.0009) +[2023-10-08 18:49:43,412][21194] Updated weights for policy 1, policy_version 75840 (0.0007) +[2023-10-08 18:49:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 155910144. Throughput: 0: 1726.2, 1: 1710.4. Samples: 38983046. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:43,803][19739] Avg episode reward: [(0, '447.050'), (1, '874.590')] +[2023-10-08 18:49:45,590][21195] Updated weights for policy 0, policy_version 76420 (0.0008) +[2023-10-08 18:49:45,964][21195] Updated weights for policy 0, policy_version 76430 (0.0009) +[2023-10-08 18:49:46,331][21195] Updated weights for policy 0, policy_version 76440 (0.0007) +[2023-10-08 18:49:47,236][21194] Updated weights for policy 1, policy_version 75850 (0.0009) +[2023-10-08 18:49:47,602][21194] Updated weights for policy 1, policy_version 75860 (0.0008) +[2023-10-08 18:49:47,967][21194] Updated weights for policy 1, policy_version 75870 (0.0008) +[2023-10-08 18:49:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 155975680. Throughput: 0: 1738.7, 1: 1735.7. Samples: 38999282. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:48,803][19739] Avg episode reward: [(0, '447.050'), (1, '866.660')] +[2023-10-08 18:49:50,342][21195] Updated weights for policy 0, policy_version 76450 (0.0009) +[2023-10-08 18:49:50,709][21195] Updated weights for policy 0, policy_version 76460 (0.0008) +[2023-10-08 18:49:51,073][21195] Updated weights for policy 0, policy_version 76470 (0.0009) +[2023-10-08 18:49:51,440][21195] Updated weights for policy 0, policy_version 76480 (0.0009) +[2023-10-08 18:49:52,045][21194] Updated weights for policy 1, policy_version 75880 (0.0008) +[2023-10-08 18:49:52,418][21194] Updated weights for policy 1, policy_version 75890 (0.0007) +[2023-10-08 18:49:52,779][21194] Updated weights for policy 1, policy_version 75900 (0.0007) +[2023-10-08 18:49:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 156041216. Throughput: 0: 1717.7, 1: 1721.3. Samples: 39013996. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:53,803][19739] Avg episode reward: [(0, '458.930'), (1, '852.390')] +[2023-10-08 18:49:55,282][21195] Updated weights for policy 0, policy_version 76490 (0.0008) +[2023-10-08 18:49:55,652][21195] Updated weights for policy 0, policy_version 76500 (0.0008) +[2023-10-08 18:49:56,009][21195] Updated weights for policy 0, policy_version 76510 (0.0007) +[2023-10-08 18:49:56,717][21194] Updated weights for policy 1, policy_version 75910 (0.0010) +[2023-10-08 18:49:57,079][21194] Updated weights for policy 1, policy_version 75920 (0.0008) +[2023-10-08 18:49:57,446][21194] Updated weights for policy 1, policy_version 75930 (0.0009) +[2023-10-08 18:49:58,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 156106752. Throughput: 0: 1719.0, 1: 1698.4. Samples: 39034386. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:49:58,804][19739] Avg episode reward: [(0, '459.050'), (1, '852.390')] +[2023-10-08 18:49:59,828][21195] Updated weights for policy 0, policy_version 76520 (0.0009) +[2023-10-08 18:50:00,204][21195] Updated weights for policy 0, policy_version 76530 (0.0009) +[2023-10-08 18:50:00,576][21195] Updated weights for policy 0, policy_version 76540 (0.0009) +[2023-10-08 18:50:01,268][21194] Updated weights for policy 1, policy_version 75940 (0.0010) +[2023-10-08 18:50:01,632][21194] Updated weights for policy 1, policy_version 75950 (0.0009) +[2023-10-08 18:50:02,006][21194] Updated weights for policy 1, policy_version 75960 (0.0007) +[2023-10-08 18:50:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 156172288. Throughput: 0: 1739.2, 1: 1736.0. Samples: 39051240. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:50:03,804][19739] Avg episode reward: [(0, '458.500'), (1, '852.390')] +[2023-10-08 18:50:04,627][21195] Updated weights for policy 0, policy_version 76550 (0.0009) +[2023-10-08 18:50:04,994][21195] Updated weights for policy 0, policy_version 76560 (0.0011) +[2023-10-08 18:50:05,361][21195] Updated weights for policy 0, policy_version 76570 (0.0011) +[2023-10-08 18:50:06,179][21194] Updated weights for policy 1, policy_version 75970 (0.0008) +[2023-10-08 18:50:06,535][21194] Updated weights for policy 1, policy_version 75980 (0.0009) +[2023-10-08 18:50:06,895][21194] Updated weights for policy 1, policy_version 75990 (0.0008) +[2023-10-08 18:50:07,268][21194] Updated weights for policy 1, policy_version 76000 (0.0010) +[2023-10-08 18:50:08,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 156237824. Throughput: 0: 1710.1, 1: 1716.0. Samples: 39065524. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:50:08,803][19739] Avg episode reward: [(0, '458.660'), (1, '841.740')] +[2023-10-08 18:50:09,256][21195] Updated weights for policy 0, policy_version 76580 (0.0009) +[2023-10-08 18:50:09,619][21195] Updated weights for policy 0, policy_version 76590 (0.0007) +[2023-10-08 18:50:09,984][21195] Updated weights for policy 0, policy_version 76600 (0.0009) +[2023-10-08 18:50:11,085][21194] Updated weights for policy 1, policy_version 76010 (0.0010) +[2023-10-08 18:50:11,461][21194] Updated weights for policy 1, policy_version 76020 (0.0007) +[2023-10-08 18:50:11,828][21194] Updated weights for policy 1, policy_version 76030 (0.0007) +[2023-10-08 18:50:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 156303360. Throughput: 0: 1736.0, 1: 1710.5. Samples: 39086752. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:50:13,803][19739] Avg episode reward: [(0, '474.360'), (1, '841.740')] +[2023-10-08 18:50:13,991][21195] Updated weights for policy 0, policy_version 76610 (0.0007) +[2023-10-08 18:50:14,353][21195] Updated weights for policy 0, policy_version 76620 (0.0009) +[2023-10-08 18:50:14,726][21195] Updated weights for policy 0, policy_version 76630 (0.0008) +[2023-10-08 18:50:15,095][21195] Updated weights for policy 0, policy_version 76640 (0.0009) +[2023-10-08 18:50:15,634][21194] Updated weights for policy 1, policy_version 76040 (0.0007) +[2023-10-08 18:50:15,997][21194] Updated weights for policy 1, policy_version 76050 (0.0007) +[2023-10-08 18:50:16,362][21194] Updated weights for policy 1, policy_version 76060 (0.0009) +[2023-10-08 18:50:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 156368896. Throughput: 0: 1730.4, 1: 1727.6. Samples: 39102788. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 18:50:18,803][19739] Avg episode reward: [(0, '474.680'), (1, '841.740')] +[2023-10-08 18:50:19,092][21195] Updated weights for policy 0, policy_version 76650 (0.0007) +[2023-10-08 18:50:19,464][21195] Updated weights for policy 0, policy_version 76660 (0.0007) +[2023-10-08 18:50:19,824][21195] Updated weights for policy 0, policy_version 76670 (0.0007) +[2023-10-08 18:50:20,312][21194] Updated weights for policy 1, policy_version 76070 (0.0008) +[2023-10-08 18:50:20,681][21194] Updated weights for policy 1, policy_version 76080 (0.0009) +[2023-10-08 18:50:21,052][21194] Updated weights for policy 1, policy_version 76090 (0.0008) +[2023-10-08 18:50:23,605][21195] Updated weights for policy 0, policy_version 76680 (0.0010) +[2023-10-08 18:50:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 156434432. Throughput: 0: 1726.7, 1: 1716.9. Samples: 39117852. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:23,803][19739] Avg episode reward: [(0, '474.680'), (1, '841.740')] +[2023-10-08 18:50:23,962][21195] Updated weights for policy 0, policy_version 76690 (0.0008) +[2023-10-08 18:50:24,332][21195] Updated weights for policy 0, policy_version 76700 (0.0009) +[2023-10-08 18:50:25,076][21194] Updated weights for policy 1, policy_version 76100 (0.0008) +[2023-10-08 18:50:25,437][21194] Updated weights for policy 1, policy_version 76110 (0.0009) +[2023-10-08 18:50:25,797][21194] Updated weights for policy 1, policy_version 76120 (0.0010) +[2023-10-08 18:50:28,312][21195] Updated weights for policy 0, policy_version 76710 (0.0009) +[2023-10-08 18:50:28,682][21195] Updated weights for policy 0, policy_version 76720 (0.0009) +[2023-10-08 18:50:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 156499968. Throughput: 0: 1740.5, 1: 1733.6. Samples: 39139380. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:28,803][19739] Avg episode reward: [(0, '474.680'), (1, '841.740')] +[2023-10-08 18:50:29,042][21195] Updated weights for policy 0, policy_version 76730 (0.0009) +[2023-10-08 18:50:29,760][21194] Updated weights for policy 1, policy_version 76130 (0.0008) +[2023-10-08 18:50:30,130][21194] Updated weights for policy 1, policy_version 76140 (0.0010) +[2023-10-08 18:50:30,501][21194] Updated weights for policy 1, policy_version 76150 (0.0011) +[2023-10-08 18:50:30,863][21194] Updated weights for policy 1, policy_version 76160 (0.0010) +[2023-10-08 18:50:32,989][21195] Updated weights for policy 0, policy_version 76740 (0.0011) +[2023-10-08 18:50:33,360][21195] Updated weights for policy 0, policy_version 76750 (0.0010) +[2023-10-08 18:50:33,730][21195] Updated weights for policy 0, policy_version 76760 (0.0008) +[2023-10-08 18:50:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 156565504. Throughput: 0: 1720.7, 1: 1714.9. Samples: 39153882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:33,803][19739] Avg episode reward: [(0, '460.000'), (1, '841.680')] +[2023-10-08 18:50:34,850][21194] Updated weights for policy 1, policy_version 76170 (0.0011) +[2023-10-08 18:50:35,221][21194] Updated weights for policy 1, policy_version 76180 (0.0010) +[2023-10-08 18:50:35,580][21194] Updated weights for policy 1, policy_version 76190 (0.0010) +[2023-10-08 18:50:37,582][21195] Updated weights for policy 0, policy_version 76770 (0.0009) +[2023-10-08 18:50:37,960][21195] Updated weights for policy 0, policy_version 76780 (0.0010) +[2023-10-08 18:50:38,317][21195] Updated weights for policy 0, policy_version 76790 (0.0009) +[2023-10-08 18:50:38,686][21195] Updated weights for policy 0, policy_version 76800 (0.0010) +[2023-10-08 18:50:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 156663808. Throughput: 0: 1748.8, 1: 1723.2. Samples: 39170232. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:38,803][19739] Avg episode reward: [(0, '460.000'), (1, '825.890')] +[2023-10-08 18:50:39,543][21194] Updated weights for policy 1, policy_version 76200 (0.0010) +[2023-10-08 18:50:39,907][21194] Updated weights for policy 1, policy_version 76210 (0.0010) +[2023-10-08 18:50:40,261][21194] Updated weights for policy 1, policy_version 76220 (0.0010) +[2023-10-08 18:50:42,755][21195] Updated weights for policy 0, policy_version 76810 (0.0012) +[2023-10-08 18:50:43,123][21195] Updated weights for policy 0, policy_version 76820 (0.0010) +[2023-10-08 18:50:43,495][21195] Updated weights for policy 0, policy_version 76830 (0.0008) +[2023-10-08 18:50:43,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 156729344. Throughput: 0: 1739.3, 1: 1746.8. Samples: 39191260. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:43,804][19739] Avg episode reward: [(0, '440.010'), (1, '825.890')] +[2023-10-08 18:50:44,024][21194] Updated weights for policy 1, policy_version 76230 (0.0008) +[2023-10-08 18:50:44,384][21194] Updated weights for policy 1, policy_version 76240 (0.0008) +[2023-10-08 18:50:44,749][21194] Updated weights for policy 1, policy_version 76250 (0.0007) +[2023-10-08 18:50:47,461][21195] Updated weights for policy 0, policy_version 76840 (0.0008) +[2023-10-08 18:50:47,818][21195] Updated weights for policy 0, policy_version 76850 (0.0007) +[2023-10-08 18:50:48,187][21195] Updated weights for policy 0, policy_version 76860 (0.0009) +[2023-10-08 18:50:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 156794880. Throughput: 0: 1720.5, 1: 1714.6. Samples: 39205820. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:48,803][19739] Avg episode reward: [(0, '440.010'), (1, '825.890')] +[2023-10-08 18:50:48,809][21194] Updated weights for policy 1, policy_version 76260 (0.0007) +[2023-10-08 18:50:49,167][21194] Updated weights for policy 1, policy_version 76270 (0.0009) +[2023-10-08 18:50:49,540][21194] Updated weights for policy 1, policy_version 76280 (0.0007) +[2023-10-08 18:50:52,135][21195] Updated weights for policy 0, policy_version 76870 (0.0010) +[2023-10-08 18:50:52,499][21195] Updated weights for policy 0, policy_version 76880 (0.0007) +[2023-10-08 18:50:52,868][21195] Updated weights for policy 0, policy_version 76890 (0.0008) +[2023-10-08 18:50:53,505][21194] Updated weights for policy 1, policy_version 76290 (0.0007) +[2023-10-08 18:50:53,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 156860416. Throughput: 0: 1750.2, 1: 1738.0. Samples: 39222494. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:53,804][19739] Avg episode reward: [(0, '463.470'), (1, '825.890')] +[2023-10-08 18:50:53,871][21194] Updated weights for policy 1, policy_version 76300 (0.0007) +[2023-10-08 18:50:54,242][21194] Updated weights for policy 1, policy_version 76310 (0.0009) +[2023-10-08 18:50:54,603][21194] Updated weights for policy 1, policy_version 76320 (0.0008) +[2023-10-08 18:50:56,761][21195] Updated weights for policy 0, policy_version 76900 (0.0008) +[2023-10-08 18:50:57,136][21195] Updated weights for policy 0, policy_version 76910 (0.0008) +[2023-10-08 18:50:57,509][21195] Updated weights for policy 0, policy_version 76920 (0.0008) +[2023-10-08 18:50:58,599][21194] Updated weights for policy 1, policy_version 76330 (0.0007) +[2023-10-08 18:50:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 156925952. Throughput: 0: 1722.4, 1: 1740.9. Samples: 39242600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:50:58,803][19739] Avg episode reward: [(0, '463.730'), (1, '825.890')] +[2023-10-08 18:50:58,972][21194] Updated weights for policy 1, policy_version 76340 (0.0010) +[2023-10-08 18:50:59,340][21194] Updated weights for policy 1, policy_version 76350 (0.0008) +[2023-10-08 18:51:01,481][21195] Updated weights for policy 0, policy_version 76930 (0.0010) +[2023-10-08 18:51:01,851][21195] Updated weights for policy 0, policy_version 76940 (0.0008) +[2023-10-08 18:51:02,218][21195] Updated weights for policy 0, policy_version 76950 (0.0008) +[2023-10-08 18:51:02,588][21195] Updated weights for policy 0, policy_version 76960 (0.0007) +[2023-10-08 18:51:03,164][21194] Updated weights for policy 1, policy_version 76360 (0.0008) +[2023-10-08 18:51:03,533][21194] Updated weights for policy 1, policy_version 76370 (0.0008) +[2023-10-08 18:51:03,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 156991488. Throughput: 0: 1725.5, 1: 1723.1. Samples: 39257972. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:03,803][19739] Avg episode reward: [(0, '463.730'), (1, '826.590')] +[2023-10-08 18:51:03,893][21194] Updated weights for policy 1, policy_version 76380 (0.0008) +[2023-10-08 18:51:06,465][21195] Updated weights for policy 0, policy_version 76970 (0.0009) +[2023-10-08 18:51:06,835][21195] Updated weights for policy 0, policy_version 76980 (0.0009) +[2023-10-08 18:51:07,202][21195] Updated weights for policy 0, policy_version 76990 (0.0008) +[2023-10-08 18:51:07,826][21194] Updated weights for policy 1, policy_version 76390 (0.0009) +[2023-10-08 18:51:08,191][21194] Updated weights for policy 1, policy_version 76400 (0.0007) +[2023-10-08 18:51:08,569][21194] Updated weights for policy 1, policy_version 76410 (0.0008) +[2023-10-08 18:51:08,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 157089792. Throughput: 0: 1730.1, 1: 1744.7. Samples: 39274218. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:08,803][19739] Avg episode reward: [(0, '494.400'), (1, '826.590')] +[2023-10-08 18:51:11,194][21195] Updated weights for policy 0, policy_version 77000 (0.0010) +[2023-10-08 18:51:11,559][21195] Updated weights for policy 0, policy_version 77010 (0.0010) +[2023-10-08 18:51:11,923][21195] Updated weights for policy 0, policy_version 77020 (0.0010) +[2023-10-08 18:51:12,466][21194] Updated weights for policy 1, policy_version 76420 (0.0008) +[2023-10-08 18:51:12,830][21194] Updated weights for policy 1, policy_version 76430 (0.0010) +[2023-10-08 18:51:13,193][21194] Updated weights for policy 1, policy_version 76440 (0.0010) +[2023-10-08 18:51:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 157155328. Throughput: 0: 1713.2, 1: 1727.8. Samples: 39294226. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:13,803][19739] Avg episode reward: [(0, '494.400'), (1, '826.590')] +[2023-10-08 18:51:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000076448_78282752.pth... +[2023-10-08 18:51:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000077024_78872576.pth... +[2023-10-08 18:51:13,841][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000075392_77201408.pth +[2023-10-08 18:51:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000074816_76611584.pth +[2023-10-08 18:51:15,722][21195] Updated weights for policy 0, policy_version 77030 (0.0009) +[2023-10-08 18:51:16,092][21195] Updated weights for policy 0, policy_version 77040 (0.0010) +[2023-10-08 18:51:16,455][21195] Updated weights for policy 0, policy_version 77050 (0.0010) +[2023-10-08 18:51:17,220][21194] Updated weights for policy 1, policy_version 76450 (0.0011) +[2023-10-08 18:51:17,583][21194] Updated weights for policy 1, policy_version 76460 (0.0008) +[2023-10-08 18:51:17,955][21194] Updated weights for policy 1, policy_version 76470 (0.0010) +[2023-10-08 18:51:18,319][21194] Updated weights for policy 1, policy_version 76480 (0.0011) +[2023-10-08 18:51:18,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 157220864. Throughput: 0: 1739.9, 1: 1739.3. Samples: 39310446. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:18,804][19739] Avg episode reward: [(0, '494.480'), (1, '826.590')] +[2023-10-08 18:51:20,441][21195] Updated weights for policy 0, policy_version 77060 (0.0007) +[2023-10-08 18:51:20,799][21195] Updated weights for policy 0, policy_version 77070 (0.0008) +[2023-10-08 18:51:21,173][21195] Updated weights for policy 0, policy_version 77080 (0.0008) +[2023-10-08 18:51:22,371][21194] Updated weights for policy 1, policy_version 76490 (0.0007) +[2023-10-08 18:51:22,748][21194] Updated weights for policy 1, policy_version 76500 (0.0008) +[2023-10-08 18:51:23,120][21194] Updated weights for policy 1, policy_version 76510 (0.0008) +[2023-10-08 18:51:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 157286400. Throughput: 0: 1713.5, 1: 1739.6. Samples: 39325624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:23,803][19739] Avg episode reward: [(0, '494.480'), (1, '841.110')] +[2023-10-08 18:51:25,094][21195] Updated weights for policy 0, policy_version 77090 (0.0007) +[2023-10-08 18:51:25,460][21195] Updated weights for policy 0, policy_version 77100 (0.0009) +[2023-10-08 18:51:25,823][21195] Updated weights for policy 0, policy_version 77110 (0.0008) +[2023-10-08 18:51:26,189][21195] Updated weights for policy 0, policy_version 77120 (0.0008) +[2023-10-08 18:51:26,912][21194] Updated weights for policy 1, policy_version 76520 (0.0007) +[2023-10-08 18:51:27,277][21194] Updated weights for policy 1, policy_version 76530 (0.0007) +[2023-10-08 18:51:27,640][21194] Updated weights for policy 1, policy_version 76540 (0.0007) +[2023-10-08 18:51:28,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 157351936. Throughput: 0: 1725.1, 1: 1708.5. Samples: 39345772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:28,803][19739] Avg episode reward: [(0, '494.480'), (1, '841.110')] +[2023-10-08 18:51:30,177][21195] Updated weights for policy 0, policy_version 77130 (0.0007) +[2023-10-08 18:51:30,543][21195] Updated weights for policy 0, policy_version 77140 (0.0008) +[2023-10-08 18:51:30,903][21195] Updated weights for policy 0, policy_version 77150 (0.0009) +[2023-10-08 18:51:31,730][21194] Updated weights for policy 1, policy_version 76550 (0.0009) +[2023-10-08 18:51:32,098][21194] Updated weights for policy 1, policy_version 76560 (0.0009) +[2023-10-08 18:51:32,476][21194] Updated weights for policy 1, policy_version 76570 (0.0007) +[2023-10-08 18:51:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 157417472. Throughput: 0: 1743.9, 1: 1735.5. Samples: 39362392. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:33,803][19739] Avg episode reward: [(0, '494.480'), (1, '841.110')] +[2023-10-08 18:51:34,984][21195] Updated weights for policy 0, policy_version 77160 (0.0008) +[2023-10-08 18:51:35,352][21195] Updated weights for policy 0, policy_version 77170 (0.0008) +[2023-10-08 18:51:35,728][21195] Updated weights for policy 0, policy_version 77180 (0.0010) +[2023-10-08 18:51:36,496][21194] Updated weights for policy 1, policy_version 76580 (0.0011) +[2023-10-08 18:51:36,859][21194] Updated weights for policy 1, policy_version 76590 (0.0010) +[2023-10-08 18:51:37,230][21194] Updated weights for policy 1, policy_version 76600 (0.0011) +[2023-10-08 18:51:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 157483008. Throughput: 0: 1715.1, 1: 1722.1. Samples: 39377170. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:38,803][19739] Avg episode reward: [(0, '494.480'), (1, '841.110')] +[2023-10-08 18:51:39,507][21195] Updated weights for policy 0, policy_version 77190 (0.0009) +[2023-10-08 18:51:39,880][21195] Updated weights for policy 0, policy_version 77200 (0.0010) +[2023-10-08 18:51:40,239][21195] Updated weights for policy 0, policy_version 77210 (0.0010) +[2023-10-08 18:51:41,123][21194] Updated weights for policy 1, policy_version 76610 (0.0009) +[2023-10-08 18:51:41,497][21194] Updated weights for policy 1, policy_version 76620 (0.0007) +[2023-10-08 18:51:41,855][21194] Updated weights for policy 1, policy_version 76630 (0.0009) +[2023-10-08 18:51:42,218][21194] Updated weights for policy 1, policy_version 76640 (0.0009) +[2023-10-08 18:51:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 157548544. Throughput: 0: 1750.6, 1: 1712.0. Samples: 39398414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:43,803][19739] Avg episode reward: [(0, '494.480'), (1, '841.110')] +[2023-10-08 18:51:43,967][21195] Updated weights for policy 0, policy_version 77220 (0.0007) +[2023-10-08 18:51:44,342][21195] Updated weights for policy 0, policy_version 77230 (0.0011) +[2023-10-08 18:51:44,717][21195] Updated weights for policy 0, policy_version 77240 (0.0007) +[2023-10-08 18:51:46,248][21194] Updated weights for policy 1, policy_version 76650 (0.0009) +[2023-10-08 18:51:46,620][21194] Updated weights for policy 1, policy_version 76660 (0.0008) +[2023-10-08 18:51:46,988][21194] Updated weights for policy 1, policy_version 76670 (0.0008) +[2023-10-08 18:51:48,536][21195] Updated weights for policy 0, policy_version 77250 (0.0007) +[2023-10-08 18:51:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 157614080. Throughput: 0: 1745.3, 1: 1733.3. Samples: 39414508. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:48,804][19739] Avg episode reward: [(0, '494.480'), (1, '851.270')] +[2023-10-08 18:51:48,900][21195] Updated weights for policy 0, policy_version 77260 (0.0008) +[2023-10-08 18:51:49,270][21195] Updated weights for policy 0, policy_version 77270 (0.0009) +[2023-10-08 18:51:49,635][21195] Updated weights for policy 0, policy_version 77280 (0.0008) +[2023-10-08 18:51:50,995][21194] Updated weights for policy 1, policy_version 76680 (0.0010) +[2023-10-08 18:51:51,360][21194] Updated weights for policy 1, policy_version 76690 (0.0007) +[2023-10-08 18:51:51,734][21194] Updated weights for policy 1, policy_version 76700 (0.0008) +[2023-10-08 18:51:53,424][21195] Updated weights for policy 0, policy_version 77290 (0.0008) +[2023-10-08 18:51:53,794][21195] Updated weights for policy 0, policy_version 77300 (0.0010) +[2023-10-08 18:51:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 157679616. Throughput: 0: 1747.8, 1: 1698.0. Samples: 39429278. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:53,804][19739] Avg episode reward: [(0, '494.480'), (1, '851.270')] +[2023-10-08 18:51:54,164][21195] Updated weights for policy 0, policy_version 77310 (0.0009) +[2023-10-08 18:51:55,508][21194] Updated weights for policy 1, policy_version 76710 (0.0009) +[2023-10-08 18:51:55,874][21194] Updated weights for policy 1, policy_version 76720 (0.0007) +[2023-10-08 18:51:56,244][21194] Updated weights for policy 1, policy_version 76730 (0.0008) +[2023-10-08 18:51:57,966][21195] Updated weights for policy 0, policy_version 77320 (0.0008) +[2023-10-08 18:51:58,328][21195] Updated weights for policy 0, policy_version 77330 (0.0007) +[2023-10-08 18:51:58,702][21195] Updated weights for policy 0, policy_version 77340 (0.0007) +[2023-10-08 18:51:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 157745152. Throughput: 0: 1760.8, 1: 1721.6. Samples: 39450936. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:51:58,803][19739] Avg episode reward: [(0, '494.480'), (1, '851.270')] +[2023-10-08 18:51:59,988][21194] Updated weights for policy 1, policy_version 76740 (0.0008) +[2023-10-08 18:52:00,354][21194] Updated weights for policy 1, policy_version 76750 (0.0008) +[2023-10-08 18:52:00,721][21194] Updated weights for policy 1, policy_version 76760 (0.0009) +[2023-10-08 18:52:02,599][21195] Updated weights for policy 0, policy_version 77350 (0.0009) +[2023-10-08 18:52:02,974][21195] Updated weights for policy 0, policy_version 77360 (0.0008) +[2023-10-08 18:52:03,335][21195] Updated weights for policy 0, policy_version 77370 (0.0007) +[2023-10-08 18:52:03,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 157843456. Throughput: 0: 1732.1, 1: 1707.8. Samples: 39465242. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:03,803][19739] Avg episode reward: [(0, '494.480'), (1, '851.270')] +[2023-10-08 18:52:04,571][21194] Updated weights for policy 1, policy_version 76770 (0.0009) +[2023-10-08 18:52:04,927][21194] Updated weights for policy 1, policy_version 76780 (0.0008) +[2023-10-08 18:52:05,291][21194] Updated weights for policy 1, policy_version 76790 (0.0011) +[2023-10-08 18:52:05,659][21194] Updated weights for policy 1, policy_version 76800 (0.0011) +[2023-10-08 18:52:07,237][21195] Updated weights for policy 0, policy_version 77380 (0.0008) +[2023-10-08 18:52:07,611][21195] Updated weights for policy 0, policy_version 77390 (0.0009) +[2023-10-08 18:52:07,976][21195] Updated weights for policy 0, policy_version 77400 (0.0009) +[2023-10-08 18:52:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 157908992. Throughput: 0: 1767.8, 1: 1719.6. Samples: 39482556. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:08,803][19739] Avg episode reward: [(0, '494.480'), (1, '851.270')] +[2023-10-08 18:52:09,721][21194] Updated weights for policy 1, policy_version 76810 (0.0009) +[2023-10-08 18:52:10,093][21194] Updated weights for policy 1, policy_version 76820 (0.0009) +[2023-10-08 18:52:10,452][21194] Updated weights for policy 1, policy_version 76830 (0.0008) +[2023-10-08 18:52:11,875][21195] Updated weights for policy 0, policy_version 77410 (0.0009) +[2023-10-08 18:52:12,239][21195] Updated weights for policy 0, policy_version 77420 (0.0010) +[2023-10-08 18:52:12,602][21195] Updated weights for policy 0, policy_version 77430 (0.0010) +[2023-10-08 18:52:12,978][21195] Updated weights for policy 0, policy_version 77440 (0.0009) +[2023-10-08 18:52:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 157974528. Throughput: 0: 1742.4, 1: 1751.8. Samples: 39503010. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:13,803][19739] Avg episode reward: [(0, '506.430'), (1, '866.440')] +[2023-10-08 18:52:14,207][21194] Updated weights for policy 1, policy_version 76840 (0.0010) +[2023-10-08 18:52:14,576][21194] Updated weights for policy 1, policy_version 76850 (0.0011) +[2023-10-08 18:52:14,942][21194] Updated weights for policy 1, policy_version 76860 (0.0007) +[2023-10-08 18:52:16,744][21195] Updated weights for policy 0, policy_version 77450 (0.0008) +[2023-10-08 18:52:17,109][21195] Updated weights for policy 0, policy_version 77460 (0.0009) +[2023-10-08 18:52:17,477][21195] Updated weights for policy 0, policy_version 77470 (0.0007) +[2023-10-08 18:52:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 158040064. Throughput: 0: 1741.2, 1: 1721.2. Samples: 39518204. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:18,803][19739] Avg episode reward: [(0, '506.430'), (1, '866.440')] +[2023-10-08 18:52:18,826][21194] Updated weights for policy 1, policy_version 76870 (0.0009) +[2023-10-08 18:52:19,206][21194] Updated weights for policy 1, policy_version 76880 (0.0009) +[2023-10-08 18:52:19,570][21194] Updated weights for policy 1, policy_version 76890 (0.0009) +[2023-10-08 18:52:21,304][21195] Updated weights for policy 0, policy_version 77480 (0.0009) +[2023-10-08 18:52:21,670][21195] Updated weights for policy 0, policy_version 77490 (0.0008) +[2023-10-08 18:52:22,033][21195] Updated weights for policy 0, policy_version 77500 (0.0007) +[2023-10-08 18:52:23,256][21194] Updated weights for policy 1, policy_version 76900 (0.0008) +[2023-10-08 18:52:23,626][21194] Updated weights for policy 1, policy_version 76910 (0.0007) +[2023-10-08 18:52:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 158105600. Throughput: 0: 1750.3, 1: 1745.5. Samples: 39534480. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:23,804][19739] Avg episode reward: [(0, '506.430'), (1, '856.540')] +[2023-10-08 18:52:23,989][21194] Updated weights for policy 1, policy_version 76920 (0.0011) +[2023-10-08 18:52:25,995][21195] Updated weights for policy 0, policy_version 77510 (0.0008) +[2023-10-08 18:52:26,354][21195] Updated weights for policy 0, policy_version 77520 (0.0010) +[2023-10-08 18:52:26,726][21195] Updated weights for policy 0, policy_version 77530 (0.0009) +[2023-10-08 18:52:27,774][21194] Updated weights for policy 1, policy_version 76930 (0.0007) +[2023-10-08 18:52:28,134][21194] Updated weights for policy 1, policy_version 76940 (0.0009) +[2023-10-08 18:52:28,499][21194] Updated weights for policy 1, policy_version 76950 (0.0009) +[2023-10-08 18:52:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 158171136. Throughput: 0: 1738.6, 1: 1754.4. Samples: 39555598. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:28,803][19739] Avg episode reward: [(0, '506.430'), (1, '856.540')] +[2023-10-08 18:52:28,866][21194] Updated weights for policy 1, policy_version 76960 (0.0010) +[2023-10-08 18:52:30,457][21195] Updated weights for policy 0, policy_version 77540 (0.0008) +[2023-10-08 18:52:30,824][21195] Updated weights for policy 0, policy_version 77550 (0.0010) +[2023-10-08 18:52:31,200][21195] Updated weights for policy 0, policy_version 77560 (0.0009) +[2023-10-08 18:52:32,934][21194] Updated weights for policy 1, policy_version 76970 (0.0008) +[2023-10-08 18:52:33,299][21194] Updated weights for policy 1, policy_version 76980 (0.0007) +[2023-10-08 18:52:33,670][21194] Updated weights for policy 1, policy_version 76990 (0.0008) +[2023-10-08 18:52:33,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 158269440. Throughput: 0: 1744.6, 1: 1740.0. Samples: 39571316. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:33,803][19739] Avg episode reward: [(0, '506.430'), (1, '826.500')] +[2023-10-08 18:52:35,179][21195] Updated weights for policy 0, policy_version 77570 (0.0007) +[2023-10-08 18:52:35,535][21195] Updated weights for policy 0, policy_version 77580 (0.0010) +[2023-10-08 18:52:35,898][21195] Updated weights for policy 0, policy_version 77590 (0.0010) +[2023-10-08 18:52:36,266][21195] Updated weights for policy 0, policy_version 77600 (0.0011) +[2023-10-08 18:52:37,800][21194] Updated weights for policy 1, policy_version 77000 (0.0010) +[2023-10-08 18:52:38,165][21194] Updated weights for policy 1, policy_version 77010 (0.0010) +[2023-10-08 18:52:38,534][21194] Updated weights for policy 1, policy_version 77020 (0.0011) +[2023-10-08 18:52:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 158334976. Throughput: 0: 1734.8, 1: 1766.6. Samples: 39586842. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:38,803][19739] Avg episode reward: [(0, '506.430'), (1, '811.980')] +[2023-10-08 18:52:40,332][21195] Updated weights for policy 0, policy_version 77610 (0.0010) +[2023-10-08 18:52:40,706][21195] Updated weights for policy 0, policy_version 77620 (0.0009) +[2023-10-08 18:52:41,070][21195] Updated weights for policy 0, policy_version 77630 (0.0010) +[2023-10-08 18:52:42,355][21194] Updated weights for policy 1, policy_version 77030 (0.0009) +[2023-10-08 18:52:42,714][21194] Updated weights for policy 1, policy_version 77040 (0.0007) +[2023-10-08 18:52:43,085][21194] Updated weights for policy 1, policy_version 77050 (0.0007) +[2023-10-08 18:52:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 158400512. Throughput: 0: 1736.1, 1: 1739.3. Samples: 39607328. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:43,803][19739] Avg episode reward: [(0, '521.420'), (1, '827.100')] +[2023-10-08 18:52:44,927][21195] Updated weights for policy 0, policy_version 77640 (0.0010) +[2023-10-08 18:52:45,297][21195] Updated weights for policy 0, policy_version 77650 (0.0009) +[2023-10-08 18:52:45,674][21195] Updated weights for policy 0, policy_version 77660 (0.0011) +[2023-10-08 18:52:46,995][21194] Updated weights for policy 1, policy_version 77060 (0.0007) +[2023-10-08 18:52:47,355][21194] Updated weights for policy 1, policy_version 77070 (0.0008) +[2023-10-08 18:52:47,722][21194] Updated weights for policy 1, policy_version 77080 (0.0008) +[2023-10-08 18:52:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 158466048. Throughput: 0: 1760.0, 1: 1764.8. Samples: 39623860. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:48,803][19739] Avg episode reward: [(0, '530.690'), (1, '838.170')] +[2023-10-08 18:52:49,621][21195] Updated weights for policy 0, policy_version 77670 (0.0009) +[2023-10-08 18:52:49,991][21195] Updated weights for policy 0, policy_version 77680 (0.0008) +[2023-10-08 18:52:50,357][21195] Updated weights for policy 0, policy_version 77690 (0.0010) +[2023-10-08 18:52:51,588][21194] Updated weights for policy 1, policy_version 77090 (0.0009) +[2023-10-08 18:52:51,953][21194] Updated weights for policy 1, policy_version 77100 (0.0008) +[2023-10-08 18:52:52,316][21194] Updated weights for policy 1, policy_version 77110 (0.0010) +[2023-10-08 18:52:52,677][21194] Updated weights for policy 1, policy_version 77120 (0.0010) +[2023-10-08 18:52:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 158531584. Throughput: 0: 1725.0, 1: 1747.7. Samples: 39638826. Policy #0 lag: (min: 2.0, avg: 5.0, max: 34.0) +[2023-10-08 18:52:53,803][19739] Avg episode reward: [(0, '514.780'), (1, '838.170')] +[2023-10-08 18:52:54,279][21195] Updated weights for policy 0, policy_version 77700 (0.0008) +[2023-10-08 18:52:54,641][21195] Updated weights for policy 0, policy_version 77710 (0.0008) +[2023-10-08 18:52:55,022][21195] Updated weights for policy 0, policy_version 77720 (0.0010) +[2023-10-08 18:52:56,801][21194] Updated weights for policy 1, policy_version 77130 (0.0008) +[2023-10-08 18:52:57,181][21194] Updated weights for policy 1, policy_version 77140 (0.0008) +[2023-10-08 18:52:57,547][21194] Updated weights for policy 1, policy_version 77150 (0.0008) +[2023-10-08 18:52:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 158597120. Throughput: 0: 1751.1, 1: 1722.2. Samples: 39659308. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:52:58,803][19739] Avg episode reward: [(0, '514.780'), (1, '838.130')] +[2023-10-08 18:52:58,996][21195] Updated weights for policy 0, policy_version 77730 (0.0009) +[2023-10-08 18:52:59,364][21195] Updated weights for policy 0, policy_version 77740 (0.0007) +[2023-10-08 18:52:59,735][21195] Updated weights for policy 0, policy_version 77750 (0.0008) +[2023-10-08 18:53:00,094][21195] Updated weights for policy 0, policy_version 77760 (0.0008) +[2023-10-08 18:53:01,307][21194] Updated weights for policy 1, policy_version 77160 (0.0010) +[2023-10-08 18:53:01,673][21194] Updated weights for policy 1, policy_version 77170 (0.0010) +[2023-10-08 18:53:02,044][21194] Updated weights for policy 1, policy_version 77180 (0.0007) +[2023-10-08 18:53:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 158662656. Throughput: 0: 1752.6, 1: 1757.7. Samples: 39676166. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:03,803][19739] Avg episode reward: [(0, '514.780'), (1, '822.950')] +[2023-10-08 18:53:04,013][21195] Updated weights for policy 0, policy_version 77770 (0.0007) +[2023-10-08 18:53:04,378][21195] Updated weights for policy 0, policy_version 77780 (0.0007) +[2023-10-08 18:53:04,755][21195] Updated weights for policy 0, policy_version 77790 (0.0007) +[2023-10-08 18:53:06,080][21194] Updated weights for policy 1, policy_version 77190 (0.0008) +[2023-10-08 18:53:06,441][21194] Updated weights for policy 1, policy_version 77200 (0.0008) +[2023-10-08 18:53:06,816][21194] Updated weights for policy 1, policy_version 77210 (0.0009) +[2023-10-08 18:53:08,611][21195] Updated weights for policy 0, policy_version 77800 (0.0008) +[2023-10-08 18:53:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 158728192. Throughput: 0: 1750.3, 1: 1718.5. Samples: 39690572. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:08,803][19739] Avg episode reward: [(0, '500.100'), (1, '852.910')] +[2023-10-08 18:53:08,981][21195] Updated weights for policy 0, policy_version 77810 (0.0007) +[2023-10-08 18:53:09,350][21195] Updated weights for policy 0, policy_version 77820 (0.0007) +[2023-10-08 18:53:10,762][21194] Updated weights for policy 1, policy_version 77220 (0.0008) +[2023-10-08 18:53:11,121][21194] Updated weights for policy 1, policy_version 77230 (0.0007) +[2023-10-08 18:53:11,486][21194] Updated weights for policy 1, policy_version 77240 (0.0009) +[2023-10-08 18:53:13,354][21195] Updated weights for policy 0, policy_version 77830 (0.0007) +[2023-10-08 18:53:13,724][21195] Updated weights for policy 0, policy_version 77840 (0.0007) +[2023-10-08 18:53:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 158793728. Throughput: 0: 1750.7, 1: 1719.8. Samples: 39711770. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:13,803][19739] Avg episode reward: [(0, '506.460'), (1, '853.420')] +[2023-10-08 18:53:13,809][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000077248_79101952.pth... +[2023-10-08 18:53:13,840][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000075648_77463552.pth +[2023-10-08 18:53:14,089][21195] Updated weights for policy 0, policy_version 77850 (0.0007) +[2023-10-08 18:53:14,313][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000077856_79724544.pth... +[2023-10-08 18:53:14,354][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000076224_78053376.pth +[2023-10-08 18:53:15,325][21194] Updated weights for policy 1, policy_version 77250 (0.0010) +[2023-10-08 18:53:15,690][21194] Updated weights for policy 1, policy_version 77260 (0.0008) +[2023-10-08 18:53:16,057][21194] Updated weights for policy 1, policy_version 77270 (0.0007) +[2023-10-08 18:53:16,430][21194] Updated weights for policy 1, policy_version 77280 (0.0007) +[2023-10-08 18:53:18,038][21195] Updated weights for policy 0, policy_version 77860 (0.0009) +[2023-10-08 18:53:18,404][21195] Updated weights for policy 0, policy_version 77870 (0.0012) +[2023-10-08 18:53:18,763][21195] Updated weights for policy 0, policy_version 77880 (0.0010) +[2023-10-08 18:53:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 158859264. Throughput: 0: 1725.8, 1: 1725.5. Samples: 39726622. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:18,803][19739] Avg episode reward: [(0, '521.670'), (1, '853.420')] +[2023-10-08 18:53:20,287][21194] Updated weights for policy 1, policy_version 77290 (0.0009) +[2023-10-08 18:53:20,658][21194] Updated weights for policy 1, policy_version 77300 (0.0009) +[2023-10-08 18:53:21,025][21194] Updated weights for policy 1, policy_version 77310 (0.0010) +[2023-10-08 18:53:22,744][21195] Updated weights for policy 0, policy_version 77890 (0.0010) +[2023-10-08 18:53:23,109][21195] Updated weights for policy 0, policy_version 77900 (0.0009) +[2023-10-08 18:53:23,478][21195] Updated weights for policy 0, policy_version 77910 (0.0008) +[2023-10-08 18:53:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 158924800. Throughput: 0: 1742.8, 1: 1714.1. Samples: 39742406. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:23,803][19739] Avg episode reward: [(0, '530.170'), (1, '853.420')] +[2023-10-08 18:53:23,839][21195] Updated weights for policy 0, policy_version 77920 (0.0009) +[2023-10-08 18:53:25,182][21194] Updated weights for policy 1, policy_version 77320 (0.0008) +[2023-10-08 18:53:25,544][21194] Updated weights for policy 1, policy_version 77330 (0.0008) +[2023-10-08 18:53:25,905][21194] Updated weights for policy 1, policy_version 77340 (0.0011) +[2023-10-08 18:53:27,764][21195] Updated weights for policy 0, policy_version 77930 (0.0010) +[2023-10-08 18:53:28,142][21195] Updated weights for policy 0, policy_version 77940 (0.0009) +[2023-10-08 18:53:28,508][21195] Updated weights for policy 0, policy_version 77950 (0.0009) +[2023-10-08 18:53:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 159023104. Throughput: 0: 1731.0, 1: 1739.4. Samples: 39763496. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:28,803][19739] Avg episode reward: [(0, '499.960'), (1, '853.420')] +[2023-10-08 18:53:29,770][21194] Updated weights for policy 1, policy_version 77350 (0.0009) +[2023-10-08 18:53:30,138][21194] Updated weights for policy 1, policy_version 77360 (0.0007) +[2023-10-08 18:53:30,505][21194] Updated weights for policy 1, policy_version 77370 (0.0010) +[2023-10-08 18:53:32,388][21195] Updated weights for policy 0, policy_version 77960 (0.0007) +[2023-10-08 18:53:32,755][21195] Updated weights for policy 0, policy_version 77970 (0.0008) +[2023-10-08 18:53:33,125][21195] Updated weights for policy 0, policy_version 77980 (0.0008) +[2023-10-08 18:53:33,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 159088640. Throughput: 0: 1711.8, 1: 1713.6. Samples: 39778004. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:33,804][19739] Avg episode reward: [(0, '499.960'), (1, '853.420')] +[2023-10-08 18:53:34,424][21194] Updated weights for policy 1, policy_version 77380 (0.0007) +[2023-10-08 18:53:34,795][21194] Updated weights for policy 1, policy_version 77390 (0.0007) +[2023-10-08 18:53:35,163][21194] Updated weights for policy 1, policy_version 77400 (0.0007) +[2023-10-08 18:53:37,018][21195] Updated weights for policy 0, policy_version 77990 (0.0010) +[2023-10-08 18:53:37,385][21195] Updated weights for policy 0, policy_version 78000 (0.0008) +[2023-10-08 18:53:37,767][21195] Updated weights for policy 0, policy_version 78010 (0.0008) +[2023-10-08 18:53:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 159154176. Throughput: 0: 1747.5, 1: 1723.8. Samples: 39795034. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:38,803][19739] Avg episode reward: [(0, '499.960'), (1, '853.420')] +[2023-10-08 18:53:38,944][21194] Updated weights for policy 1, policy_version 77410 (0.0009) +[2023-10-08 18:53:39,313][21194] Updated weights for policy 1, policy_version 77420 (0.0008) +[2023-10-08 18:53:39,683][21194] Updated weights for policy 1, policy_version 77430 (0.0009) +[2023-10-08 18:53:40,049][21194] Updated weights for policy 1, policy_version 77440 (0.0008) +[2023-10-08 18:53:41,759][21195] Updated weights for policy 0, policy_version 78020 (0.0009) +[2023-10-08 18:53:42,131][21195] Updated weights for policy 0, policy_version 78030 (0.0008) +[2023-10-08 18:53:42,510][21195] Updated weights for policy 0, policy_version 78040 (0.0010) +[2023-10-08 18:53:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 159219712. Throughput: 0: 1713.9, 1: 1750.5. Samples: 39815206. Policy #0 lag: (min: 21.0, avg: 27.4, max: 53.0) +[2023-10-08 18:53:43,803][19739] Avg episode reward: [(0, '499.960'), (1, '853.420')] +[2023-10-08 18:53:44,025][21194] Updated weights for policy 1, policy_version 77450 (0.0008) +[2023-10-08 18:53:44,387][21194] Updated weights for policy 1, policy_version 77460 (0.0007) +[2023-10-08 18:53:44,753][21194] Updated weights for policy 1, policy_version 77470 (0.0007) +[2023-10-08 18:53:46,362][21195] Updated weights for policy 0, policy_version 78050 (0.0010) +[2023-10-08 18:53:46,741][21195] Updated weights for policy 0, policy_version 78060 (0.0007) +[2023-10-08 18:53:47,114][21195] Updated weights for policy 0, policy_version 78070 (0.0007) +[2023-10-08 18:53:47,492][21195] Updated weights for policy 0, policy_version 78080 (0.0010) +[2023-10-08 18:53:48,679][21194] Updated weights for policy 1, policy_version 77480 (0.0007) +[2023-10-08 18:53:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 159285248. Throughput: 0: 1717.6, 1: 1715.6. Samples: 39830656. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:53:48,803][19739] Avg episode reward: [(0, '499.960'), (1, '852.660')] +[2023-10-08 18:53:49,048][21194] Updated weights for policy 1, policy_version 77490 (0.0008) +[2023-10-08 18:53:49,402][21194] Updated weights for policy 1, policy_version 77500 (0.0007) +[2023-10-08 18:53:51,314][21195] Updated weights for policy 0, policy_version 78090 (0.0009) +[2023-10-08 18:53:51,684][21195] Updated weights for policy 0, policy_version 78100 (0.0008) +[2023-10-08 18:53:52,048][21195] Updated weights for policy 0, policy_version 78110 (0.0008) +[2023-10-08 18:53:53,447][21194] Updated weights for policy 1, policy_version 77510 (0.0007) +[2023-10-08 18:53:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 159350784. Throughput: 0: 1719.7, 1: 1744.2. Samples: 39846448. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:53:53,803][19739] Avg episode reward: [(0, '499.960'), (1, '867.470')] +[2023-10-08 18:53:53,817][21194] Updated weights for policy 1, policy_version 77520 (0.0008) +[2023-10-08 18:53:54,182][21194] Updated weights for policy 1, policy_version 77530 (0.0009) +[2023-10-08 18:53:55,842][21195] Updated weights for policy 0, policy_version 78120 (0.0008) +[2023-10-08 18:53:56,206][21195] Updated weights for policy 0, policy_version 78130 (0.0007) +[2023-10-08 18:53:56,585][21195] Updated weights for policy 0, policy_version 78140 (0.0009) +[2023-10-08 18:53:57,966][21194] Updated weights for policy 1, policy_version 77540 (0.0009) +[2023-10-08 18:53:58,325][21194] Updated weights for policy 1, policy_version 77550 (0.0008) +[2023-10-08 18:53:58,686][21194] Updated weights for policy 1, policy_version 77560 (0.0008) +[2023-10-08 18:53:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 159416320. Throughput: 0: 1716.6, 1: 1745.3. Samples: 39867554. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:53:58,803][19739] Avg episode reward: [(0, '499.960'), (1, '867.470')] +[2023-10-08 18:54:00,586][21195] Updated weights for policy 0, policy_version 78150 (0.0009) +[2023-10-08 18:54:00,953][21195] Updated weights for policy 0, policy_version 78160 (0.0008) +[2023-10-08 18:54:01,323][21195] Updated weights for policy 0, policy_version 78170 (0.0008) +[2023-10-08 18:54:02,356][21194] Updated weights for policy 1, policy_version 77570 (0.0009) +[2023-10-08 18:54:02,719][21194] Updated weights for policy 1, policy_version 77580 (0.0008) +[2023-10-08 18:54:03,077][21194] Updated weights for policy 1, policy_version 77590 (0.0008) +[2023-10-08 18:54:03,448][21194] Updated weights for policy 1, policy_version 77600 (0.0010) +[2023-10-08 18:54:03,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 159514624. Throughput: 0: 1742.2, 1: 1738.4. Samples: 39883250. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:03,803][19739] Avg episode reward: [(0, '501.010'), (1, '867.470')] +[2023-10-08 18:54:05,282][21195] Updated weights for policy 0, policy_version 78180 (0.0008) +[2023-10-08 18:54:05,640][21195] Updated weights for policy 0, policy_version 78190 (0.0010) +[2023-10-08 18:54:06,010][21195] Updated weights for policy 0, policy_version 78200 (0.0010) +[2023-10-08 18:54:07,421][21194] Updated weights for policy 1, policy_version 77610 (0.0008) +[2023-10-08 18:54:07,791][21194] Updated weights for policy 1, policy_version 77620 (0.0007) +[2023-10-08 18:54:08,159][21194] Updated weights for policy 1, policy_version 77630 (0.0007) +[2023-10-08 18:54:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13995.8). Total num frames: 159580160. Throughput: 0: 1719.1, 1: 1752.0. Samples: 39898604. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:08,803][19739] Avg episode reward: [(0, '501.010'), (1, '867.470')] +[2023-10-08 18:54:09,896][21195] Updated weights for policy 0, policy_version 78210 (0.0009) +[2023-10-08 18:54:10,254][21195] Updated weights for policy 0, policy_version 78220 (0.0009) +[2023-10-08 18:54:10,630][21195] Updated weights for policy 0, policy_version 78230 (0.0008) +[2023-10-08 18:54:10,999][21195] Updated weights for policy 0, policy_version 78240 (0.0011) +[2023-10-08 18:54:12,237][21194] Updated weights for policy 1, policy_version 77640 (0.0008) +[2023-10-08 18:54:12,596][21194] Updated weights for policy 1, policy_version 77650 (0.0008) +[2023-10-08 18:54:12,969][21194] Updated weights for policy 1, policy_version 77660 (0.0007) +[2023-10-08 18:54:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 159645696. Throughput: 0: 1733.7, 1: 1723.9. Samples: 39919088. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:13,803][19739] Avg episode reward: [(0, '516.300'), (1, '867.470')] +[2023-10-08 18:54:14,816][21195] Updated weights for policy 0, policy_version 78250 (0.0008) +[2023-10-08 18:54:15,195][21195] Updated weights for policy 0, policy_version 78260 (0.0008) +[2023-10-08 18:54:15,554][21195] Updated weights for policy 0, policy_version 78270 (0.0009) +[2023-10-08 18:54:16,905][21194] Updated weights for policy 1, policy_version 77670 (0.0009) +[2023-10-08 18:54:17,266][21194] Updated weights for policy 1, policy_version 77680 (0.0007) +[2023-10-08 18:54:17,631][21194] Updated weights for policy 1, policy_version 77690 (0.0009) +[2023-10-08 18:54:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 159711232. Throughput: 0: 1754.5, 1: 1755.5. Samples: 39935952. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:18,803][19739] Avg episode reward: [(0, '531.850'), (1, '867.470')] +[2023-10-08 18:54:19,582][21195] Updated weights for policy 0, policy_version 78280 (0.0008) +[2023-10-08 18:54:19,948][21195] Updated weights for policy 0, policy_version 78290 (0.0008) +[2023-10-08 18:54:20,315][21195] Updated weights for policy 0, policy_version 78300 (0.0011) +[2023-10-08 18:54:21,508][21194] Updated weights for policy 1, policy_version 77700 (0.0010) +[2023-10-08 18:54:21,869][21194] Updated weights for policy 1, policy_version 77710 (0.0011) +[2023-10-08 18:54:22,239][21194] Updated weights for policy 1, policy_version 77720 (0.0010) +[2023-10-08 18:54:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 159776768. Throughput: 0: 1717.5, 1: 1738.2. Samples: 39950542. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:23,804][19739] Avg episode reward: [(0, '577.490'), (1, '867.470')] +[2023-10-08 18:54:24,207][21195] Updated weights for policy 0, policy_version 78310 (0.0010) +[2023-10-08 18:54:24,579][21195] Updated weights for policy 0, policy_version 78320 (0.0007) +[2023-10-08 18:54:24,948][21195] Updated weights for policy 0, policy_version 78330 (0.0009) +[2023-10-08 18:54:26,183][21194] Updated weights for policy 1, policy_version 77730 (0.0009) +[2023-10-08 18:54:26,541][21194] Updated weights for policy 1, policy_version 77740 (0.0011) +[2023-10-08 18:54:26,911][21194] Updated weights for policy 1, policy_version 77750 (0.0009) +[2023-10-08 18:54:27,275][21194] Updated weights for policy 1, policy_version 77760 (0.0007) +[2023-10-08 18:54:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 159842304. Throughput: 0: 1753.8, 1: 1722.0. Samples: 39971620. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:28,803][19739] Avg episode reward: [(0, '577.490'), (1, '867.470')] +[2023-10-08 18:54:28,864][21195] Updated weights for policy 0, policy_version 78340 (0.0008) +[2023-10-08 18:54:29,235][21195] Updated weights for policy 0, policy_version 78350 (0.0008) +[2023-10-08 18:54:29,613][21195] Updated weights for policy 0, policy_version 78360 (0.0008) +[2023-10-08 18:54:31,330][21194] Updated weights for policy 1, policy_version 77770 (0.0008) +[2023-10-08 18:54:31,701][21194] Updated weights for policy 1, policy_version 77780 (0.0007) +[2023-10-08 18:54:32,061][21194] Updated weights for policy 1, policy_version 77790 (0.0010) +[2023-10-08 18:54:33,374][21195] Updated weights for policy 0, policy_version 78370 (0.0007) +[2023-10-08 18:54:33,751][21195] Updated weights for policy 0, policy_version 78380 (0.0008) +[2023-10-08 18:54:33,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 159907840. Throughput: 0: 1740.7, 1: 1744.1. Samples: 39987474. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:33,803][19739] Avg episode reward: [(0, '577.490'), (1, '867.470')] +[2023-10-08 18:54:34,113][21195] Updated weights for policy 0, policy_version 78390 (0.0009) +[2023-10-08 18:54:34,484][21195] Updated weights for policy 0, policy_version 78400 (0.0009) +[2023-10-08 18:54:36,142][21194] Updated weights for policy 1, policy_version 77800 (0.0009) +[2023-10-08 18:54:36,508][21194] Updated weights for policy 1, policy_version 77810 (0.0009) +[2023-10-08 18:54:36,884][21194] Updated weights for policy 1, policy_version 77820 (0.0008) +[2023-10-08 18:54:38,268][21195] Updated weights for policy 0, policy_version 78410 (0.0009) +[2023-10-08 18:54:38,649][21195] Updated weights for policy 0, policy_version 78420 (0.0010) +[2023-10-08 18:54:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 159973376. Throughput: 0: 1743.1, 1: 1715.6. Samples: 40002088. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 18:54:38,803][19739] Avg episode reward: [(0, '577.490'), (1, '867.470')] +[2023-10-08 18:54:39,013][21195] Updated weights for policy 0, policy_version 78430 (0.0007) +[2023-10-08 18:54:40,782][21194] Updated weights for policy 1, policy_version 77830 (0.0010) +[2023-10-08 18:54:41,145][21194] Updated weights for policy 1, policy_version 77840 (0.0011) +[2023-10-08 18:54:41,518][21194] Updated weights for policy 1, policy_version 77850 (0.0008) +[2023-10-08 18:54:43,069][21195] Updated weights for policy 0, policy_version 78440 (0.0008) +[2023-10-08 18:54:43,439][21195] Updated weights for policy 0, policy_version 78450 (0.0007) +[2023-10-08 18:54:43,799][21195] Updated weights for policy 0, policy_version 78460 (0.0011) +[2023-10-08 18:54:43,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13653.3, 300 sec: 13773.6). Total num frames: 160038912. Throughput: 0: 1756.0, 1: 1714.0. Samples: 40023706. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:54:43,804][19739] Avg episode reward: [(0, '577.490'), (1, '867.470')] +[2023-10-08 18:54:45,459][21194] Updated weights for policy 1, policy_version 77860 (0.0008) +[2023-10-08 18:54:45,821][21194] Updated weights for policy 1, policy_version 77870 (0.0009) +[2023-10-08 18:54:46,191][21194] Updated weights for policy 1, policy_version 77880 (0.0008) +[2023-10-08 18:54:47,613][21195] Updated weights for policy 0, policy_version 78470 (0.0011) +[2023-10-08 18:54:47,983][21195] Updated weights for policy 0, policy_version 78480 (0.0009) +[2023-10-08 18:54:48,356][21195] Updated weights for policy 0, policy_version 78490 (0.0007) +[2023-10-08 18:54:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 160137216. Throughput: 0: 1728.8, 1: 1721.1. Samples: 40038494. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:54:48,803][19739] Avg episode reward: [(0, '577.490'), (1, '867.210')] +[2023-10-08 18:54:50,124][21194] Updated weights for policy 1, policy_version 77890 (0.0009) +[2023-10-08 18:54:50,496][21194] Updated weights for policy 1, policy_version 77900 (0.0011) +[2023-10-08 18:54:50,862][21194] Updated weights for policy 1, policy_version 77910 (0.0011) +[2023-10-08 18:54:51,226][21194] Updated weights for policy 1, policy_version 77920 (0.0010) +[2023-10-08 18:54:52,282][21195] Updated weights for policy 0, policy_version 78500 (0.0008) +[2023-10-08 18:54:52,655][21195] Updated weights for policy 0, policy_version 78510 (0.0008) +[2023-10-08 18:54:53,042][21195] Updated weights for policy 0, policy_version 78520 (0.0007) +[2023-10-08 18:54:53,803][19739] Fps is (10 sec: 16384.6, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 160202752. Throughput: 0: 1763.3, 1: 1704.2. Samples: 40054642. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:54:53,803][19739] Avg episode reward: [(0, '577.490'), (1, '867.210')] +[2023-10-08 18:54:55,286][21194] Updated weights for policy 1, policy_version 77930 (0.0007) +[2023-10-08 18:54:55,648][21194] Updated weights for policy 1, policy_version 77940 (0.0008) +[2023-10-08 18:54:56,024][21194] Updated weights for policy 1, policy_version 77950 (0.0009) +[2023-10-08 18:54:56,682][21195] Updated weights for policy 0, policy_version 78530 (0.0008) +[2023-10-08 18:54:57,061][21195] Updated weights for policy 0, policy_version 78540 (0.0009) +[2023-10-08 18:54:57,420][21195] Updated weights for policy 0, policy_version 78550 (0.0007) +[2023-10-08 18:54:57,795][21195] Updated weights for policy 0, policy_version 78560 (0.0009) +[2023-10-08 18:54:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 160268288. Throughput: 0: 1737.0, 1: 1726.8. Samples: 40074958. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:54:58,803][19739] Avg episode reward: [(0, '593.020'), (1, '867.210')] +[2023-10-08 18:55:00,040][21194] Updated weights for policy 1, policy_version 77960 (0.0008) +[2023-10-08 18:55:00,405][21194] Updated weights for policy 1, policy_version 77970 (0.0010) +[2023-10-08 18:55:00,767][21194] Updated weights for policy 1, policy_version 77980 (0.0010) +[2023-10-08 18:55:02,053][21195] Updated weights for policy 0, policy_version 78570 (0.0009) +[2023-10-08 18:55:02,429][21195] Updated weights for policy 0, policy_version 78580 (0.0007) +[2023-10-08 18:55:02,802][21195] Updated weights for policy 0, policy_version 78590 (0.0009) +[2023-10-08 18:55:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 160333824. Throughput: 0: 1734.7, 1: 1694.4. Samples: 40090260. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:55:03,803][19739] Avg episode reward: [(0, '593.020'), (1, '867.210')] +[2023-10-08 18:55:04,591][21194] Updated weights for policy 1, policy_version 77990 (0.0011) +[2023-10-08 18:55:04,951][21194] Updated weights for policy 1, policy_version 78000 (0.0008) +[2023-10-08 18:55:05,316][21194] Updated weights for policy 1, policy_version 78010 (0.0009) +[2023-10-08 18:55:06,585][21195] Updated weights for policy 0, policy_version 78600 (0.0007) +[2023-10-08 18:55:06,949][21195] Updated weights for policy 0, policy_version 78610 (0.0010) +[2023-10-08 18:55:07,325][21195] Updated weights for policy 0, policy_version 78620 (0.0007) +[2023-10-08 18:55:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 160399360. Throughput: 0: 1751.8, 1: 1714.0. Samples: 40106506. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:55:08,803][19739] Avg episode reward: [(0, '608.700'), (1, '867.210')] +[2023-10-08 18:55:09,320][21194] Updated weights for policy 1, policy_version 78020 (0.0011) +[2023-10-08 18:55:09,677][21194] Updated weights for policy 1, policy_version 78030 (0.0010) +[2023-10-08 18:55:10,042][21194] Updated weights for policy 1, policy_version 78040 (0.0012) +[2023-10-08 18:55:11,353][21195] Updated weights for policy 0, policy_version 78630 (0.0007) +[2023-10-08 18:55:11,727][21195] Updated weights for policy 0, policy_version 78640 (0.0007) +[2023-10-08 18:55:12,089][21195] Updated weights for policy 0, policy_version 78650 (0.0007) +[2023-10-08 18:55:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 160464896. Throughput: 0: 1730.8, 1: 1729.9. Samples: 40127352. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:55:13,804][19739] Avg episode reward: [(0, '646.590'), (1, '868.620')] +[2023-10-08 18:55:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000078656_80543744.pth... +[2023-10-08 18:55:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000077024_78872576.pth +[2023-10-08 18:55:13,874][21194] Updated weights for policy 1, policy_version 78050 (0.0010) +[2023-10-08 18:55:14,237][21194] Updated weights for policy 1, policy_version 78060 (0.0011) +[2023-10-08 18:55:14,600][21194] Updated weights for policy 1, policy_version 78070 (0.0007) +[2023-10-08 18:55:14,966][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000078080_79953920.pth... +[2023-10-08 18:55:14,971][21194] Updated weights for policy 1, policy_version 78080 (0.0008) +[2023-10-08 18:55:15,002][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000076448_78282752.pth +[2023-10-08 18:55:15,792][21195] Updated weights for policy 0, policy_version 78660 (0.0007) +[2023-10-08 18:55:16,157][21195] Updated weights for policy 0, policy_version 78670 (0.0009) +[2023-10-08 18:55:16,521][21195] Updated weights for policy 0, policy_version 78680 (0.0011) +[2023-10-08 18:55:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 160530432. Throughput: 0: 1754.9, 1: 1707.0. Samples: 40143262. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:55:18,803][19739] Avg episode reward: [(0, '646.590'), (1, '868.620')] +[2023-10-08 18:55:18,907][21194] Updated weights for policy 1, policy_version 78090 (0.0008) +[2023-10-08 18:55:19,270][21194] Updated weights for policy 1, policy_version 78100 (0.0008) +[2023-10-08 18:55:19,636][21194] Updated weights for policy 1, policy_version 78110 (0.0009) +[2023-10-08 18:55:20,257][21195] Updated weights for policy 0, policy_version 78690 (0.0007) +[2023-10-08 18:55:20,621][21195] Updated weights for policy 0, policy_version 78700 (0.0008) +[2023-10-08 18:55:20,983][21195] Updated weights for policy 0, policy_version 78710 (0.0009) +[2023-10-08 18:55:21,353][21195] Updated weights for policy 0, policy_version 78720 (0.0008) +[2023-10-08 18:55:23,540][21194] Updated weights for policy 1, policy_version 78120 (0.0008) +[2023-10-08 18:55:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 160595968. Throughput: 0: 1742.4, 1: 1737.6. Samples: 40158686. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:55:23,803][19739] Avg episode reward: [(0, '654.910'), (1, '868.620')] +[2023-10-08 18:55:23,894][21194] Updated weights for policy 1, policy_version 78130 (0.0008) +[2023-10-08 18:55:24,261][21194] Updated weights for policy 1, policy_version 78140 (0.0010) +[2023-10-08 18:55:25,016][21195] Updated weights for policy 0, policy_version 78730 (0.0009) +[2023-10-08 18:55:25,380][21195] Updated weights for policy 0, policy_version 78740 (0.0008) +[2023-10-08 18:55:25,746][21195] Updated weights for policy 0, policy_version 78750 (0.0009) +[2023-10-08 18:55:28,173][21194] Updated weights for policy 1, policy_version 78150 (0.0009) +[2023-10-08 18:55:28,538][21194] Updated weights for policy 1, policy_version 78160 (0.0008) +[2023-10-08 18:55:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 160661504. Throughput: 0: 1745.0, 1: 1740.7. Samples: 40180560. Policy #0 lag: (min: 18.0, avg: 26.1, max: 50.0) +[2023-10-08 18:55:28,803][19739] Avg episode reward: [(0, '654.910'), (1, '868.620')] +[2023-10-08 18:55:28,903][21194] Updated weights for policy 1, policy_version 78170 (0.0008) +[2023-10-08 18:55:29,510][21195] Updated weights for policy 0, policy_version 78760 (0.0008) +[2023-10-08 18:55:29,880][21195] Updated weights for policy 0, policy_version 78770 (0.0007) +[2023-10-08 18:55:30,253][21195] Updated weights for policy 0, policy_version 78780 (0.0008) +[2023-10-08 18:55:32,846][21194] Updated weights for policy 1, policy_version 78180 (0.0008) +[2023-10-08 18:55:33,210][21194] Updated weights for policy 1, policy_version 78190 (0.0008) +[2023-10-08 18:55:33,567][21194] Updated weights for policy 1, policy_version 78200 (0.0007) +[2023-10-08 18:55:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 160727040. Throughput: 0: 1771.5, 1: 1730.4. Samples: 40196080. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:55:33,804][19739] Avg episode reward: [(0, '654.910'), (1, '883.690')] +[2023-10-08 18:55:34,290][21195] Updated weights for policy 0, policy_version 78790 (0.0008) +[2023-10-08 18:55:34,656][21195] Updated weights for policy 0, policy_version 78800 (0.0008) +[2023-10-08 18:55:35,015][21195] Updated weights for policy 0, policy_version 78810 (0.0008) +[2023-10-08 18:55:37,458][21194] Updated weights for policy 1, policy_version 78210 (0.0008) +[2023-10-08 18:55:37,818][21194] Updated weights for policy 1, policy_version 78220 (0.0009) +[2023-10-08 18:55:38,188][21194] Updated weights for policy 1, policy_version 78230 (0.0009) +[2023-10-08 18:55:38,551][21194] Updated weights for policy 1, policy_version 78240 (0.0009) +[2023-10-08 18:55:38,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 160825344. Throughput: 0: 1736.5, 1: 1746.3. Samples: 40211368. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:55:38,803][19739] Avg episode reward: [(0, '654.910'), (1, '883.690')] +[2023-10-08 18:55:39,103][21195] Updated weights for policy 0, policy_version 78820 (0.0008) +[2023-10-08 18:55:39,478][21195] Updated weights for policy 0, policy_version 78830 (0.0007) +[2023-10-08 18:55:39,839][21195] Updated weights for policy 0, policy_version 78840 (0.0008) +[2023-10-08 18:55:42,461][21194] Updated weights for policy 1, policy_version 78250 (0.0007) +[2023-10-08 18:55:42,820][21194] Updated weights for policy 1, policy_version 78260 (0.0007) +[2023-10-08 18:55:43,180][21194] Updated weights for policy 1, policy_version 78270 (0.0007) +[2023-10-08 18:55:43,803][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 160890880. Throughput: 0: 1757.5, 1: 1723.7. Samples: 40231614. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:55:43,803][19739] Avg episode reward: [(0, '654.910'), (1, '883.690')] +[2023-10-08 18:55:43,875][21195] Updated weights for policy 0, policy_version 78850 (0.0008) +[2023-10-08 18:55:44,236][21195] Updated weights for policy 0, policy_version 78860 (0.0007) +[2023-10-08 18:55:44,609][21195] Updated weights for policy 0, policy_version 78870 (0.0007) +[2023-10-08 18:55:44,985][21195] Updated weights for policy 0, policy_version 78880 (0.0007) +[2023-10-08 18:55:47,211][21194] Updated weights for policy 1, policy_version 78280 (0.0008) +[2023-10-08 18:55:47,571][21194] Updated weights for policy 1, policy_version 78290 (0.0008) +[2023-10-08 18:55:47,936][21194] Updated weights for policy 1, policy_version 78300 (0.0009) +[2023-10-08 18:55:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 160956416. Throughput: 0: 1754.0, 1: 1747.2. Samples: 40247812. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:55:48,803][19739] Avg episode reward: [(0, '654.910'), (1, '883.690')] +[2023-10-08 18:55:48,971][21195] Updated weights for policy 0, policy_version 78890 (0.0009) +[2023-10-08 18:55:49,338][21195] Updated weights for policy 0, policy_version 78900 (0.0009) +[2023-10-08 18:55:49,705][21195] Updated weights for policy 0, policy_version 78910 (0.0008) +[2023-10-08 18:55:51,946][21194] Updated weights for policy 1, policy_version 78310 (0.0009) +[2023-10-08 18:55:52,309][21194] Updated weights for policy 1, policy_version 78320 (0.0007) +[2023-10-08 18:55:52,669][21194] Updated weights for policy 1, policy_version 78330 (0.0008) +[2023-10-08 18:55:53,511][21195] Updated weights for policy 0, policy_version 78920 (0.0007) +[2023-10-08 18:55:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 161021952. Throughput: 0: 1743.6, 1: 1735.1. Samples: 40263046. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:55:53,804][19739] Avg episode reward: [(0, '654.910'), (1, '884.520')] +[2023-10-08 18:55:53,882][21195] Updated weights for policy 0, policy_version 78930 (0.0008) +[2023-10-08 18:55:54,256][21195] Updated weights for policy 0, policy_version 78940 (0.0008) +[2023-10-08 18:55:56,438][21194] Updated weights for policy 1, policy_version 78340 (0.0007) +[2023-10-08 18:55:56,801][21194] Updated weights for policy 1, policy_version 78350 (0.0007) +[2023-10-08 18:55:57,164][21194] Updated weights for policy 1, policy_version 78360 (0.0007) +[2023-10-08 18:55:58,163][21195] Updated weights for policy 0, policy_version 78950 (0.0008) +[2023-10-08 18:55:58,530][21195] Updated weights for policy 0, policy_version 78960 (0.0007) +[2023-10-08 18:55:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 161087488. Throughput: 0: 1764.5, 1: 1718.1. Samples: 40284070. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:55:58,803][19739] Avg episode reward: [(0, '654.910'), (1, '884.520')] +[2023-10-08 18:55:58,898][21195] Updated weights for policy 0, policy_version 78970 (0.0009) +[2023-10-08 18:56:01,030][21194] Updated weights for policy 1, policy_version 78370 (0.0007) +[2023-10-08 18:56:01,404][21194] Updated weights for policy 1, policy_version 78380 (0.0009) +[2023-10-08 18:56:01,775][21194] Updated weights for policy 1, policy_version 78390 (0.0010) +[2023-10-08 18:56:02,143][21194] Updated weights for policy 1, policy_version 78400 (0.0009) +[2023-10-08 18:56:02,658][21195] Updated weights for policy 0, policy_version 78980 (0.0008) +[2023-10-08 18:56:03,022][21195] Updated weights for policy 0, policy_version 78990 (0.0007) +[2023-10-08 18:56:03,384][21195] Updated weights for policy 0, policy_version 79000 (0.0011) +[2023-10-08 18:56:03,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 161185792. Throughput: 0: 1725.5, 1: 1749.4. Samples: 40299632. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:56:03,803][19739] Avg episode reward: [(0, '654.910'), (1, '884.520')] +[2023-10-08 18:56:06,056][21194] Updated weights for policy 1, policy_version 78410 (0.0007) +[2023-10-08 18:56:06,423][21194] Updated weights for policy 1, policy_version 78420 (0.0007) +[2023-10-08 18:56:06,783][21194] Updated weights for policy 1, policy_version 78430 (0.0010) +[2023-10-08 18:56:07,341][21195] Updated weights for policy 0, policy_version 79010 (0.0009) +[2023-10-08 18:56:07,711][21195] Updated weights for policy 0, policy_version 79020 (0.0008) +[2023-10-08 18:56:08,073][21195] Updated weights for policy 0, policy_version 79030 (0.0008) +[2023-10-08 18:56:08,451][21195] Updated weights for policy 0, policy_version 79040 (0.0008) +[2023-10-08 18:56:08,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 161251328. Throughput: 0: 1760.4, 1: 1719.9. Samples: 40315300. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:56:08,803][19739] Avg episode reward: [(0, '654.910'), (1, '884.520')] +[2023-10-08 18:56:10,673][21194] Updated weights for policy 1, policy_version 78440 (0.0010) +[2023-10-08 18:56:11,042][21194] Updated weights for policy 1, policy_version 78450 (0.0011) +[2023-10-08 18:56:11,405][21194] Updated weights for policy 1, policy_version 78460 (0.0007) +[2023-10-08 18:56:12,263][21195] Updated weights for policy 0, policy_version 79050 (0.0007) +[2023-10-08 18:56:12,633][21195] Updated weights for policy 0, policy_version 79060 (0.0007) +[2023-10-08 18:56:12,999][21195] Updated weights for policy 0, policy_version 79070 (0.0010) +[2023-10-08 18:56:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 161316864. Throughput: 0: 1728.3, 1: 1723.3. Samples: 40335880. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:56:13,803][19739] Avg episode reward: [(0, '654.910'), (1, '884.520')] +[2023-10-08 18:56:15,138][21194] Updated weights for policy 1, policy_version 78470 (0.0008) +[2023-10-08 18:56:15,506][21194] Updated weights for policy 1, policy_version 78480 (0.0008) +[2023-10-08 18:56:15,873][21194] Updated weights for policy 1, policy_version 78490 (0.0009) +[2023-10-08 18:56:16,996][21195] Updated weights for policy 0, policy_version 79080 (0.0008) +[2023-10-08 18:56:17,360][21195] Updated weights for policy 0, policy_version 79090 (0.0009) +[2023-10-08 18:56:17,733][21195] Updated weights for policy 0, policy_version 79100 (0.0008) +[2023-10-08 18:56:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 161382400. Throughput: 0: 1719.1, 1: 1728.1. Samples: 40351202. Policy #0 lag: (min: 31.0, avg: 37.7, max: 63.0) +[2023-10-08 18:56:18,804][19739] Avg episode reward: [(0, '654.910'), (1, '884.520')] +[2023-10-08 18:56:19,872][21194] Updated weights for policy 1, policy_version 78500 (0.0009) +[2023-10-08 18:56:20,246][21194] Updated weights for policy 1, policy_version 78510 (0.0008) +[2023-10-08 18:56:20,603][21194] Updated weights for policy 1, policy_version 78520 (0.0008) +[2023-10-08 18:56:21,619][21195] Updated weights for policy 0, policy_version 79110 (0.0008) +[2023-10-08 18:56:21,998][21195] Updated weights for policy 0, policy_version 79120 (0.0008) +[2023-10-08 18:56:22,366][21195] Updated weights for policy 0, policy_version 79130 (0.0008) +[2023-10-08 18:56:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 161447936. Throughput: 0: 1744.4, 1: 1723.2. Samples: 40367410. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:23,803][19739] Avg episode reward: [(0, '654.910'), (1, '899.600')] +[2023-10-08 18:56:24,542][21194] Updated weights for policy 1, policy_version 78530 (0.0010) +[2023-10-08 18:56:24,908][21194] Updated weights for policy 1, policy_version 78540 (0.0008) +[2023-10-08 18:56:25,275][21194] Updated weights for policy 1, policy_version 78550 (0.0011) +[2023-10-08 18:56:25,644][21194] Updated weights for policy 1, policy_version 78560 (0.0009) +[2023-10-08 18:56:26,391][21195] Updated weights for policy 0, policy_version 79140 (0.0009) +[2023-10-08 18:56:26,752][21195] Updated weights for policy 0, policy_version 79150 (0.0009) +[2023-10-08 18:56:27,128][21195] Updated weights for policy 0, policy_version 79160 (0.0008) +[2023-10-08 18:56:28,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 161513472. Throughput: 0: 1724.4, 1: 1753.1. Samples: 40388100. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:28,803][19739] Avg episode reward: [(0, '654.910'), (1, '929.230')] +[2023-10-08 18:56:29,467][21194] Updated weights for policy 1, policy_version 78570 (0.0008) +[2023-10-08 18:56:29,832][21194] Updated weights for policy 1, policy_version 78580 (0.0009) +[2023-10-08 18:56:30,191][21194] Updated weights for policy 1, policy_version 78590 (0.0008) +[2023-10-08 18:56:30,980][21195] Updated weights for policy 0, policy_version 79170 (0.0008) +[2023-10-08 18:56:31,352][21195] Updated weights for policy 0, policy_version 79180 (0.0009) +[2023-10-08 18:56:31,728][21195] Updated weights for policy 0, policy_version 79190 (0.0009) +[2023-10-08 18:56:32,095][21195] Updated weights for policy 0, policy_version 79200 (0.0008) +[2023-10-08 18:56:33,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 161579008. Throughput: 0: 1733.9, 1: 1729.2. Samples: 40403654. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:33,804][19739] Avg episode reward: [(0, '654.910'), (1, '929.230')] +[2023-10-08 18:56:34,055][21194] Updated weights for policy 1, policy_version 78600 (0.0008) +[2023-10-08 18:56:34,426][21194] Updated weights for policy 1, policy_version 78610 (0.0007) +[2023-10-08 18:56:34,790][21194] Updated weights for policy 1, policy_version 78620 (0.0008) +[2023-10-08 18:56:35,939][21195] Updated weights for policy 0, policy_version 79210 (0.0008) +[2023-10-08 18:56:36,308][21195] Updated weights for policy 0, policy_version 79220 (0.0008) +[2023-10-08 18:56:36,678][21195] Updated weights for policy 0, policy_version 79230 (0.0008) +[2023-10-08 18:56:38,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 161644544. Throughput: 0: 1730.5, 1: 1742.3. Samples: 40419324. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:38,803][19739] Avg episode reward: [(0, '654.910'), (1, '929.230')] +[2023-10-08 18:56:38,814][21194] Updated weights for policy 1, policy_version 78630 (0.0008) +[2023-10-08 18:56:39,171][21194] Updated weights for policy 1, policy_version 78640 (0.0010) +[2023-10-08 18:56:39,536][21194] Updated weights for policy 1, policy_version 78650 (0.0009) +[2023-10-08 18:56:40,434][21195] Updated weights for policy 0, policy_version 79240 (0.0009) +[2023-10-08 18:56:40,802][21195] Updated weights for policy 0, policy_version 79250 (0.0011) +[2023-10-08 18:56:41,177][21195] Updated weights for policy 0, policy_version 79260 (0.0010) +[2023-10-08 18:56:43,487][21194] Updated weights for policy 1, policy_version 78660 (0.0008) +[2023-10-08 18:56:43,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 161710080. Throughput: 0: 1728.4, 1: 1756.7. Samples: 40440902. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:43,803][19739] Avg episode reward: [(0, '654.910'), (1, '929.230')] +[2023-10-08 18:56:43,846][21194] Updated weights for policy 1, policy_version 78670 (0.0007) +[2023-10-08 18:56:44,218][21194] Updated weights for policy 1, policy_version 78680 (0.0008) +[2023-10-08 18:56:45,034][21195] Updated weights for policy 0, policy_version 79270 (0.0009) +[2023-10-08 18:56:45,401][21195] Updated weights for policy 0, policy_version 79280 (0.0008) +[2023-10-08 18:56:45,776][21195] Updated weights for policy 0, policy_version 79290 (0.0009) +[2023-10-08 18:56:48,253][21194] Updated weights for policy 1, policy_version 78690 (0.0008) +[2023-10-08 18:56:48,631][21194] Updated weights for policy 1, policy_version 78700 (0.0008) +[2023-10-08 18:56:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 161775616. Throughput: 0: 1761.1, 1: 1729.1. Samples: 40456690. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:48,803][19739] Avg episode reward: [(0, '654.910'), (1, '929.230')] +[2023-10-08 18:56:48,988][21194] Updated weights for policy 1, policy_version 78710 (0.0009) +[2023-10-08 18:56:49,350][21194] Updated weights for policy 1, policy_version 78720 (0.0007) +[2023-10-08 18:56:49,559][21195] Updated weights for policy 0, policy_version 79300 (0.0009) +[2023-10-08 18:56:49,928][21195] Updated weights for policy 0, policy_version 79310 (0.0008) +[2023-10-08 18:56:50,297][21195] Updated weights for policy 0, policy_version 79320 (0.0010) +[2023-10-08 18:56:53,503][21194] Updated weights for policy 1, policy_version 78730 (0.0007) +[2023-10-08 18:56:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 161841152. Throughput: 0: 1723.9, 1: 1751.7. Samples: 40471702. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:53,803][19739] Avg episode reward: [(0, '655.360'), (1, '943.830')] +[2023-10-08 18:56:53,878][21194] Updated weights for policy 1, policy_version 78740 (0.0007) +[2023-10-08 18:56:54,237][21194] Updated weights for policy 1, policy_version 78750 (0.0009) +[2023-10-08 18:56:54,282][21195] Updated weights for policy 0, policy_version 79330 (0.0009) +[2023-10-08 18:56:54,663][21195] Updated weights for policy 0, policy_version 79340 (0.0009) +[2023-10-08 18:56:55,039][21195] Updated weights for policy 0, policy_version 79350 (0.0008) +[2023-10-08 18:56:55,406][21195] Updated weights for policy 0, policy_version 79360 (0.0009) +[2023-10-08 18:56:57,875][21194] Updated weights for policy 1, policy_version 78760 (0.0007) +[2023-10-08 18:56:58,235][21194] Updated weights for policy 1, policy_version 78770 (0.0010) +[2023-10-08 18:56:58,602][21194] Updated weights for policy 1, policy_version 78780 (0.0011) +[2023-10-08 18:56:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 161939456. Throughput: 0: 1753.6, 1: 1737.3. Samples: 40492968. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:56:58,803][19739] Avg episode reward: [(0, '655.110'), (1, '943.700')] +[2023-10-08 18:56:59,328][21195] Updated weights for policy 0, policy_version 79370 (0.0007) +[2023-10-08 18:56:59,699][21195] Updated weights for policy 0, policy_version 79380 (0.0007) +[2023-10-08 18:57:00,059][21195] Updated weights for policy 0, policy_version 79390 (0.0008) +[2023-10-08 18:57:02,668][21194] Updated weights for policy 1, policy_version 78790 (0.0009) +[2023-10-08 18:57:03,029][21194] Updated weights for policy 1, policy_version 78800 (0.0007) +[2023-10-08 18:57:03,410][21194] Updated weights for policy 1, policy_version 78810 (0.0007) +[2023-10-08 18:57:03,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 162004992. Throughput: 0: 1768.1, 1: 1737.3. Samples: 40508946. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:57:03,803][19739] Avg episode reward: [(0, '630.990'), (1, '948.690')] +[2023-10-08 18:57:03,989][21195] Updated weights for policy 0, policy_version 79400 (0.0009) +[2023-10-08 18:57:04,358][21195] Updated weights for policy 0, policy_version 79410 (0.0007) +[2023-10-08 18:57:04,735][21195] Updated weights for policy 0, policy_version 79420 (0.0010) +[2023-10-08 18:57:07,338][21194] Updated weights for policy 1, policy_version 78820 (0.0007) +[2023-10-08 18:57:07,704][21194] Updated weights for policy 1, policy_version 78830 (0.0008) +[2023-10-08 18:57:08,077][21194] Updated weights for policy 1, policy_version 78840 (0.0008) +[2023-10-08 18:57:08,596][21195] Updated weights for policy 0, policy_version 79430 (0.0009) +[2023-10-08 18:57:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 162070528. Throughput: 0: 1745.3, 1: 1741.3. Samples: 40524306. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:57:08,803][19739] Avg episode reward: [(0, '630.990'), (1, '948.690')] +[2023-10-08 18:57:08,958][21195] Updated weights for policy 0, policy_version 79440 (0.0008) +[2023-10-08 18:57:09,325][21195] Updated weights for policy 0, policy_version 79450 (0.0008) +[2023-10-08 18:57:12,097][21194] Updated weights for policy 1, policy_version 78850 (0.0009) +[2023-10-08 18:57:12,468][21194] Updated weights for policy 1, policy_version 78860 (0.0011) +[2023-10-08 18:57:12,834][21194] Updated weights for policy 1, policy_version 78870 (0.0007) +[2023-10-08 18:57:13,147][21195] Updated weights for policy 0, policy_version 79460 (0.0007) +[2023-10-08 18:57:13,199][21194] Updated weights for policy 1, policy_version 78880 (0.0008) +[2023-10-08 18:57:13,505][21195] Updated weights for policy 0, policy_version 79470 (0.0009) +[2023-10-08 18:57:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 162136064. Throughput: 0: 1770.1, 1: 1710.7. Samples: 40544736. Policy #0 lag: (min: 11.0, avg: 11.0, max: 11.0) +[2023-10-08 18:57:13,803][19739] Avg episode reward: [(0, '629.570'), (1, '948.690')] +[2023-10-08 18:57:13,810][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000078880_80773120.pth... +[2023-10-08 18:57:13,839][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000077248_79101952.pth +[2023-10-08 18:57:13,871][21195] Updated weights for policy 0, policy_version 79480 (0.0010) +[2023-10-08 18:57:14,172][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000079488_81395712.pth... +[2023-10-08 18:57:14,212][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000077856_79724544.pth +[2023-10-08 18:57:17,066][21194] Updated weights for policy 1, policy_version 78890 (0.0008) +[2023-10-08 18:57:17,426][21194] Updated weights for policy 1, policy_version 78900 (0.0007) +[2023-10-08 18:57:17,679][21195] Updated weights for policy 0, policy_version 79490 (0.0009) +[2023-10-08 18:57:17,793][21194] Updated weights for policy 1, policy_version 78910 (0.0009) +[2023-10-08 18:57:18,044][21195] Updated weights for policy 0, policy_version 79500 (0.0008) +[2023-10-08 18:57:18,418][21195] Updated weights for policy 0, policy_version 79510 (0.0007) +[2023-10-08 18:57:18,787][21195] Updated weights for policy 0, policy_version 79520 (0.0008) +[2023-10-08 18:57:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 162234368. Throughput: 0: 1739.9, 1: 1741.7. Samples: 40560324. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:18,803][19739] Avg episode reward: [(0, '629.570'), (1, '948.530')] +[2023-10-08 18:57:21,772][21194] Updated weights for policy 1, policy_version 78920 (0.0008) +[2023-10-08 18:57:22,134][21194] Updated weights for policy 1, policy_version 78930 (0.0009) +[2023-10-08 18:57:22,499][21194] Updated weights for policy 1, policy_version 78940 (0.0009) +[2023-10-08 18:57:22,825][21195] Updated weights for policy 0, policy_version 79530 (0.0007) +[2023-10-08 18:57:23,196][21195] Updated weights for policy 0, policy_version 79540 (0.0007) +[2023-10-08 18:57:23,565][21195] Updated weights for policy 0, policy_version 79550 (0.0008) +[2023-10-08 18:57:23,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13995.8). Total num frames: 162299904. Throughput: 0: 1765.8, 1: 1721.5. Samples: 40576250. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:23,804][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:26,398][21194] Updated weights for policy 1, policy_version 78950 (0.0007) +[2023-10-08 18:57:26,765][21194] Updated weights for policy 1, policy_version 78960 (0.0007) +[2023-10-08 18:57:27,137][21194] Updated weights for policy 1, policy_version 78970 (0.0007) +[2023-10-08 18:57:27,371][21195] Updated weights for policy 0, policy_version 79560 (0.0008) +[2023-10-08 18:57:27,736][21195] Updated weights for policy 0, policy_version 79570 (0.0010) +[2023-10-08 18:57:28,112][21195] Updated weights for policy 0, policy_version 79580 (0.0008) +[2023-10-08 18:57:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 162365440. Throughput: 0: 1742.9, 1: 1705.3. Samples: 40596072. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:28,803][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:31,143][21194] Updated weights for policy 1, policy_version 78980 (0.0007) +[2023-10-08 18:57:31,516][21194] Updated weights for policy 1, policy_version 78990 (0.0008) +[2023-10-08 18:57:31,885][21194] Updated weights for policy 1, policy_version 79000 (0.0008) +[2023-10-08 18:57:32,237][21195] Updated weights for policy 0, policy_version 79590 (0.0009) +[2023-10-08 18:57:32,608][21195] Updated weights for policy 0, policy_version 79600 (0.0008) +[2023-10-08 18:57:32,975][21195] Updated weights for policy 0, policy_version 79610 (0.0008) +[2023-10-08 18:57:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 162430976. Throughput: 0: 1720.6, 1: 1735.5. Samples: 40612216. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:33,804][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:35,653][21194] Updated weights for policy 1, policy_version 79010 (0.0008) +[2023-10-08 18:57:36,022][21194] Updated weights for policy 1, policy_version 79020 (0.0007) +[2023-10-08 18:57:36,384][21194] Updated weights for policy 1, policy_version 79030 (0.0009) +[2023-10-08 18:57:36,753][21194] Updated weights for policy 1, policy_version 79040 (0.0010) +[2023-10-08 18:57:37,025][21195] Updated weights for policy 0, policy_version 79620 (0.0009) +[2023-10-08 18:57:37,398][21195] Updated weights for policy 0, policy_version 79630 (0.0010) +[2023-10-08 18:57:37,769][21195] Updated weights for policy 0, policy_version 79640 (0.0008) +[2023-10-08 18:57:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 162496512. Throughput: 0: 1749.8, 1: 1712.9. Samples: 40627526. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:38,803][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:40,869][21194] Updated weights for policy 1, policy_version 79050 (0.0009) +[2023-10-08 18:57:41,243][21194] Updated weights for policy 1, policy_version 79060 (0.0009) +[2023-10-08 18:57:41,536][21195] Updated weights for policy 0, policy_version 79650 (0.0008) +[2023-10-08 18:57:41,598][21194] Updated weights for policy 1, policy_version 79070 (0.0008) +[2023-10-08 18:57:41,897][21195] Updated weights for policy 0, policy_version 79660 (0.0010) +[2023-10-08 18:57:42,277][21195] Updated weights for policy 0, policy_version 79670 (0.0009) +[2023-10-08 18:57:42,631][21195] Updated weights for policy 0, policy_version 79680 (0.0009) +[2023-10-08 18:57:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 162562048. Throughput: 0: 1718.2, 1: 1716.6. Samples: 40647536. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:43,803][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:45,640][21194] Updated weights for policy 1, policy_version 79080 (0.0011) +[2023-10-08 18:57:46,005][21194] Updated weights for policy 1, policy_version 79090 (0.0008) +[2023-10-08 18:57:46,367][21194] Updated weights for policy 1, policy_version 79100 (0.0007) +[2023-10-08 18:57:46,555][21195] Updated weights for policy 0, policy_version 79690 (0.0009) +[2023-10-08 18:57:46,929][21195] Updated weights for policy 0, policy_version 79700 (0.0008) +[2023-10-08 18:57:47,310][21195] Updated weights for policy 0, policy_version 79710 (0.0008) +[2023-10-08 18:57:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 162627584. Throughput: 0: 1712.7, 1: 1721.9. Samples: 40663502. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:48,803][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:50,318][21194] Updated weights for policy 1, policy_version 79110 (0.0008) +[2023-10-08 18:57:50,682][21194] Updated weights for policy 1, policy_version 79120 (0.0007) +[2023-10-08 18:57:51,037][21194] Updated weights for policy 1, policy_version 79130 (0.0008) +[2023-10-08 18:57:51,273][21195] Updated weights for policy 0, policy_version 79720 (0.0009) +[2023-10-08 18:57:51,640][21195] Updated weights for policy 0, policy_version 79730 (0.0009) +[2023-10-08 18:57:52,006][21195] Updated weights for policy 0, policy_version 79740 (0.0007) +[2023-10-08 18:57:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 162693120. Throughput: 0: 1725.6, 1: 1710.7. Samples: 40678936. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:53,803][19739] Avg episode reward: [(0, '621.990'), (1, '948.530')] +[2023-10-08 18:57:55,036][21194] Updated weights for policy 1, policy_version 79140 (0.0008) +[2023-10-08 18:57:55,401][21194] Updated weights for policy 1, policy_version 79150 (0.0009) +[2023-10-08 18:57:55,772][21194] Updated weights for policy 1, policy_version 79160 (0.0013) +[2023-10-08 18:57:55,980][21195] Updated weights for policy 0, policy_version 79750 (0.0007) +[2023-10-08 18:57:56,343][21195] Updated weights for policy 0, policy_version 79760 (0.0009) +[2023-10-08 18:57:56,712][21195] Updated weights for policy 0, policy_version 79770 (0.0009) +[2023-10-08 18:57:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 162758656. Throughput: 0: 1714.6, 1: 1734.5. Samples: 40699946. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:57:58,803][19739] Avg episode reward: [(0, '621.990'), (1, '962.330')] +[2023-10-08 18:57:59,719][21194] Updated weights for policy 1, policy_version 79170 (0.0008) +[2023-10-08 18:58:00,079][21194] Updated weights for policy 1, policy_version 79180 (0.0007) +[2023-10-08 18:58:00,452][21194] Updated weights for policy 1, policy_version 79190 (0.0008) +[2023-10-08 18:58:00,544][21195] Updated weights for policy 0, policy_version 79780 (0.0007) +[2023-10-08 18:58:00,811][21194] Updated weights for policy 1, policy_version 79200 (0.0009) +[2023-10-08 18:58:00,911][21195] Updated weights for policy 0, policy_version 79790 (0.0008) +[2023-10-08 18:58:01,290][21195] Updated weights for policy 0, policy_version 79800 (0.0010) +[2023-10-08 18:58:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 162824192. Throughput: 0: 1742.5, 1: 1704.0. Samples: 40715420. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 18:58:03,804][19739] Avg episode reward: [(0, '621.990'), (1, '962.540')] +[2023-10-08 18:58:04,695][21194] Updated weights for policy 1, policy_version 79210 (0.0007) +[2023-10-08 18:58:05,069][21194] Updated weights for policy 1, policy_version 79220 (0.0007) +[2023-10-08 18:58:05,196][21195] Updated weights for policy 0, policy_version 79810 (0.0007) +[2023-10-08 18:58:05,431][21194] Updated weights for policy 1, policy_version 79230 (0.0009) +[2023-10-08 18:58:05,564][21195] Updated weights for policy 0, policy_version 79820 (0.0010) +[2023-10-08 18:58:05,945][21195] Updated weights for policy 0, policy_version 79830 (0.0009) +[2023-10-08 18:58:06,316][21195] Updated weights for policy 0, policy_version 79840 (0.0007) +[2023-10-08 18:58:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 162889728. Throughput: 0: 1714.2, 1: 1724.3. Samples: 40730982. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:08,803][19739] Avg episode reward: [(0, '622.330'), (1, '962.540')] +[2023-10-08 18:58:09,343][21194] Updated weights for policy 1, policy_version 79240 (0.0010) +[2023-10-08 18:58:09,712][21194] Updated weights for policy 1, policy_version 79250 (0.0009) +[2023-10-08 18:58:10,065][21194] Updated weights for policy 1, policy_version 79260 (0.0009) +[2023-10-08 18:58:10,286][21195] Updated weights for policy 0, policy_version 79850 (0.0008) +[2023-10-08 18:58:10,650][21195] Updated weights for policy 0, policy_version 79860 (0.0010) +[2023-10-08 18:58:11,022][21195] Updated weights for policy 0, policy_version 79870 (0.0011) +[2023-10-08 18:58:13,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 162955264. Throughput: 0: 1728.0, 1: 1735.3. Samples: 40751922. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:13,803][19739] Avg episode reward: [(0, '622.330'), (1, '947.710')] +[2023-10-08 18:58:14,177][21194] Updated weights for policy 1, policy_version 79270 (0.0009) +[2023-10-08 18:58:14,545][21194] Updated weights for policy 1, policy_version 79280 (0.0008) +[2023-10-08 18:58:14,902][21194] Updated weights for policy 1, policy_version 79290 (0.0009) +[2023-10-08 18:58:15,067][21195] Updated weights for policy 0, policy_version 79880 (0.0009) +[2023-10-08 18:58:15,437][21195] Updated weights for policy 0, policy_version 79890 (0.0008) +[2023-10-08 18:58:15,806][21195] Updated weights for policy 0, policy_version 79900 (0.0007) +[2023-10-08 18:58:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13884.7). Total num frames: 163020800. Throughput: 0: 1742.1, 1: 1701.7. Samples: 40767190. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:18,803][19739] Avg episode reward: [(0, '637.740'), (1, '947.710')] +[2023-10-08 18:58:19,002][21194] Updated weights for policy 1, policy_version 79300 (0.0008) +[2023-10-08 18:58:19,371][21194] Updated weights for policy 1, policy_version 79310 (0.0007) +[2023-10-08 18:58:19,593][21195] Updated weights for policy 0, policy_version 79910 (0.0008) +[2023-10-08 18:58:19,739][21194] Updated weights for policy 1, policy_version 79320 (0.0008) +[2023-10-08 18:58:19,958][21195] Updated weights for policy 0, policy_version 79920 (0.0008) +[2023-10-08 18:58:20,320][21195] Updated weights for policy 0, policy_version 79930 (0.0009) +[2023-10-08 18:58:23,724][21194] Updated weights for policy 1, policy_version 79330 (0.0008) +[2023-10-08 18:58:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 163086336. Throughput: 0: 1714.4, 1: 1724.8. Samples: 40782290. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:23,803][19739] Avg episode reward: [(0, '637.740'), (1, '947.710')] +[2023-10-08 18:58:24,094][21194] Updated weights for policy 1, policy_version 79340 (0.0010) +[2023-10-08 18:58:24,293][21195] Updated weights for policy 0, policy_version 79940 (0.0008) +[2023-10-08 18:58:24,457][21194] Updated weights for policy 1, policy_version 79350 (0.0008) +[2023-10-08 18:58:24,660][21195] Updated weights for policy 0, policy_version 79950 (0.0009) +[2023-10-08 18:58:24,816][21194] Updated weights for policy 1, policy_version 79360 (0.0008) +[2023-10-08 18:58:25,027][21195] Updated weights for policy 0, policy_version 79960 (0.0009) +[2023-10-08 18:58:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 163151872. Throughput: 0: 1743.8, 1: 1726.1. Samples: 40803680. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:28,803][19739] Avg episode reward: [(0, '653.210'), (1, '947.710')] +[2023-10-08 18:58:28,911][21195] Updated weights for policy 0, policy_version 79970 (0.0009) +[2023-10-08 18:58:28,944][21194] Updated weights for policy 1, policy_version 79370 (0.0009) +[2023-10-08 18:58:29,279][21195] Updated weights for policy 0, policy_version 79980 (0.0009) +[2023-10-08 18:58:29,310][21194] Updated weights for policy 1, policy_version 79380 (0.0010) +[2023-10-08 18:58:29,649][21195] Updated weights for policy 0, policy_version 79990 (0.0009) +[2023-10-08 18:58:29,685][21194] Updated weights for policy 1, policy_version 79390 (0.0008) +[2023-10-08 18:58:30,024][21195] Updated weights for policy 0, policy_version 80000 (0.0007) +[2023-10-08 18:58:33,677][21194] Updated weights for policy 1, policy_version 79400 (0.0010) +[2023-10-08 18:58:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 163217408. Throughput: 0: 1736.1, 1: 1708.2. Samples: 40818498. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:33,803][19739] Avg episode reward: [(0, '699.510'), (1, '938.430')] +[2023-10-08 18:58:33,969][21195] Updated weights for policy 0, policy_version 80010 (0.0008) +[2023-10-08 18:58:34,040][21194] Updated weights for policy 1, policy_version 79410 (0.0008) +[2023-10-08 18:58:34,334][21195] Updated weights for policy 0, policy_version 80020 (0.0007) +[2023-10-08 18:58:34,404][21194] Updated weights for policy 1, policy_version 79420 (0.0008) +[2023-10-08 18:58:34,698][21195] Updated weights for policy 0, policy_version 80030 (0.0007) +[2023-10-08 18:58:38,246][21194] Updated weights for policy 1, policy_version 79430 (0.0010) +[2023-10-08 18:58:38,607][21194] Updated weights for policy 1, policy_version 79440 (0.0009) +[2023-10-08 18:58:38,650][21195] Updated weights for policy 0, policy_version 80040 (0.0010) +[2023-10-08 18:58:38,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 163282944. Throughput: 0: 1730.1, 1: 1716.9. Samples: 40834052. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:38,804][19739] Avg episode reward: [(0, '699.510'), (1, '938.430')] +[2023-10-08 18:58:38,984][21194] Updated weights for policy 1, policy_version 79450 (0.0009) +[2023-10-08 18:58:39,020][21195] Updated weights for policy 0, policy_version 80050 (0.0008) +[2023-10-08 18:58:39,383][21195] Updated weights for policy 0, policy_version 80060 (0.0008) +[2023-10-08 18:58:42,920][21194] Updated weights for policy 1, policy_version 79460 (0.0008) +[2023-10-08 18:58:43,288][21194] Updated weights for policy 1, policy_version 79470 (0.0007) +[2023-10-08 18:58:43,505][21195] Updated weights for policy 0, policy_version 80070 (0.0008) +[2023-10-08 18:58:43,656][21194] Updated weights for policy 1, policy_version 79480 (0.0008) +[2023-10-08 18:58:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 163348480. Throughput: 0: 1735.8, 1: 1709.0. Samples: 40854962. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:43,804][19739] Avg episode reward: [(0, '699.510'), (1, '938.430')] +[2023-10-08 18:58:43,871][21195] Updated weights for policy 0, policy_version 80080 (0.0008) +[2023-10-08 18:58:44,236][21195] Updated weights for policy 0, policy_version 80090 (0.0008) +[2023-10-08 18:58:47,772][21194] Updated weights for policy 1, policy_version 79490 (0.0009) +[2023-10-08 18:58:48,038][21195] Updated weights for policy 0, policy_version 80100 (0.0008) +[2023-10-08 18:58:48,142][21194] Updated weights for policy 1, policy_version 79500 (0.0010) +[2023-10-08 18:58:48,410][21195] Updated weights for policy 0, policy_version 80110 (0.0009) +[2023-10-08 18:58:48,509][21194] Updated weights for policy 1, policy_version 79510 (0.0007) +[2023-10-08 18:58:48,771][21195] Updated weights for policy 0, policy_version 80120 (0.0007) +[2023-10-08 18:58:48,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 163414016. Throughput: 0: 1711.7, 1: 1712.9. Samples: 40869530. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:48,803][19739] Avg episode reward: [(0, '699.510'), (1, '938.430')] +[2023-10-08 18:58:48,883][21194] Updated weights for policy 1, policy_version 79520 (0.0008) +[2023-10-08 18:58:52,790][21194] Updated weights for policy 1, policy_version 79530 (0.0009) +[2023-10-08 18:58:52,859][21195] Updated weights for policy 0, policy_version 80130 (0.0008) +[2023-10-08 18:58:53,154][21194] Updated weights for policy 1, policy_version 79540 (0.0008) +[2023-10-08 18:58:53,230][21195] Updated weights for policy 0, policy_version 80140 (0.0008) +[2023-10-08 18:58:53,527][21194] Updated weights for policy 1, policy_version 79550 (0.0007) +[2023-10-08 18:58:53,588][21195] Updated weights for policy 0, policy_version 80150 (0.0008) +[2023-10-08 18:58:53,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 163512320. Throughput: 0: 1734.2, 1: 1703.6. Samples: 40885686. Policy #0 lag: (min: 17.0, avg: 28.5, max: 49.0) +[2023-10-08 18:58:53,803][19739] Avg episode reward: [(0, '699.510'), (1, '938.430')] +[2023-10-08 18:58:53,952][21195] Updated weights for policy 0, policy_version 80160 (0.0009) +[2023-10-08 18:58:57,674][21194] Updated weights for policy 1, policy_version 79560 (0.0008) +[2023-10-08 18:58:57,807][21195] Updated weights for policy 0, policy_version 80170 (0.0007) +[2023-10-08 18:58:58,033][21194] Updated weights for policy 1, policy_version 79570 (0.0008) +[2023-10-08 18:58:58,181][21195] Updated weights for policy 0, policy_version 80180 (0.0008) +[2023-10-08 18:58:58,408][21194] Updated weights for policy 1, policy_version 79580 (0.0008) +[2023-10-08 18:58:58,537][21195] Updated weights for policy 0, policy_version 80190 (0.0007) +[2023-10-08 18:58:58,802][19739] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 163610624. Throughput: 0: 1732.3, 1: 1687.1. Samples: 40905796. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:58:58,803][19739] Avg episode reward: [(0, '699.510'), (1, '938.430')] +[2023-10-08 18:59:02,369][21194] Updated weights for policy 1, policy_version 79590 (0.0008) +[2023-10-08 18:59:02,600][21195] Updated weights for policy 0, policy_version 80200 (0.0007) +[2023-10-08 18:59:02,732][21194] Updated weights for policy 1, policy_version 79600 (0.0007) +[2023-10-08 18:59:02,961][21195] Updated weights for policy 0, policy_version 80210 (0.0009) +[2023-10-08 18:59:03,097][21194] Updated weights for policy 1, policy_version 79610 (0.0007) +[2023-10-08 18:59:03,325][21195] Updated weights for policy 0, policy_version 80220 (0.0008) +[2023-10-08 18:59:03,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 163676160. Throughput: 0: 1711.0, 1: 1699.4. Samples: 40920658. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:03,803][19739] Avg episode reward: [(0, '699.510'), (1, '939.230')] +[2023-10-08 18:59:06,976][21194] Updated weights for policy 1, policy_version 79620 (0.0007) +[2023-10-08 18:59:07,072][21195] Updated weights for policy 0, policy_version 80230 (0.0008) +[2023-10-08 18:59:07,338][21194] Updated weights for policy 1, policy_version 79630 (0.0008) +[2023-10-08 18:59:07,442][21195] Updated weights for policy 0, policy_version 80240 (0.0007) +[2023-10-08 18:59:07,702][21194] Updated weights for policy 1, policy_version 79640 (0.0008) +[2023-10-08 18:59:07,806][21195] Updated weights for policy 0, policy_version 80250 (0.0010) +[2023-10-08 18:59:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 163741696. Throughput: 0: 1748.8, 1: 1699.0. Samples: 40937440. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:08,803][19739] Avg episode reward: [(0, '715.060'), (1, '939.230')] +[2023-10-08 18:59:11,791][21194] Updated weights for policy 1, policy_version 79650 (0.0008) +[2023-10-08 18:59:11,799][21195] Updated weights for policy 0, policy_version 80260 (0.0008) +[2023-10-08 18:59:12,155][21194] Updated weights for policy 1, policy_version 79660 (0.0008) +[2023-10-08 18:59:12,171][21195] Updated weights for policy 0, policy_version 80270 (0.0007) +[2023-10-08 18:59:12,526][21194] Updated weights for policy 1, policy_version 79670 (0.0008) +[2023-10-08 18:59:12,535][21195] Updated weights for policy 0, policy_version 80280 (0.0008) +[2023-10-08 18:59:12,892][21194] Updated weights for policy 1, policy_version 79680 (0.0007) +[2023-10-08 18:59:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 163807232. Throughput: 0: 1718.2, 1: 1671.8. Samples: 40956228. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:13,803][19739] Avg episode reward: [(0, '715.060'), (1, '939.230')] +[2023-10-08 18:59:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000080288_82214912.pth... +[2023-10-08 18:59:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000079680_81592320.pth... +[2023-10-08 18:59:13,844][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000078656_80543744.pth +[2023-10-08 18:59:13,855][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000078080_79953920.pth +[2023-10-08 18:59:16,476][21195] Updated weights for policy 0, policy_version 80290 (0.0008) +[2023-10-08 18:59:16,840][21195] Updated weights for policy 0, policy_version 80300 (0.0008) +[2023-10-08 18:59:17,007][21194] Updated weights for policy 1, policy_version 79690 (0.0008) +[2023-10-08 18:59:17,201][21195] Updated weights for policy 0, policy_version 80310 (0.0007) +[2023-10-08 18:59:17,376][21194] Updated weights for policy 1, policy_version 79700 (0.0007) +[2023-10-08 18:59:17,565][21195] Updated weights for policy 0, policy_version 80320 (0.0007) +[2023-10-08 18:59:17,733][21194] Updated weights for policy 1, policy_version 79710 (0.0007) +[2023-10-08 18:59:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 163872768. Throughput: 0: 1725.4, 1: 1704.3. Samples: 40972836. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:18,803][19739] Avg episode reward: [(0, '694.600'), (1, '939.230')] +[2023-10-08 18:59:21,340][21195] Updated weights for policy 0, policy_version 80330 (0.0007) +[2023-10-08 18:59:21,698][21195] Updated weights for policy 0, policy_version 80340 (0.0008) +[2023-10-08 18:59:21,867][21194] Updated weights for policy 1, policy_version 79720 (0.0007) +[2023-10-08 18:59:22,067][21195] Updated weights for policy 0, policy_version 80350 (0.0009) +[2023-10-08 18:59:22,228][21194] Updated weights for policy 1, policy_version 79730 (0.0007) +[2023-10-08 18:59:22,597][21194] Updated weights for policy 1, policy_version 79740 (0.0007) +[2023-10-08 18:59:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 163938304. Throughput: 0: 1729.3, 1: 1689.7. Samples: 40987910. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:23,803][19739] Avg episode reward: [(0, '725.440'), (1, '939.230')] +[2023-10-08 18:59:26,168][21195] Updated weights for policy 0, policy_version 80360 (0.0007) +[2023-10-08 18:59:26,541][21195] Updated weights for policy 0, policy_version 80370 (0.0009) +[2023-10-08 18:59:26,553][21194] Updated weights for policy 1, policy_version 79750 (0.0008) +[2023-10-08 18:59:26,904][21195] Updated weights for policy 0, policy_version 80380 (0.0009) +[2023-10-08 18:59:26,922][21194] Updated weights for policy 1, policy_version 79760 (0.0008) +[2023-10-08 18:59:27,290][21194] Updated weights for policy 1, policy_version 79770 (0.0010) +[2023-10-08 18:59:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 164003840. Throughput: 0: 1721.0, 1: 1678.0. Samples: 41007914. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:28,803][19739] Avg episode reward: [(0, '740.640'), (1, '939.140')] +[2023-10-08 18:59:30,691][21195] Updated weights for policy 0, policy_version 80390 (0.0011) +[2023-10-08 18:59:31,065][21195] Updated weights for policy 0, policy_version 80400 (0.0009) +[2023-10-08 18:59:31,299][21194] Updated weights for policy 1, policy_version 79780 (0.0007) +[2023-10-08 18:59:31,425][21195] Updated weights for policy 0, policy_version 80410 (0.0007) +[2023-10-08 18:59:31,673][21194] Updated weights for policy 1, policy_version 79790 (0.0009) +[2023-10-08 18:59:32,029][21194] Updated weights for policy 1, policy_version 79800 (0.0009) +[2023-10-08 18:59:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 164069376. Throughput: 0: 1752.4, 1: 1702.2. Samples: 41024986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:33,803][19739] Avg episode reward: [(0, '740.640'), (1, '939.140')] +[2023-10-08 18:59:35,050][21195] Updated weights for policy 0, policy_version 80420 (0.0008) +[2023-10-08 18:59:35,418][21195] Updated weights for policy 0, policy_version 80430 (0.0008) +[2023-10-08 18:59:35,789][21195] Updated weights for policy 0, policy_version 80440 (0.0008) +[2023-10-08 18:59:36,025][21194] Updated weights for policy 1, policy_version 79810 (0.0009) +[2023-10-08 18:59:36,394][21194] Updated weights for policy 1, policy_version 79820 (0.0007) +[2023-10-08 18:59:36,759][21194] Updated weights for policy 1, policy_version 79830 (0.0008) +[2023-10-08 18:59:37,131][21194] Updated weights for policy 1, policy_version 79840 (0.0007) +[2023-10-08 18:59:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 164134912. Throughput: 0: 1733.9, 1: 1686.0. Samples: 41039580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:38,803][19739] Avg episode reward: [(0, '740.640'), (1, '939.140')] +[2023-10-08 18:59:39,637][21195] Updated weights for policy 0, policy_version 80450 (0.0009) +[2023-10-08 18:59:40,004][21195] Updated weights for policy 0, policy_version 80460 (0.0010) +[2023-10-08 18:59:40,366][21195] Updated weights for policy 0, policy_version 80470 (0.0011) +[2023-10-08 18:59:40,729][21195] Updated weights for policy 0, policy_version 80480 (0.0010) +[2023-10-08 18:59:40,965][21194] Updated weights for policy 1, policy_version 79850 (0.0008) +[2023-10-08 18:59:41,331][21194] Updated weights for policy 1, policy_version 79860 (0.0007) +[2023-10-08 18:59:41,699][21194] Updated weights for policy 1, policy_version 79870 (0.0007) +[2023-10-08 18:59:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 164200448. Throughput: 0: 1743.2, 1: 1703.9. Samples: 41060916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:43,804][19739] Avg episode reward: [(0, '740.640'), (1, '939.140')] +[2023-10-08 18:59:44,815][21195] Updated weights for policy 0, policy_version 80490 (0.0009) +[2023-10-08 18:59:45,183][21195] Updated weights for policy 0, policy_version 80500 (0.0008) +[2023-10-08 18:59:45,545][21195] Updated weights for policy 0, policy_version 80510 (0.0009) +[2023-10-08 18:59:45,598][21194] Updated weights for policy 1, policy_version 79880 (0.0010) +[2023-10-08 18:59:45,972][21194] Updated weights for policy 1, policy_version 79890 (0.0010) +[2023-10-08 18:59:46,334][21194] Updated weights for policy 1, policy_version 79900 (0.0009) +[2023-10-08 18:59:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 164265984. Throughput: 0: 1765.3, 1: 1704.4. Samples: 41076794. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:48,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.170')] +[2023-10-08 18:59:49,423][21195] Updated weights for policy 0, policy_version 80520 (0.0009) +[2023-10-08 18:59:49,787][21195] Updated weights for policy 0, policy_version 80530 (0.0007) +[2023-10-08 18:59:50,160][21195] Updated weights for policy 0, policy_version 80540 (0.0008) +[2023-10-08 18:59:50,282][21194] Updated weights for policy 1, policy_version 79910 (0.0009) +[2023-10-08 18:59:50,654][21194] Updated weights for policy 1, policy_version 79920 (0.0007) +[2023-10-08 18:59:51,012][21194] Updated weights for policy 1, policy_version 79930 (0.0010) +[2023-10-08 18:59:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 164331520. Throughput: 0: 1727.6, 1: 1699.8. Samples: 41091674. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:53,804][19739] Avg episode reward: [(0, '740.640'), (1, '929.170')] +[2023-10-08 18:59:54,066][21195] Updated weights for policy 0, policy_version 80550 (0.0009) +[2023-10-08 18:59:54,449][21195] Updated weights for policy 0, policy_version 80560 (0.0008) +[2023-10-08 18:59:54,754][21194] Updated weights for policy 1, policy_version 79940 (0.0008) +[2023-10-08 18:59:54,820][21195] Updated weights for policy 0, policy_version 80570 (0.0007) +[2023-10-08 18:59:55,118][21194] Updated weights for policy 1, policy_version 79950 (0.0008) +[2023-10-08 18:59:55,481][21194] Updated weights for policy 1, policy_version 79960 (0.0007) +[2023-10-08 18:59:58,633][21195] Updated weights for policy 0, policy_version 80580 (0.0008) +[2023-10-08 18:59:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 164397056. Throughput: 0: 1756.8, 1: 1731.9. Samples: 41113218. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 18:59:58,804][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 18:59:59,000][21195] Updated weights for policy 0, policy_version 80590 (0.0007) +[2023-10-08 18:59:59,362][21195] Updated weights for policy 0, policy_version 80600 (0.0007) +[2023-10-08 18:59:59,466][21194] Updated weights for policy 1, policy_version 79970 (0.0009) +[2023-10-08 18:59:59,832][21194] Updated weights for policy 1, policy_version 79980 (0.0008) +[2023-10-08 19:00:00,196][21194] Updated weights for policy 1, policy_version 79990 (0.0007) +[2023-10-08 19:00:00,562][21194] Updated weights for policy 1, policy_version 80000 (0.0009) +[2023-10-08 19:00:03,373][21195] Updated weights for policy 0, policy_version 80610 (0.0007) +[2023-10-08 19:00:03,737][21195] Updated weights for policy 0, policy_version 80620 (0.0009) +[2023-10-08 19:00:03,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 164462592. Throughput: 0: 1742.4, 1: 1704.1. Samples: 41127928. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:03,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 19:00:04,104][21195] Updated weights for policy 0, policy_version 80630 (0.0009) +[2023-10-08 19:00:04,477][21195] Updated weights for policy 0, policy_version 80640 (0.0007) +[2023-10-08 19:00:04,556][21194] Updated weights for policy 1, policy_version 80010 (0.0008) +[2023-10-08 19:00:04,925][21194] Updated weights for policy 1, policy_version 80020 (0.0008) +[2023-10-08 19:00:05,299][21194] Updated weights for policy 1, policy_version 80030 (0.0007) +[2023-10-08 19:00:08,283][21195] Updated weights for policy 0, policy_version 80650 (0.0007) +[2023-10-08 19:00:08,649][21195] Updated weights for policy 0, policy_version 80660 (0.0007) +[2023-10-08 19:00:08,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 164528128. Throughput: 0: 1746.8, 1: 1718.5. Samples: 41143846. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:08,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 19:00:09,018][21195] Updated weights for policy 0, policy_version 80670 (0.0008) +[2023-10-08 19:00:09,293][21194] Updated weights for policy 1, policy_version 80040 (0.0009) +[2023-10-08 19:00:09,668][21194] Updated weights for policy 1, policy_version 80050 (0.0008) +[2023-10-08 19:00:10,040][21194] Updated weights for policy 1, policy_version 80060 (0.0007) +[2023-10-08 19:00:12,987][21195] Updated weights for policy 0, policy_version 80680 (0.0010) +[2023-10-08 19:00:13,359][21195] Updated weights for policy 0, policy_version 80690 (0.0011) +[2023-10-08 19:00:13,717][21195] Updated weights for policy 0, policy_version 80700 (0.0011) +[2023-10-08 19:00:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 164593664. Throughput: 0: 1755.0, 1: 1733.8. Samples: 41164912. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:13,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 19:00:14,030][21194] Updated weights for policy 1, policy_version 80070 (0.0008) +[2023-10-08 19:00:14,388][21194] Updated weights for policy 1, policy_version 80080 (0.0008) +[2023-10-08 19:00:14,765][21194] Updated weights for policy 1, policy_version 80090 (0.0011) +[2023-10-08 19:00:17,687][21195] Updated weights for policy 0, policy_version 80710 (0.0010) +[2023-10-08 19:00:18,047][21195] Updated weights for policy 0, policy_version 80720 (0.0009) +[2023-10-08 19:00:18,418][21195] Updated weights for policy 0, policy_version 80730 (0.0011) +[2023-10-08 19:00:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 164691968. Throughput: 0: 1719.0, 1: 1706.9. Samples: 41179152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:18,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 19:00:18,847][21194] Updated weights for policy 1, policy_version 80100 (0.0009) +[2023-10-08 19:00:19,209][21194] Updated weights for policy 1, policy_version 80110 (0.0007) +[2023-10-08 19:00:19,583][21194] Updated weights for policy 1, policy_version 80120 (0.0008) +[2023-10-08 19:00:22,182][21195] Updated weights for policy 0, policy_version 80740 (0.0010) +[2023-10-08 19:00:22,550][21195] Updated weights for policy 0, policy_version 80750 (0.0009) +[2023-10-08 19:00:22,917][21195] Updated weights for policy 0, policy_version 80760 (0.0009) +[2023-10-08 19:00:23,602][21194] Updated weights for policy 1, policy_version 80130 (0.0007) +[2023-10-08 19:00:23,803][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 164757504. Throughput: 0: 1747.8, 1: 1724.1. Samples: 41195816. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:23,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 19:00:23,961][21194] Updated weights for policy 1, policy_version 80140 (0.0009) +[2023-10-08 19:00:24,330][21194] Updated weights for policy 1, policy_version 80150 (0.0007) +[2023-10-08 19:00:24,691][21194] Updated weights for policy 1, policy_version 80160 (0.0008) +[2023-10-08 19:00:26,916][21195] Updated weights for policy 0, policy_version 80770 (0.0009) +[2023-10-08 19:00:27,277][21195] Updated weights for policy 0, policy_version 80780 (0.0007) +[2023-10-08 19:00:27,640][21195] Updated weights for policy 0, policy_version 80790 (0.0009) +[2023-10-08 19:00:28,006][21195] Updated weights for policy 0, policy_version 80800 (0.0010) +[2023-10-08 19:00:28,601][21194] Updated weights for policy 1, policy_version 80170 (0.0008) +[2023-10-08 19:00:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 164823040. Throughput: 0: 1726.1, 1: 1729.7. Samples: 41216428. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:28,803][19739] Avg episode reward: [(0, '740.640'), (1, '929.070')] +[2023-10-08 19:00:28,968][21194] Updated weights for policy 1, policy_version 80180 (0.0008) +[2023-10-08 19:00:29,333][21194] Updated weights for policy 1, policy_version 80190 (0.0008) +[2023-10-08 19:00:32,106][21195] Updated weights for policy 0, policy_version 80810 (0.0007) +[2023-10-08 19:00:32,480][21195] Updated weights for policy 0, policy_version 80820 (0.0009) +[2023-10-08 19:00:32,846][21195] Updated weights for policy 0, policy_version 80830 (0.0010) +[2023-10-08 19:00:33,398][21194] Updated weights for policy 1, policy_version 80200 (0.0009) +[2023-10-08 19:00:33,774][21194] Updated weights for policy 1, policy_version 80210 (0.0009) +[2023-10-08 19:00:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 164888576. Throughput: 0: 1718.8, 1: 1714.9. Samples: 41231310. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:33,804][19739] Avg episode reward: [(0, '744.670'), (1, '929.070')] +[2023-10-08 19:00:34,133][21194] Updated weights for policy 1, policy_version 80220 (0.0007) +[2023-10-08 19:00:36,967][21195] Updated weights for policy 0, policy_version 80840 (0.0009) +[2023-10-08 19:00:37,329][21195] Updated weights for policy 0, policy_version 80850 (0.0008) +[2023-10-08 19:00:37,702][21195] Updated weights for policy 0, policy_version 80860 (0.0007) +[2023-10-08 19:00:38,154][21194] Updated weights for policy 1, policy_version 80230 (0.0008) +[2023-10-08 19:00:38,521][21194] Updated weights for policy 1, policy_version 80240 (0.0008) +[2023-10-08 19:00:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 164954112. Throughput: 0: 1739.3, 1: 1721.5. Samples: 41247412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:00:38,803][19739] Avg episode reward: [(0, '744.670'), (1, '929.310')] +[2023-10-08 19:00:38,883][21194] Updated weights for policy 1, policy_version 80250 (0.0008) +[2023-10-08 19:00:41,537][21195] Updated weights for policy 0, policy_version 80870 (0.0007) +[2023-10-08 19:00:41,900][21195] Updated weights for policy 0, policy_version 80880 (0.0009) +[2023-10-08 19:00:42,274][21195] Updated weights for policy 0, policy_version 80890 (0.0011) +[2023-10-08 19:00:42,876][21194] Updated weights for policy 1, policy_version 80260 (0.0009) +[2023-10-08 19:00:43,243][21194] Updated weights for policy 1, policy_version 80270 (0.0011) +[2023-10-08 19:00:43,617][21194] Updated weights for policy 1, policy_version 80280 (0.0009) +[2023-10-08 19:00:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 165019648. Throughput: 0: 1707.0, 1: 1713.1. Samples: 41267124. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:00:43,803][19739] Avg episode reward: [(0, '744.670'), (1, '929.310')] +[2023-10-08 19:00:46,314][21195] Updated weights for policy 0, policy_version 80900 (0.0010) +[2023-10-08 19:00:46,682][21195] Updated weights for policy 0, policy_version 80910 (0.0007) +[2023-10-08 19:00:47,059][21195] Updated weights for policy 0, policy_version 80920 (0.0007) +[2023-10-08 19:00:47,489][21194] Updated weights for policy 1, policy_version 80290 (0.0010) +[2023-10-08 19:00:47,856][21194] Updated weights for policy 1, policy_version 80300 (0.0009) +[2023-10-08 19:00:48,217][21194] Updated weights for policy 1, policy_version 80310 (0.0008) +[2023-10-08 19:00:48,592][21194] Updated weights for policy 1, policy_version 80320 (0.0007) +[2023-10-08 19:00:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 165117952. Throughput: 0: 1720.8, 1: 1718.4. Samples: 41282694. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:00:48,803][19739] Avg episode reward: [(0, '744.670'), (1, '929.310')] +[2023-10-08 19:00:50,929][21195] Updated weights for policy 0, policy_version 80930 (0.0008) +[2023-10-08 19:00:51,304][21195] Updated weights for policy 0, policy_version 80940 (0.0009) +[2023-10-08 19:00:51,680][21195] Updated weights for policy 0, policy_version 80950 (0.0011) +[2023-10-08 19:00:52,055][21195] Updated weights for policy 0, policy_version 80960 (0.0010) +[2023-10-08 19:00:52,625][21194] Updated weights for policy 1, policy_version 80330 (0.0009) +[2023-10-08 19:00:52,989][21194] Updated weights for policy 1, policy_version 80340 (0.0009) +[2023-10-08 19:00:53,360][21194] Updated weights for policy 1, policy_version 80350 (0.0008) +[2023-10-08 19:00:53,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 165183488. Throughput: 0: 1712.0, 1: 1720.4. Samples: 41298304. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:00:53,803][19739] Avg episode reward: [(0, '744.670'), (1, '929.310')] +[2023-10-08 19:00:56,005][21195] Updated weights for policy 0, policy_version 80970 (0.0008) +[2023-10-08 19:00:56,375][21195] Updated weights for policy 0, policy_version 80980 (0.0008) +[2023-10-08 19:00:56,742][21195] Updated weights for policy 0, policy_version 80990 (0.0009) +[2023-10-08 19:00:57,298][21194] Updated weights for policy 1, policy_version 80360 (0.0008) +[2023-10-08 19:00:57,660][21194] Updated weights for policy 1, policy_version 80370 (0.0009) +[2023-10-08 19:00:58,031][21194] Updated weights for policy 1, policy_version 80380 (0.0010) +[2023-10-08 19:00:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 165249024. Throughput: 0: 1706.6, 1: 1700.8. Samples: 41318244. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:00:58,803][19739] Avg episode reward: [(0, '743.970'), (1, '929.310')] +[2023-10-08 19:01:00,845][21195] Updated weights for policy 0, policy_version 81000 (0.0009) +[2023-10-08 19:01:01,209][21195] Updated weights for policy 0, policy_version 81010 (0.0009) +[2023-10-08 19:01:01,583][21195] Updated weights for policy 0, policy_version 81020 (0.0009) +[2023-10-08 19:01:02,085][21194] Updated weights for policy 1, policy_version 80390 (0.0010) +[2023-10-08 19:01:02,448][21194] Updated weights for policy 1, policy_version 80400 (0.0010) +[2023-10-08 19:01:02,810][21194] Updated weights for policy 1, policy_version 80410 (0.0008) +[2023-10-08 19:01:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 165314560. Throughput: 0: 1734.3, 1: 1723.8. Samples: 41334768. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:03,804][19739] Avg episode reward: [(0, '743.970'), (1, '929.440')] +[2023-10-08 19:01:05,409][21195] Updated weights for policy 0, policy_version 81030 (0.0008) +[2023-10-08 19:01:05,779][21195] Updated weights for policy 0, policy_version 81040 (0.0008) +[2023-10-08 19:01:06,144][21195] Updated weights for policy 0, policy_version 81050 (0.0009) +[2023-10-08 19:01:06,670][21194] Updated weights for policy 1, policy_version 80420 (0.0009) +[2023-10-08 19:01:07,040][21194] Updated weights for policy 1, policy_version 80430 (0.0010) +[2023-10-08 19:01:07,408][21194] Updated weights for policy 1, policy_version 80440 (0.0008) +[2023-10-08 19:01:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 165380096. Throughput: 0: 1703.3, 1: 1713.3. Samples: 41349566. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:08,803][19739] Avg episode reward: [(0, '743.970'), (1, '929.430')] +[2023-10-08 19:01:09,894][21195] Updated weights for policy 0, policy_version 81060 (0.0009) +[2023-10-08 19:01:10,252][21195] Updated weights for policy 0, policy_version 81070 (0.0009) +[2023-10-08 19:01:10,616][21195] Updated weights for policy 0, policy_version 81080 (0.0010) +[2023-10-08 19:01:11,495][21194] Updated weights for policy 1, policy_version 80450 (0.0007) +[2023-10-08 19:01:11,868][21194] Updated weights for policy 1, policy_version 80460 (0.0010) +[2023-10-08 19:01:12,233][21194] Updated weights for policy 1, policy_version 80470 (0.0010) +[2023-10-08 19:01:12,594][21194] Updated weights for policy 1, policy_version 80480 (0.0009) +[2023-10-08 19:01:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 165445632. Throughput: 0: 1729.8, 1: 1690.6. Samples: 41370346. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:13,804][19739] Avg episode reward: [(0, '744.610'), (1, '944.090')] +[2023-10-08 19:01:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000080480_82411520.pth... +[2023-10-08 19:01:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000081088_83034112.pth... +[2023-10-08 19:01:13,842][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000078880_80773120.pth +[2023-10-08 19:01:13,846][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000080480_82411520.pth +[2023-10-08 19:01:13,857][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000079488_81395712.pth +[2023-10-08 19:01:13,862][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000081088_83034112.pth +[2023-10-08 19:01:14,507][21195] Updated weights for policy 0, policy_version 81090 (0.0009) +[2023-10-08 19:01:14,870][21195] Updated weights for policy 0, policy_version 81100 (0.0009) +[2023-10-08 19:01:15,239][21195] Updated weights for policy 0, policy_version 81110 (0.0011) +[2023-10-08 19:01:15,607][21195] Updated weights for policy 0, policy_version 81120 (0.0010) +[2023-10-08 19:01:16,594][21194] Updated weights for policy 1, policy_version 80490 (0.0008) +[2023-10-08 19:01:16,959][21194] Updated weights for policy 1, policy_version 80500 (0.0009) +[2023-10-08 19:01:17,318][21194] Updated weights for policy 1, policy_version 80510 (0.0007) +[2023-10-08 19:01:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 165511168. Throughput: 0: 1735.0, 1: 1724.7. Samples: 41386996. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:18,804][19739] Avg episode reward: [(0, '744.610'), (1, '944.090')] +[2023-10-08 19:01:19,650][21195] Updated weights for policy 0, policy_version 81130 (0.0009) +[2023-10-08 19:01:20,024][21195] Updated weights for policy 0, policy_version 81140 (0.0009) +[2023-10-08 19:01:20,383][21195] Updated weights for policy 0, policy_version 81150 (0.0009) +[2023-10-08 19:01:21,261][21194] Updated weights for policy 1, policy_version 80520 (0.0007) +[2023-10-08 19:01:21,619][21194] Updated weights for policy 1, policy_version 80530 (0.0009) +[2023-10-08 19:01:21,993][21194] Updated weights for policy 1, policy_version 80540 (0.0009) +[2023-10-08 19:01:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 165576704. Throughput: 0: 1710.9, 1: 1698.1. Samples: 41400816. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:23,803][19739] Avg episode reward: [(0, '760.130'), (1, '914.020')] +[2023-10-08 19:01:24,409][21195] Updated weights for policy 0, policy_version 81160 (0.0009) +[2023-10-08 19:01:24,774][21195] Updated weights for policy 0, policy_version 81170 (0.0010) +[2023-10-08 19:01:25,142][21195] Updated weights for policy 0, policy_version 81180 (0.0010) +[2023-10-08 19:01:25,972][21194] Updated weights for policy 1, policy_version 80550 (0.0008) +[2023-10-08 19:01:26,331][21194] Updated weights for policy 1, policy_version 80560 (0.0007) +[2023-10-08 19:01:26,693][21194] Updated weights for policy 1, policy_version 80570 (0.0009) +[2023-10-08 19:01:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 165642240. Throughput: 0: 1741.3, 1: 1704.5. Samples: 41422186. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:28,803][19739] Avg episode reward: [(0, '760.130'), (1, '899.210')] +[2023-10-08 19:01:29,124][21195] Updated weights for policy 0, policy_version 81190 (0.0007) +[2023-10-08 19:01:29,495][21195] Updated weights for policy 0, policy_version 81200 (0.0008) +[2023-10-08 19:01:29,856][21195] Updated weights for policy 0, policy_version 81210 (0.0008) +[2023-10-08 19:01:30,689][21194] Updated weights for policy 1, policy_version 80580 (0.0011) +[2023-10-08 19:01:31,047][21194] Updated weights for policy 1, policy_version 80590 (0.0011) +[2023-10-08 19:01:31,415][21194] Updated weights for policy 1, policy_version 80600 (0.0010) +[2023-10-08 19:01:33,650][21195] Updated weights for policy 0, policy_version 81220 (0.0008) +[2023-10-08 19:01:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 165707776. Throughput: 0: 1738.0, 1: 1717.7. Samples: 41438202. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 19:01:33,804][19739] Avg episode reward: [(0, '775.520'), (1, '899.140')] +[2023-10-08 19:01:34,019][21195] Updated weights for policy 0, policy_version 81230 (0.0009) +[2023-10-08 19:01:34,386][21195] Updated weights for policy 0, policy_version 81240 (0.0007) +[2023-10-08 19:01:35,563][21194] Updated weights for policy 1, policy_version 80610 (0.0009) +[2023-10-08 19:01:35,929][21194] Updated weights for policy 1, policy_version 80620 (0.0008) +[2023-10-08 19:01:36,293][21194] Updated weights for policy 1, policy_version 80630 (0.0008) +[2023-10-08 19:01:36,655][21194] Updated weights for policy 1, policy_version 80640 (0.0010) +[2023-10-08 19:01:38,264][21195] Updated weights for policy 0, policy_version 81250 (0.0007) +[2023-10-08 19:01:38,635][21195] Updated weights for policy 0, policy_version 81260 (0.0009) +[2023-10-08 19:01:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 165773312. Throughput: 0: 1741.6, 1: 1695.7. Samples: 41452982. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:01:38,803][19739] Avg episode reward: [(0, '775.520'), (1, '913.930')] +[2023-10-08 19:01:39,003][21195] Updated weights for policy 0, policy_version 81270 (0.0009) +[2023-10-08 19:01:39,374][21195] Updated weights for policy 0, policy_version 81280 (0.0009) +[2023-10-08 19:01:40,589][21194] Updated weights for policy 1, policy_version 80650 (0.0007) +[2023-10-08 19:01:40,954][21194] Updated weights for policy 1, policy_version 80660 (0.0008) +[2023-10-08 19:01:41,329][21194] Updated weights for policy 1, policy_version 80670 (0.0009) +[2023-10-08 19:01:43,194][21195] Updated weights for policy 0, policy_version 81290 (0.0007) +[2023-10-08 19:01:43,569][21195] Updated weights for policy 0, policy_version 81300 (0.0008) +[2023-10-08 19:01:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 165838848. Throughput: 0: 1749.4, 1: 1713.7. Samples: 41474084. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:01:43,803][19739] Avg episode reward: [(0, '775.520'), (1, '913.930')] +[2023-10-08 19:01:43,945][21195] Updated weights for policy 0, policy_version 81310 (0.0008) +[2023-10-08 19:01:45,353][21194] Updated weights for policy 1, policy_version 80680 (0.0008) +[2023-10-08 19:01:45,724][21194] Updated weights for policy 1, policy_version 80690 (0.0008) +[2023-10-08 19:01:46,091][21194] Updated weights for policy 1, policy_version 80700 (0.0008) +[2023-10-08 19:01:47,654][21195] Updated weights for policy 0, policy_version 81320 (0.0008) +[2023-10-08 19:01:48,024][21195] Updated weights for policy 0, policy_version 81330 (0.0010) +[2023-10-08 19:01:48,392][21195] Updated weights for policy 0, policy_version 81340 (0.0010) +[2023-10-08 19:01:48,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 165937152. Throughput: 0: 1725.6, 1: 1696.1. Samples: 41488744. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:01:48,803][19739] Avg episode reward: [(0, '775.520'), (1, '913.930')] +[2023-10-08 19:01:50,087][21194] Updated weights for policy 1, policy_version 80710 (0.0009) +[2023-10-08 19:01:50,450][21194] Updated weights for policy 1, policy_version 80720 (0.0007) +[2023-10-08 19:01:50,820][21194] Updated weights for policy 1, policy_version 80730 (0.0007) +[2023-10-08 19:01:52,299][21195] Updated weights for policy 0, policy_version 81350 (0.0007) +[2023-10-08 19:01:52,674][21195] Updated weights for policy 0, policy_version 81360 (0.0011) +[2023-10-08 19:01:53,038][21195] Updated weights for policy 0, policy_version 81370 (0.0009) +[2023-10-08 19:01:53,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 166002688. Throughput: 0: 1755.2, 1: 1699.0. Samples: 41505006. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:01:53,803][19739] Avg episode reward: [(0, '775.520'), (1, '913.930')] +[2023-10-08 19:01:54,802][21194] Updated weights for policy 1, policy_version 80740 (0.0010) +[2023-10-08 19:01:55,182][21194] Updated weights for policy 1, policy_version 80750 (0.0010) +[2023-10-08 19:01:55,547][21194] Updated weights for policy 1, policy_version 80760 (0.0009) +[2023-10-08 19:01:56,955][21195] Updated weights for policy 0, policy_version 81380 (0.0007) +[2023-10-08 19:01:57,331][21195] Updated weights for policy 0, policy_version 81390 (0.0010) +[2023-10-08 19:01:57,714][21195] Updated weights for policy 0, policy_version 81400 (0.0009) +[2023-10-08 19:01:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 166068224. Throughput: 0: 1726.4, 1: 1723.0. Samples: 41525568. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:01:58,803][19739] Avg episode reward: [(0, '775.520'), (1, '913.930')] +[2023-10-08 19:01:59,359][21194] Updated weights for policy 1, policy_version 80770 (0.0010) +[2023-10-08 19:01:59,723][21194] Updated weights for policy 1, policy_version 80780 (0.0008) +[2023-10-08 19:02:00,091][21194] Updated weights for policy 1, policy_version 80790 (0.0007) +[2023-10-08 19:02:00,456][21194] Updated weights for policy 1, policy_version 80800 (0.0007) +[2023-10-08 19:02:01,531][21195] Updated weights for policy 0, policy_version 81410 (0.0010) +[2023-10-08 19:02:01,888][21195] Updated weights for policy 0, policy_version 81420 (0.0007) +[2023-10-08 19:02:02,267][21195] Updated weights for policy 0, policy_version 81430 (0.0007) +[2023-10-08 19:02:02,629][21195] Updated weights for policy 0, policy_version 81440 (0.0007) +[2023-10-08 19:02:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 166133760. Throughput: 0: 1728.5, 1: 1692.1. Samples: 41540922. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:02:03,803][19739] Avg episode reward: [(0, '775.520'), (1, '899.980')] +[2023-10-08 19:02:04,388][21194] Updated weights for policy 1, policy_version 80810 (0.0008) +[2023-10-08 19:02:04,755][21194] Updated weights for policy 1, policy_version 80820 (0.0009) +[2023-10-08 19:02:05,123][21194] Updated weights for policy 1, policy_version 80830 (0.0011) +[2023-10-08 19:02:06,616][21195] Updated weights for policy 0, policy_version 81450 (0.0008) +[2023-10-08 19:02:06,983][21195] Updated weights for policy 0, policy_version 81460 (0.0008) +[2023-10-08 19:02:07,354][21195] Updated weights for policy 0, policy_version 81470 (0.0010) +[2023-10-08 19:02:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 166199296. Throughput: 0: 1750.1, 1: 1724.4. Samples: 41557166. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:02:08,803][19739] Avg episode reward: [(0, '775.520'), (1, '915.040')] +[2023-10-08 19:02:08,871][21194] Updated weights for policy 1, policy_version 80840 (0.0008) +[2023-10-08 19:02:09,240][21194] Updated weights for policy 1, policy_version 80850 (0.0007) +[2023-10-08 19:02:09,614][21194] Updated weights for policy 1, policy_version 80860 (0.0007) +[2023-10-08 19:02:11,416][21195] Updated weights for policy 0, policy_version 81480 (0.0007) +[2023-10-08 19:02:11,794][21195] Updated weights for policy 0, policy_version 81490 (0.0008) +[2023-10-08 19:02:12,159][21195] Updated weights for policy 0, policy_version 81500 (0.0008) +[2023-10-08 19:02:13,472][21194] Updated weights for policy 1, policy_version 80870 (0.0008) +[2023-10-08 19:02:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 166264832. Throughput: 0: 1727.8, 1: 1734.8. Samples: 41578002. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:02:13,803][19739] Avg episode reward: [(0, '791.130'), (1, '915.040')] +[2023-10-08 19:02:13,833][21194] Updated weights for policy 1, policy_version 80880 (0.0008) +[2023-10-08 19:02:14,191][21194] Updated weights for policy 1, policy_version 80890 (0.0008) +[2023-10-08 19:02:16,070][21195] Updated weights for policy 0, policy_version 81510 (0.0009) +[2023-10-08 19:02:16,431][21195] Updated weights for policy 0, policy_version 81520 (0.0012) +[2023-10-08 19:02:16,797][21195] Updated weights for policy 0, policy_version 81530 (0.0009) +[2023-10-08 19:02:18,189][21194] Updated weights for policy 1, policy_version 80900 (0.0007) +[2023-10-08 19:02:18,558][21194] Updated weights for policy 1, policy_version 80910 (0.0010) +[2023-10-08 19:02:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 166330368. Throughput: 0: 1733.1, 1: 1717.8. Samples: 41593492. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:02:18,803][19739] Avg episode reward: [(0, '791.130'), (1, '914.340')] +[2023-10-08 19:02:18,911][21194] Updated weights for policy 1, policy_version 80920 (0.0011) +[2023-10-08 19:02:20,790][21195] Updated weights for policy 0, policy_version 81540 (0.0009) +[2023-10-08 19:02:21,161][21195] Updated weights for policy 0, policy_version 81550 (0.0007) +[2023-10-08 19:02:21,526][21195] Updated weights for policy 0, policy_version 81560 (0.0008) +[2023-10-08 19:02:22,862][21194] Updated weights for policy 1, policy_version 80930 (0.0009) +[2023-10-08 19:02:23,227][21194] Updated weights for policy 1, policy_version 80940 (0.0008) +[2023-10-08 19:02:23,592][21194] Updated weights for policy 1, policy_version 80950 (0.0008) +[2023-10-08 19:02:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 166395904. Throughput: 0: 1728.9, 1: 1737.5. Samples: 41608972. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 19:02:23,803][19739] Avg episode reward: [(0, '806.770'), (1, '914.340')] +[2023-10-08 19:02:23,956][21194] Updated weights for policy 1, policy_version 80960 (0.0009) +[2023-10-08 19:02:25,260][21195] Updated weights for policy 0, policy_version 81570 (0.0008) +[2023-10-08 19:02:25,618][21195] Updated weights for policy 0, policy_version 81580 (0.0010) +[2023-10-08 19:02:25,984][21195] Updated weights for policy 0, policy_version 81590 (0.0008) +[2023-10-08 19:02:26,363][21195] Updated weights for policy 0, policy_version 81600 (0.0008) +[2023-10-08 19:02:28,055][21194] Updated weights for policy 1, policy_version 80970 (0.0008) +[2023-10-08 19:02:28,425][21194] Updated weights for policy 1, policy_version 80980 (0.0009) +[2023-10-08 19:02:28,796][21194] Updated weights for policy 1, policy_version 80990 (0.0008) +[2023-10-08 19:02:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 166461440. Throughput: 0: 1731.5, 1: 1733.6. Samples: 41630010. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:28,804][19739] Avg episode reward: [(0, '806.770'), (1, '914.340')] +[2023-10-08 19:02:30,241][21195] Updated weights for policy 0, policy_version 81610 (0.0009) +[2023-10-08 19:02:30,611][21195] Updated weights for policy 0, policy_version 81620 (0.0008) +[2023-10-08 19:02:30,973][21195] Updated weights for policy 0, policy_version 81630 (0.0008) +[2023-10-08 19:02:32,699][21194] Updated weights for policy 1, policy_version 81000 (0.0008) +[2023-10-08 19:02:33,071][21194] Updated weights for policy 1, policy_version 81010 (0.0008) +[2023-10-08 19:02:33,441][21194] Updated weights for policy 1, policy_version 81020 (0.0009) +[2023-10-08 19:02:33,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 166559744. Throughput: 0: 1757.6, 1: 1734.5. Samples: 41645892. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:33,803][19739] Avg episode reward: [(0, '807.340'), (1, '914.340')] +[2023-10-08 19:02:34,758][21195] Updated weights for policy 0, policy_version 81640 (0.0010) +[2023-10-08 19:02:35,131][21195] Updated weights for policy 0, policy_version 81650 (0.0009) +[2023-10-08 19:02:35,507][21195] Updated weights for policy 0, policy_version 81660 (0.0008) +[2023-10-08 19:02:37,578][21194] Updated weights for policy 1, policy_version 81030 (0.0008) +[2023-10-08 19:02:37,934][21194] Updated weights for policy 1, policy_version 81040 (0.0008) +[2023-10-08 19:02:38,297][21194] Updated weights for policy 1, policy_version 81050 (0.0008) +[2023-10-08 19:02:38,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 166625280. Throughput: 0: 1726.3, 1: 1744.3. Samples: 41661182. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:38,803][19739] Avg episode reward: [(0, '822.880'), (1, '914.340')] +[2023-10-08 19:02:39,357][21195] Updated weights for policy 0, policy_version 81670 (0.0010) +[2023-10-08 19:02:39,730][21195] Updated weights for policy 0, policy_version 81680 (0.0007) +[2023-10-08 19:02:40,104][21195] Updated weights for policy 0, policy_version 81690 (0.0007) +[2023-10-08 19:02:42,233][21194] Updated weights for policy 1, policy_version 81060 (0.0009) +[2023-10-08 19:02:42,591][21194] Updated weights for policy 1, policy_version 81070 (0.0009) +[2023-10-08 19:02:42,956][21194] Updated weights for policy 1, policy_version 81080 (0.0007) +[2023-10-08 19:02:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 166690816. Throughput: 0: 1753.1, 1: 1716.0. Samples: 41681678. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:43,803][19739] Avg episode reward: [(0, '838.170'), (1, '914.340')] +[2023-10-08 19:02:44,003][21195] Updated weights for policy 0, policy_version 81700 (0.0008) +[2023-10-08 19:02:44,365][21195] Updated weights for policy 0, policy_version 81710 (0.0007) +[2023-10-08 19:02:44,746][21195] Updated weights for policy 0, policy_version 81720 (0.0008) +[2023-10-08 19:02:46,975][21194] Updated weights for policy 1, policy_version 81090 (0.0009) +[2023-10-08 19:02:47,341][21194] Updated weights for policy 1, policy_version 81100 (0.0008) +[2023-10-08 19:02:47,701][21194] Updated weights for policy 1, policy_version 81110 (0.0010) +[2023-10-08 19:02:48,062][21194] Updated weights for policy 1, policy_version 81120 (0.0010) +[2023-10-08 19:02:48,654][21195] Updated weights for policy 0, policy_version 81730 (0.0007) +[2023-10-08 19:02:48,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 166756352. Throughput: 0: 1746.0, 1: 1738.0. Samples: 41697702. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:48,803][19739] Avg episode reward: [(0, '853.780'), (1, '914.340')] +[2023-10-08 19:02:49,026][21195] Updated weights for policy 0, policy_version 81740 (0.0007) +[2023-10-08 19:02:49,402][21195] Updated weights for policy 0, policy_version 81750 (0.0010) +[2023-10-08 19:02:49,776][21195] Updated weights for policy 0, policy_version 81760 (0.0010) +[2023-10-08 19:02:51,942][21194] Updated weights for policy 1, policy_version 81130 (0.0010) +[2023-10-08 19:02:52,307][21194] Updated weights for policy 1, policy_version 81140 (0.0010) +[2023-10-08 19:02:52,675][21194] Updated weights for policy 1, policy_version 81150 (0.0008) +[2023-10-08 19:02:53,686][21195] Updated weights for policy 0, policy_version 81770 (0.0008) +[2023-10-08 19:02:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 166821888. Throughput: 0: 1733.4, 1: 1724.6. Samples: 41712776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:53,803][19739] Avg episode reward: [(0, '853.780'), (1, '914.340')] +[2023-10-08 19:02:54,045][21195] Updated weights for policy 0, policy_version 81780 (0.0009) +[2023-10-08 19:02:54,412][21195] Updated weights for policy 0, policy_version 81790 (0.0007) +[2023-10-08 19:02:56,640][21194] Updated weights for policy 1, policy_version 81160 (0.0007) +[2023-10-08 19:02:57,007][21194] Updated weights for policy 1, policy_version 81170 (0.0010) +[2023-10-08 19:02:57,366][21194] Updated weights for policy 1, policy_version 81180 (0.0009) +[2023-10-08 19:02:58,464][21195] Updated weights for policy 0, policy_version 81800 (0.0008) +[2023-10-08 19:02:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 166887424. Throughput: 0: 1756.8, 1: 1701.9. Samples: 41733644. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:02:58,803][19739] Avg episode reward: [(0, '853.780'), (1, '914.340')] +[2023-10-08 19:02:58,825][21195] Updated weights for policy 0, policy_version 81810 (0.0009) +[2023-10-08 19:02:59,192][21195] Updated weights for policy 0, policy_version 81820 (0.0009) +[2023-10-08 19:03:01,294][21194] Updated weights for policy 1, policy_version 81190 (0.0007) +[2023-10-08 19:03:01,646][21194] Updated weights for policy 1, policy_version 81200 (0.0008) +[2023-10-08 19:03:02,018][21194] Updated weights for policy 1, policy_version 81210 (0.0009) +[2023-10-08 19:03:03,196][21195] Updated weights for policy 0, policy_version 81830 (0.0008) +[2023-10-08 19:03:03,560][21195] Updated weights for policy 0, policy_version 81840 (0.0009) +[2023-10-08 19:03:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 166952960. Throughput: 0: 1733.7, 1: 1729.6. Samples: 41749342. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:03:03,803][19739] Avg episode reward: [(0, '853.780'), (1, '914.340')] +[2023-10-08 19:03:03,927][21195] Updated weights for policy 0, policy_version 81850 (0.0009) +[2023-10-08 19:03:05,969][21194] Updated weights for policy 1, policy_version 81220 (0.0010) +[2023-10-08 19:03:06,341][21194] Updated weights for policy 1, policy_version 81230 (0.0007) +[2023-10-08 19:03:06,705][21194] Updated weights for policy 1, policy_version 81240 (0.0009) +[2023-10-08 19:03:07,798][21195] Updated weights for policy 0, policy_version 81860 (0.0010) +[2023-10-08 19:03:08,170][21195] Updated weights for policy 0, policy_version 81870 (0.0009) +[2023-10-08 19:03:08,544][21195] Updated weights for policy 0, policy_version 81880 (0.0007) +[2023-10-08 19:03:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 167018496. Throughput: 0: 1750.8, 1: 1708.0. Samples: 41764620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:03:08,803][19739] Avg episode reward: [(0, '853.780'), (1, '914.340')] +[2023-10-08 19:03:10,617][21194] Updated weights for policy 1, policy_version 81250 (0.0008) +[2023-10-08 19:03:10,987][21194] Updated weights for policy 1, policy_version 81260 (0.0007) +[2023-10-08 19:03:11,358][21194] Updated weights for policy 1, policy_version 81270 (0.0009) +[2023-10-08 19:03:11,711][21194] Updated weights for policy 1, policy_version 81280 (0.0011) +[2023-10-08 19:03:12,473][21195] Updated weights for policy 0, policy_version 81890 (0.0009) +[2023-10-08 19:03:12,839][21195] Updated weights for policy 0, policy_version 81900 (0.0008) +[2023-10-08 19:03:13,213][21195] Updated weights for policy 0, policy_version 81910 (0.0007) +[2023-10-08 19:03:13,578][21195] Updated weights for policy 0, policy_version 81920 (0.0008) +[2023-10-08 19:03:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 167116800. Throughput: 0: 1739.7, 1: 1717.5. Samples: 41785586. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:03:13,803][19739] Avg episode reward: [(0, '853.780'), (1, '929.340')] +[2023-10-08 19:03:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000081280_83230720.pth... +[2023-10-08 19:03:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000081920_83886080.pth... +[2023-10-08 19:03:13,848][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000080288_82214912.pth +[2023-10-08 19:03:13,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000079680_81592320.pth +[2023-10-08 19:03:15,852][21194] Updated weights for policy 1, policy_version 81290 (0.0008) +[2023-10-08 19:03:16,231][21194] Updated weights for policy 1, policy_version 81300 (0.0009) +[2023-10-08 19:03:16,601][21194] Updated weights for policy 1, policy_version 81310 (0.0008) +[2023-10-08 19:03:17,515][21195] Updated weights for policy 0, policy_version 81930 (0.0007) +[2023-10-08 19:03:17,886][21195] Updated weights for policy 0, policy_version 81940 (0.0007) +[2023-10-08 19:03:18,254][21195] Updated weights for policy 0, policy_version 81950 (0.0009) +[2023-10-08 19:03:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 167182336. Throughput: 0: 1716.2, 1: 1721.6. Samples: 41800590. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:18,803][19739] Avg episode reward: [(0, '854.020'), (1, '929.340')] +[2023-10-08 19:03:20,600][21194] Updated weights for policy 1, policy_version 81320 (0.0007) +[2023-10-08 19:03:20,967][21194] Updated weights for policy 1, policy_version 81330 (0.0008) +[2023-10-08 19:03:21,334][21194] Updated weights for policy 1, policy_version 81340 (0.0008) +[2023-10-08 19:03:22,268][21195] Updated weights for policy 0, policy_version 81960 (0.0008) +[2023-10-08 19:03:22,641][21195] Updated weights for policy 0, policy_version 81970 (0.0008) +[2023-10-08 19:03:23,018][21195] Updated weights for policy 0, policy_version 81980 (0.0009) +[2023-10-08 19:03:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 167247872. Throughput: 0: 1745.8, 1: 1701.6. Samples: 41816312. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:23,803][19739] Avg episode reward: [(0, '869.640'), (1, '929.340')] +[2023-10-08 19:03:24,983][21194] Updated weights for policy 1, policy_version 81350 (0.0009) +[2023-10-08 19:03:25,346][21194] Updated weights for policy 1, policy_version 81360 (0.0009) +[2023-10-08 19:03:25,710][21194] Updated weights for policy 1, policy_version 81370 (0.0010) +[2023-10-08 19:03:26,906][21195] Updated weights for policy 0, policy_version 81990 (0.0008) +[2023-10-08 19:03:27,283][21195] Updated weights for policy 0, policy_version 82000 (0.0008) +[2023-10-08 19:03:27,647][21195] Updated weights for policy 0, policy_version 82010 (0.0009) +[2023-10-08 19:03:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 167313408. Throughput: 0: 1715.4, 1: 1735.4. Samples: 41836966. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:28,803][19739] Avg episode reward: [(0, '869.640'), (1, '929.340')] +[2023-10-08 19:03:29,526][21194] Updated weights for policy 1, policy_version 81380 (0.0008) +[2023-10-08 19:03:29,894][21194] Updated weights for policy 1, policy_version 81390 (0.0007) +[2023-10-08 19:03:30,250][21194] Updated weights for policy 1, policy_version 81400 (0.0007) +[2023-10-08 19:03:31,409][21195] Updated weights for policy 0, policy_version 82020 (0.0008) +[2023-10-08 19:03:31,786][21195] Updated weights for policy 0, policy_version 82030 (0.0009) +[2023-10-08 19:03:32,154][21195] Updated weights for policy 0, policy_version 82040 (0.0008) +[2023-10-08 19:03:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 167378944. Throughput: 0: 1722.9, 1: 1711.9. Samples: 41852266. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:33,803][19739] Avg episode reward: [(0, '880.680'), (1, '929.340')] +[2023-10-08 19:03:34,222][21194] Updated weights for policy 1, policy_version 81410 (0.0008) +[2023-10-08 19:03:34,598][21194] Updated weights for policy 1, policy_version 81420 (0.0008) +[2023-10-08 19:03:34,964][21194] Updated weights for policy 1, policy_version 81430 (0.0007) +[2023-10-08 19:03:35,329][21194] Updated weights for policy 1, policy_version 81440 (0.0008) +[2023-10-08 19:03:35,977][21195] Updated weights for policy 0, policy_version 82050 (0.0009) +[2023-10-08 19:03:36,353][21195] Updated weights for policy 0, policy_version 82060 (0.0010) +[2023-10-08 19:03:36,709][21195] Updated weights for policy 0, policy_version 82070 (0.0009) +[2023-10-08 19:03:37,072][21195] Updated weights for policy 0, policy_version 82080 (0.0010) +[2023-10-08 19:03:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 167444480. Throughput: 0: 1727.3, 1: 1726.7. Samples: 41868208. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:38,803][19739] Avg episode reward: [(0, '896.920'), (1, '943.950')] +[2023-10-08 19:03:39,231][21194] Updated weights for policy 1, policy_version 81450 (0.0009) +[2023-10-08 19:03:39,604][21194] Updated weights for policy 1, policy_version 81460 (0.0009) +[2023-10-08 19:03:39,959][21194] Updated weights for policy 1, policy_version 81470 (0.0009) +[2023-10-08 19:03:41,045][21195] Updated weights for policy 0, policy_version 82090 (0.0007) +[2023-10-08 19:03:41,410][21195] Updated weights for policy 0, policy_version 82100 (0.0008) +[2023-10-08 19:03:41,782][21195] Updated weights for policy 0, policy_version 82110 (0.0009) +[2023-10-08 19:03:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 167510016. Throughput: 0: 1723.3, 1: 1734.5. Samples: 41889246. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:43,803][19739] Avg episode reward: [(0, '896.920'), (1, '943.950')] +[2023-10-08 19:03:43,986][21194] Updated weights for policy 1, policy_version 81480 (0.0009) +[2023-10-08 19:03:44,341][21194] Updated weights for policy 1, policy_version 81490 (0.0009) +[2023-10-08 19:03:44,707][21194] Updated weights for policy 1, policy_version 81500 (0.0007) +[2023-10-08 19:03:45,820][21195] Updated weights for policy 0, policy_version 82120 (0.0008) +[2023-10-08 19:03:46,182][21195] Updated weights for policy 0, policy_version 82130 (0.0009) +[2023-10-08 19:03:46,557][21195] Updated weights for policy 0, policy_version 82140 (0.0010) +[2023-10-08 19:03:48,779][21194] Updated weights for policy 1, policy_version 81510 (0.0007) +[2023-10-08 19:03:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 167575552. Throughput: 0: 1738.7, 1: 1705.6. Samples: 41904338. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:48,803][19739] Avg episode reward: [(0, '896.920'), (1, '943.950')] +[2023-10-08 19:03:49,138][21194] Updated weights for policy 1, policy_version 81520 (0.0007) +[2023-10-08 19:03:49,503][21194] Updated weights for policy 1, policy_version 81530 (0.0008) +[2023-10-08 19:03:50,538][21195] Updated weights for policy 0, policy_version 82150 (0.0008) +[2023-10-08 19:03:50,903][21195] Updated weights for policy 0, policy_version 82160 (0.0008) +[2023-10-08 19:03:51,271][21195] Updated weights for policy 0, policy_version 82170 (0.0009) +[2023-10-08 19:03:53,325][21194] Updated weights for policy 1, policy_version 81540 (0.0010) +[2023-10-08 19:03:53,693][21194] Updated weights for policy 1, policy_version 81550 (0.0007) +[2023-10-08 19:03:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 167641088. Throughput: 0: 1716.1, 1: 1730.6. Samples: 41919724. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:53,803][19739] Avg episode reward: [(0, '896.920'), (1, '943.950')] +[2023-10-08 19:03:54,049][21194] Updated weights for policy 1, policy_version 81560 (0.0008) +[2023-10-08 19:03:55,098][21195] Updated weights for policy 0, policy_version 82180 (0.0009) +[2023-10-08 19:03:55,469][21195] Updated weights for policy 0, policy_version 82190 (0.0010) +[2023-10-08 19:03:55,831][21195] Updated weights for policy 0, policy_version 82200 (0.0009) +[2023-10-08 19:03:57,979][21194] Updated weights for policy 1, policy_version 81570 (0.0009) +[2023-10-08 19:03:58,340][21194] Updated weights for policy 1, policy_version 81580 (0.0009) +[2023-10-08 19:03:58,709][21194] Updated weights for policy 1, policy_version 81590 (0.0008) +[2023-10-08 19:03:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 167706624. Throughput: 0: 1733.1, 1: 1732.3. Samples: 41941528. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:03:58,803][19739] Avg episode reward: [(0, '896.920'), (1, '943.290')] +[2023-10-08 19:03:59,073][21194] Updated weights for policy 1, policy_version 81600 (0.0011) +[2023-10-08 19:03:59,699][21195] Updated weights for policy 0, policy_version 82210 (0.0008) +[2023-10-08 19:04:00,063][21195] Updated weights for policy 0, policy_version 82220 (0.0008) +[2023-10-08 19:04:00,428][21195] Updated weights for policy 0, policy_version 82230 (0.0011) +[2023-10-08 19:04:00,795][21195] Updated weights for policy 0, policy_version 82240 (0.0009) +[2023-10-08 19:04:03,229][21194] Updated weights for policy 1, policy_version 81610 (0.0008) +[2023-10-08 19:04:03,602][21194] Updated weights for policy 1, policy_version 81620 (0.0009) +[2023-10-08 19:04:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 167772160. Throughput: 0: 1760.7, 1: 1724.6. Samples: 41957430. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:04:03,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.900')] +[2023-10-08 19:04:03,971][21194] Updated weights for policy 1, policy_version 81630 (0.0008) +[2023-10-08 19:04:04,620][21195] Updated weights for policy 0, policy_version 82250 (0.0007) +[2023-10-08 19:04:04,995][21195] Updated weights for policy 0, policy_version 82260 (0.0007) +[2023-10-08 19:04:05,357][21195] Updated weights for policy 0, policy_version 82270 (0.0009) +[2023-10-08 19:04:07,916][21194] Updated weights for policy 1, policy_version 81640 (0.0008) +[2023-10-08 19:04:08,282][21194] Updated weights for policy 1, policy_version 81650 (0.0007) +[2023-10-08 19:04:08,653][21194] Updated weights for policy 1, policy_version 81660 (0.0010) +[2023-10-08 19:04:08,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 167870464. Throughput: 0: 1734.2, 1: 1742.5. Samples: 41972766. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 19:04:08,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:09,060][21195] Updated weights for policy 0, policy_version 82280 (0.0008) +[2023-10-08 19:04:09,439][21195] Updated weights for policy 0, policy_version 82290 (0.0009) +[2023-10-08 19:04:09,816][21195] Updated weights for policy 0, policy_version 82300 (0.0008) +[2023-10-08 19:04:12,414][21194] Updated weights for policy 1, policy_version 81670 (0.0011) +[2023-10-08 19:04:12,780][21194] Updated weights for policy 1, policy_version 81680 (0.0007) +[2023-10-08 19:04:13,148][21194] Updated weights for policy 1, policy_version 81690 (0.0008) +[2023-10-08 19:04:13,779][21195] Updated weights for policy 0, policy_version 82310 (0.0008) +[2023-10-08 19:04:13,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 167936000. Throughput: 0: 1762.6, 1: 1715.3. Samples: 41993472. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:13,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:14,143][21195] Updated weights for policy 0, policy_version 82320 (0.0008) +[2023-10-08 19:04:14,515][21195] Updated weights for policy 0, policy_version 82330 (0.0011) +[2023-10-08 19:04:17,105][21194] Updated weights for policy 1, policy_version 81700 (0.0010) +[2023-10-08 19:04:17,458][21194] Updated weights for policy 1, policy_version 81710 (0.0009) +[2023-10-08 19:04:17,828][21194] Updated weights for policy 1, policy_version 81720 (0.0008) +[2023-10-08 19:04:18,289][21195] Updated weights for policy 0, policy_version 82340 (0.0008) +[2023-10-08 19:04:18,667][21195] Updated weights for policy 0, policy_version 82350 (0.0009) +[2023-10-08 19:04:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168001536. Throughput: 0: 1748.8, 1: 1737.5. Samples: 42009148. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:18,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:19,025][21195] Updated weights for policy 0, policy_version 82360 (0.0009) +[2023-10-08 19:04:21,866][21194] Updated weights for policy 1, policy_version 81730 (0.0009) +[2023-10-08 19:04:22,233][21194] Updated weights for policy 1, policy_version 81740 (0.0009) +[2023-10-08 19:04:22,599][21194] Updated weights for policy 1, policy_version 81750 (0.0009) +[2023-10-08 19:04:22,963][21194] Updated weights for policy 1, policy_version 81760 (0.0008) +[2023-10-08 19:04:23,023][21195] Updated weights for policy 0, policy_version 82370 (0.0007) +[2023-10-08 19:04:23,393][21195] Updated weights for policy 0, policy_version 82380 (0.0007) +[2023-10-08 19:04:23,761][21195] Updated weights for policy 0, policy_version 82390 (0.0009) +[2023-10-08 19:04:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168067072. Throughput: 0: 1752.2, 1: 1727.3. Samples: 42024786. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:23,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:24,121][21195] Updated weights for policy 0, policy_version 82400 (0.0008) +[2023-10-08 19:04:27,094][21194] Updated weights for policy 1, policy_version 81770 (0.0009) +[2023-10-08 19:04:27,459][21194] Updated weights for policy 1, policy_version 81780 (0.0008) +[2023-10-08 19:04:27,830][21194] Updated weights for policy 1, policy_version 81790 (0.0008) +[2023-10-08 19:04:28,095][21195] Updated weights for policy 0, policy_version 82410 (0.0010) +[2023-10-08 19:04:28,459][21195] Updated weights for policy 0, policy_version 82420 (0.0010) +[2023-10-08 19:04:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168132608. Throughput: 0: 1757.7, 1: 1705.6. Samples: 42045092. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:28,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:28,830][21195] Updated weights for policy 0, policy_version 82430 (0.0009) +[2023-10-08 19:04:31,856][21194] Updated weights for policy 1, policy_version 81800 (0.0007) +[2023-10-08 19:04:32,231][21194] Updated weights for policy 1, policy_version 81810 (0.0009) +[2023-10-08 19:04:32,592][21194] Updated weights for policy 1, policy_version 81820 (0.0009) +[2023-10-08 19:04:32,741][21195] Updated weights for policy 0, policy_version 82440 (0.0009) +[2023-10-08 19:04:33,112][21195] Updated weights for policy 0, policy_version 82450 (0.0008) +[2023-10-08 19:04:33,479][21195] Updated weights for policy 0, policy_version 82460 (0.0010) +[2023-10-08 19:04:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 168230912. Throughput: 0: 1734.0, 1: 1732.9. Samples: 42060346. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:33,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:36,491][21194] Updated weights for policy 1, policy_version 81830 (0.0009) +[2023-10-08 19:04:36,869][21194] Updated weights for policy 1, policy_version 81840 (0.0010) +[2023-10-08 19:04:37,229][21195] Updated weights for policy 0, policy_version 82470 (0.0007) +[2023-10-08 19:04:37,238][21194] Updated weights for policy 1, policy_version 81850 (0.0007) +[2023-10-08 19:04:37,601][21195] Updated weights for policy 0, policy_version 82480 (0.0007) +[2023-10-08 19:04:37,964][21195] Updated weights for policy 0, policy_version 82490 (0.0008) +[2023-10-08 19:04:38,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 168296448. Throughput: 0: 1768.8, 1: 1712.8. Samples: 42076396. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:38,803][19739] Avg episode reward: [(0, '896.920'), (1, '912.790')] +[2023-10-08 19:04:41,236][21194] Updated weights for policy 1, policy_version 81860 (0.0007) +[2023-10-08 19:04:41,606][21194] Updated weights for policy 1, policy_version 81870 (0.0008) +[2023-10-08 19:04:41,866][21195] Updated weights for policy 0, policy_version 82500 (0.0009) +[2023-10-08 19:04:41,973][21194] Updated weights for policy 1, policy_version 81880 (0.0008) +[2023-10-08 19:04:42,228][21195] Updated weights for policy 0, policy_version 82510 (0.0009) +[2023-10-08 19:04:42,597][21195] Updated weights for policy 0, policy_version 82520 (0.0008) +[2023-10-08 19:04:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 168361984. Throughput: 0: 1734.3, 1: 1701.5. Samples: 42096138. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:43,804][19739] Avg episode reward: [(0, '896.920'), (1, '913.100')] +[2023-10-08 19:04:45,847][21194] Updated weights for policy 1, policy_version 81890 (0.0008) +[2023-10-08 19:04:46,225][21194] Updated weights for policy 1, policy_version 81900 (0.0007) +[2023-10-08 19:04:46,582][21195] Updated weights for policy 0, policy_version 82530 (0.0010) +[2023-10-08 19:04:46,587][21194] Updated weights for policy 1, policy_version 81910 (0.0007) +[2023-10-08 19:04:46,952][21194] Updated weights for policy 1, policy_version 81920 (0.0007) +[2023-10-08 19:04:46,953][21195] Updated weights for policy 0, policy_version 82540 (0.0009) +[2023-10-08 19:04:47,326][21195] Updated weights for policy 0, policy_version 82550 (0.0008) +[2023-10-08 19:04:47,687][21195] Updated weights for policy 0, policy_version 82560 (0.0009) +[2023-10-08 19:04:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 168427520. Throughput: 0: 1722.0, 1: 1722.9. Samples: 42112452. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:48,803][19739] Avg episode reward: [(0, '896.920'), (1, '928.200')] +[2023-10-08 19:04:50,753][21194] Updated weights for policy 1, policy_version 81930 (0.0008) +[2023-10-08 19:04:51,105][21194] Updated weights for policy 1, policy_version 81940 (0.0010) +[2023-10-08 19:04:51,469][21194] Updated weights for policy 1, policy_version 81950 (0.0008) +[2023-10-08 19:04:51,646][21195] Updated weights for policy 0, policy_version 82570 (0.0007) +[2023-10-08 19:04:52,016][21195] Updated weights for policy 0, policy_version 82580 (0.0007) +[2023-10-08 19:04:52,379][21195] Updated weights for policy 0, policy_version 82590 (0.0007) +[2023-10-08 19:04:53,802][19739] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 168493056. Throughput: 0: 1737.2, 1: 1704.6. Samples: 42127648. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:53,803][19739] Avg episode reward: [(0, '896.920'), (1, '915.310')] +[2023-10-08 19:04:55,423][21194] Updated weights for policy 1, policy_version 81960 (0.0010) +[2023-10-08 19:04:55,793][21194] Updated weights for policy 1, policy_version 81970 (0.0011) +[2023-10-08 19:04:56,089][21195] Updated weights for policy 0, policy_version 82600 (0.0008) +[2023-10-08 19:04:56,157][21194] Updated weights for policy 1, policy_version 81980 (0.0009) +[2023-10-08 19:04:56,449][21195] Updated weights for policy 0, policy_version 82610 (0.0008) +[2023-10-08 19:04:56,818][21195] Updated weights for policy 0, policy_version 82620 (0.0009) +[2023-10-08 19:04:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 168558592. Throughput: 0: 1719.4, 1: 1724.7. Samples: 42148458. Policy #0 lag: (min: 6.0, avg: 12.7, max: 38.0) +[2023-10-08 19:04:58,803][19739] Avg episode reward: [(0, '896.920'), (1, '915.310')] +[2023-10-08 19:05:00,128][21194] Updated weights for policy 1, policy_version 81990 (0.0007) +[2023-10-08 19:05:00,501][21194] Updated weights for policy 1, policy_version 82000 (0.0009) +[2023-10-08 19:05:00,777][21195] Updated weights for policy 0, policy_version 82630 (0.0008) +[2023-10-08 19:05:00,861][21194] Updated weights for policy 1, policy_version 82010 (0.0008) +[2023-10-08 19:05:01,149][21195] Updated weights for policy 0, policy_version 82640 (0.0008) +[2023-10-08 19:05:01,522][21195] Updated weights for policy 0, policy_version 82650 (0.0009) +[2023-10-08 19:05:03,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 168624128. Throughput: 0: 1735.7, 1: 1704.8. Samples: 42163970. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:03,804][19739] Avg episode reward: [(0, '896.920'), (1, '915.310')] +[2023-10-08 19:05:04,808][21194] Updated weights for policy 1, policy_version 82020 (0.0007) +[2023-10-08 19:05:05,179][21194] Updated weights for policy 1, policy_version 82030 (0.0007) +[2023-10-08 19:05:05,475][21195] Updated weights for policy 0, policy_version 82660 (0.0008) +[2023-10-08 19:05:05,549][21194] Updated weights for policy 1, policy_version 82040 (0.0008) +[2023-10-08 19:05:05,846][21195] Updated weights for policy 0, policy_version 82670 (0.0008) +[2023-10-08 19:05:06,209][21195] Updated weights for policy 0, policy_version 82680 (0.0007) +[2023-10-08 19:05:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 168689664. Throughput: 0: 1719.9, 1: 1708.0. Samples: 42179042. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:08,803][19739] Avg episode reward: [(0, '912.140'), (1, '915.900')] +[2023-10-08 19:05:09,618][21194] Updated weights for policy 1, policy_version 82050 (0.0007) +[2023-10-08 19:05:09,974][21195] Updated weights for policy 0, policy_version 82690 (0.0007) +[2023-10-08 19:05:09,978][21194] Updated weights for policy 1, policy_version 82060 (0.0008) +[2023-10-08 19:05:10,338][21195] Updated weights for policy 0, policy_version 82700 (0.0008) +[2023-10-08 19:05:10,352][21194] Updated weights for policy 1, policy_version 82070 (0.0008) +[2023-10-08 19:05:10,697][21195] Updated weights for policy 0, policy_version 82710 (0.0008) +[2023-10-08 19:05:10,720][21194] Updated weights for policy 1, policy_version 82080 (0.0008) +[2023-10-08 19:05:11,065][21195] Updated weights for policy 0, policy_version 82720 (0.0009) +[2023-10-08 19:05:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168755200. Throughput: 0: 1721.6, 1: 1729.7. Samples: 42200402. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:13,804][19739] Avg episode reward: [(0, '912.140'), (1, '930.490')] +[2023-10-08 19:05:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000082720_84705280.pth... +[2023-10-08 19:05:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000082080_84049920.pth... +[2023-10-08 19:05:13,849][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000080480_82411520.pth +[2023-10-08 19:05:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000081088_83034112.pth +[2023-10-08 19:05:14,691][21194] Updated weights for policy 1, policy_version 82090 (0.0010) +[2023-10-08 19:05:15,053][21194] Updated weights for policy 1, policy_version 82100 (0.0008) +[2023-10-08 19:05:15,224][21195] Updated weights for policy 0, policy_version 82730 (0.0008) +[2023-10-08 19:05:15,411][21194] Updated weights for policy 1, policy_version 82110 (0.0008) +[2023-10-08 19:05:15,584][21195] Updated weights for policy 0, policy_version 82740 (0.0009) +[2023-10-08 19:05:15,943][21195] Updated weights for policy 0, policy_version 82750 (0.0007) +[2023-10-08 19:05:18,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168820736. Throughput: 0: 1752.7, 1: 1703.6. Samples: 42215882. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:18,804][19739] Avg episode reward: [(0, '912.140'), (1, '930.490')] +[2023-10-08 19:05:19,461][21194] Updated weights for policy 1, policy_version 82120 (0.0007) +[2023-10-08 19:05:19,818][21195] Updated weights for policy 0, policy_version 82760 (0.0007) +[2023-10-08 19:05:19,832][21194] Updated weights for policy 1, policy_version 82130 (0.0009) +[2023-10-08 19:05:20,184][21195] Updated weights for policy 0, policy_version 82770 (0.0009) +[2023-10-08 19:05:20,193][21194] Updated weights for policy 1, policy_version 82140 (0.0007) +[2023-10-08 19:05:20,548][21195] Updated weights for policy 0, policy_version 82780 (0.0007) +[2023-10-08 19:05:23,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168886272. Throughput: 0: 1717.7, 1: 1720.0. Samples: 42231094. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:23,803][19739] Avg episode reward: [(0, '912.180'), (1, '929.570')] +[2023-10-08 19:05:24,270][21194] Updated weights for policy 1, policy_version 82150 (0.0009) +[2023-10-08 19:05:24,553][21195] Updated weights for policy 0, policy_version 82790 (0.0010) +[2023-10-08 19:05:24,631][21194] Updated weights for policy 1, policy_version 82160 (0.0009) +[2023-10-08 19:05:24,949][21195] Updated weights for policy 0, policy_version 82800 (0.0009) +[2023-10-08 19:05:24,997][21194] Updated weights for policy 1, policy_version 82170 (0.0008) +[2023-10-08 19:05:25,306][21195] Updated weights for policy 0, policy_version 82810 (0.0007) +[2023-10-08 19:05:28,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 168951808. Throughput: 0: 1747.1, 1: 1725.7. Samples: 42252410. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:28,803][19739] Avg episode reward: [(0, '912.180'), (1, '929.430')] +[2023-10-08 19:05:28,925][21194] Updated weights for policy 1, policy_version 82180 (0.0009) +[2023-10-08 19:05:29,300][21194] Updated weights for policy 1, policy_version 82190 (0.0008) +[2023-10-08 19:05:29,371][21195] Updated weights for policy 0, policy_version 82820 (0.0009) +[2023-10-08 19:05:29,652][21194] Updated weights for policy 1, policy_version 82200 (0.0008) +[2023-10-08 19:05:29,741][21195] Updated weights for policy 0, policy_version 82830 (0.0007) +[2023-10-08 19:05:30,103][21195] Updated weights for policy 0, policy_version 82840 (0.0009) +[2023-10-08 19:05:33,762][21194] Updated weights for policy 1, policy_version 82210 (0.0010) +[2023-10-08 19:05:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 169017344. Throughput: 0: 1748.1, 1: 1700.9. Samples: 42267656. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:33,803][19739] Avg episode reward: [(0, '912.110'), (1, '929.430')] +[2023-10-08 19:05:34,052][21195] Updated weights for policy 0, policy_version 82850 (0.0007) +[2023-10-08 19:05:34,124][21194] Updated weights for policy 1, policy_version 82220 (0.0007) +[2023-10-08 19:05:34,417][21195] Updated weights for policy 0, policy_version 82860 (0.0007) +[2023-10-08 19:05:34,492][21194] Updated weights for policy 1, policy_version 82230 (0.0007) +[2023-10-08 19:05:34,784][21195] Updated weights for policy 0, policy_version 82870 (0.0007) +[2023-10-08 19:05:34,850][21194] Updated weights for policy 1, policy_version 82240 (0.0010) +[2023-10-08 19:05:35,153][21195] Updated weights for policy 0, policy_version 82880 (0.0008) +[2023-10-08 19:05:38,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 169082880. Throughput: 0: 1729.5, 1: 1718.0. Samples: 42282786. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:38,803][19739] Avg episode reward: [(0, '912.240'), (1, '941.380')] +[2023-10-08 19:05:38,916][21194] Updated weights for policy 1, policy_version 82250 (0.0009) +[2023-10-08 19:05:39,092][21195] Updated weights for policy 0, policy_version 82890 (0.0008) +[2023-10-08 19:05:39,286][21194] Updated weights for policy 1, policy_version 82260 (0.0008) +[2023-10-08 19:05:39,461][21195] Updated weights for policy 0, policy_version 82900 (0.0009) +[2023-10-08 19:05:39,656][21194] Updated weights for policy 1, policy_version 82270 (0.0009) +[2023-10-08 19:05:39,833][21195] Updated weights for policy 0, policy_version 82910 (0.0009) +[2023-10-08 19:05:43,647][21194] Updated weights for policy 1, policy_version 82280 (0.0008) +[2023-10-08 19:05:43,677][21195] Updated weights for policy 0, policy_version 82920 (0.0010) +[2023-10-08 19:05:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.3, 300 sec: 13662.6). Total num frames: 169148416. Throughput: 0: 1747.5, 1: 1708.0. Samples: 42303952. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:43,803][19739] Avg episode reward: [(0, '912.240'), (1, '941.380')] +[2023-10-08 19:05:44,013][21194] Updated weights for policy 1, policy_version 82290 (0.0008) +[2023-10-08 19:05:44,041][21195] Updated weights for policy 0, policy_version 82930 (0.0008) +[2023-10-08 19:05:44,373][21194] Updated weights for policy 1, policy_version 82300 (0.0009) +[2023-10-08 19:05:44,416][21195] Updated weights for policy 0, policy_version 82940 (0.0008) +[2023-10-08 19:05:48,242][21194] Updated weights for policy 1, policy_version 82310 (0.0008) +[2023-10-08 19:05:48,310][21195] Updated weights for policy 0, policy_version 82950 (0.0007) +[2023-10-08 19:05:48,604][21194] Updated weights for policy 1, policy_version 82320 (0.0008) +[2023-10-08 19:05:48,673][21195] Updated weights for policy 0, policy_version 82960 (0.0007) +[2023-10-08 19:05:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 169213952. Throughput: 0: 1727.9, 1: 1709.5. Samples: 42318654. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:48,803][19739] Avg episode reward: [(0, '912.240'), (1, '956.720')] +[2023-10-08 19:05:48,970][21194] Updated weights for policy 1, policy_version 82330 (0.0007) +[2023-10-08 19:05:49,052][21195] Updated weights for policy 0, policy_version 82970 (0.0009) +[2023-10-08 19:05:52,988][21195] Updated weights for policy 0, policy_version 82980 (0.0009) +[2023-10-08 19:05:53,048][21194] Updated weights for policy 1, policy_version 82340 (0.0007) +[2023-10-08 19:05:53,363][21195] Updated weights for policy 0, policy_version 82990 (0.0008) +[2023-10-08 19:05:53,406][21194] Updated weights for policy 1, policy_version 82350 (0.0007) +[2023-10-08 19:05:53,719][21195] Updated weights for policy 0, policy_version 83000 (0.0008) +[2023-10-08 19:05:53,769][21194] Updated weights for policy 1, policy_version 82360 (0.0008) +[2023-10-08 19:05:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 169279488. Throughput: 0: 1747.9, 1: 1713.3. Samples: 42334798. Policy #0 lag: (min: 20.0, avg: 24.0, max: 52.0) +[2023-10-08 19:05:53,803][19739] Avg episode reward: [(0, '912.240'), (1, '967.680')] +[2023-10-08 19:05:57,566][21194] Updated weights for policy 1, policy_version 82370 (0.0008) +[2023-10-08 19:05:57,585][21195] Updated weights for policy 0, policy_version 83010 (0.0009) +[2023-10-08 19:05:57,928][21194] Updated weights for policy 1, policy_version 82380 (0.0008) +[2023-10-08 19:05:57,945][21195] Updated weights for policy 0, policy_version 83020 (0.0007) +[2023-10-08 19:05:58,290][21194] Updated weights for policy 1, policy_version 82390 (0.0007) +[2023-10-08 19:05:58,307][21195] Updated weights for policy 0, policy_version 83030 (0.0007) +[2023-10-08 19:05:58,663][21194] Updated weights for policy 1, policy_version 82400 (0.0007) +[2023-10-08 19:05:58,672][21195] Updated weights for policy 0, policy_version 83040 (0.0007) +[2023-10-08 19:05:58,803][19739] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 169410560. Throughput: 0: 1735.9, 1: 1708.1. Samples: 42355384. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:05:58,803][19739] Avg episode reward: [(0, '912.240'), (1, '967.680')] +[2023-10-08 19:06:02,581][21195] Updated weights for policy 0, policy_version 83050 (0.0007) +[2023-10-08 19:06:02,807][21194] Updated weights for policy 1, policy_version 82410 (0.0007) +[2023-10-08 19:06:02,947][21195] Updated weights for policy 0, policy_version 83060 (0.0009) +[2023-10-08 19:06:03,182][21194] Updated weights for policy 1, policy_version 82420 (0.0008) +[2023-10-08 19:06:03,309][21195] Updated weights for policy 0, policy_version 83070 (0.0007) +[2023-10-08 19:06:03,539][21194] Updated weights for policy 1, policy_version 82430 (0.0007) +[2023-10-08 19:06:03,803][19739] Fps is (10 sec: 19660.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 169476096. Throughput: 0: 1712.4, 1: 1712.6. Samples: 42370006. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:03,803][19739] Avg episode reward: [(0, '912.240'), (1, '952.750')] +[2023-10-08 19:06:07,298][21195] Updated weights for policy 0, policy_version 83080 (0.0008) +[2023-10-08 19:06:07,458][21194] Updated weights for policy 1, policy_version 82440 (0.0008) +[2023-10-08 19:06:07,662][21195] Updated weights for policy 0, policy_version 83090 (0.0008) +[2023-10-08 19:06:07,819][21194] Updated weights for policy 1, policy_version 82450 (0.0008) +[2023-10-08 19:06:08,030][21195] Updated weights for policy 0, policy_version 83100 (0.0007) +[2023-10-08 19:06:08,191][21194] Updated weights for policy 1, policy_version 82460 (0.0008) +[2023-10-08 19:06:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 169541632. Throughput: 0: 1743.4, 1: 1718.0. Samples: 42386854. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:08,803][19739] Avg episode reward: [(0, '912.240'), (1, '952.750')] +[2023-10-08 19:06:11,947][21195] Updated weights for policy 0, policy_version 83110 (0.0009) +[2023-10-08 19:06:12,211][21194] Updated weights for policy 1, policy_version 82470 (0.0010) +[2023-10-08 19:06:12,327][21195] Updated weights for policy 0, policy_version 83120 (0.0008) +[2023-10-08 19:06:12,572][21194] Updated weights for policy 1, policy_version 82480 (0.0010) +[2023-10-08 19:06:12,689][21195] Updated weights for policy 0, policy_version 83130 (0.0009) +[2023-10-08 19:06:12,941][21194] Updated weights for policy 1, policy_version 82490 (0.0007) +[2023-10-08 19:06:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 169607168. Throughput: 0: 1715.2, 1: 1695.0. Samples: 42405870. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:13,803][19739] Avg episode reward: [(0, '912.240'), (1, '952.750')] +[2023-10-08 19:06:16,742][21195] Updated weights for policy 0, policy_version 83140 (0.0008) +[2023-10-08 19:06:16,834][21194] Updated weights for policy 1, policy_version 82500 (0.0007) +[2023-10-08 19:06:17,103][21195] Updated weights for policy 0, policy_version 83150 (0.0009) +[2023-10-08 19:06:17,205][21194] Updated weights for policy 1, policy_version 82510 (0.0008) +[2023-10-08 19:06:17,469][21195] Updated weights for policy 0, policy_version 83160 (0.0007) +[2023-10-08 19:06:17,569][21194] Updated weights for policy 1, policy_version 82520 (0.0008) +[2023-10-08 19:06:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 169672704. Throughput: 0: 1711.1, 1: 1719.1. Samples: 42422014. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:18,803][19739] Avg episode reward: [(0, '912.380'), (1, '963.740')] +[2023-10-08 19:06:21,390][21195] Updated weights for policy 0, policy_version 83170 (0.0009) +[2023-10-08 19:06:21,405][21194] Updated weights for policy 1, policy_version 82530 (0.0009) +[2023-10-08 19:06:21,757][21195] Updated weights for policy 0, policy_version 83180 (0.0007) +[2023-10-08 19:06:21,773][21194] Updated weights for policy 1, policy_version 82540 (0.0009) +[2023-10-08 19:06:22,115][21195] Updated weights for policy 0, policy_version 83190 (0.0007) +[2023-10-08 19:06:22,140][21194] Updated weights for policy 1, policy_version 82550 (0.0007) +[2023-10-08 19:06:22,478][21195] Updated weights for policy 0, policy_version 83200 (0.0007) +[2023-10-08 19:06:22,510][21194] Updated weights for policy 1, policy_version 82560 (0.0008) +[2023-10-08 19:06:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 169738240. Throughput: 0: 1726.4, 1: 1709.0. Samples: 42437380. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:23,803][19739] Avg episode reward: [(0, '912.380'), (1, '963.740')] +[2023-10-08 19:06:26,551][21195] Updated weights for policy 0, policy_version 83210 (0.0007) +[2023-10-08 19:06:26,604][21194] Updated weights for policy 1, policy_version 82570 (0.0007) +[2023-10-08 19:06:26,914][21195] Updated weights for policy 0, policy_version 83220 (0.0007) +[2023-10-08 19:06:26,968][21194] Updated weights for policy 1, policy_version 82580 (0.0007) +[2023-10-08 19:06:27,284][21195] Updated weights for policy 0, policy_version 83230 (0.0007) +[2023-10-08 19:06:27,326][21194] Updated weights for policy 1, policy_version 82590 (0.0008) +[2023-10-08 19:06:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 169803776. Throughput: 0: 1713.5, 1: 1695.0. Samples: 42457336. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:28,803][19739] Avg episode reward: [(0, '926.930'), (1, '963.740')] +[2023-10-08 19:06:31,058][21195] Updated weights for policy 0, policy_version 83240 (0.0010) +[2023-10-08 19:06:31,304][21194] Updated weights for policy 1, policy_version 82600 (0.0008) +[2023-10-08 19:06:31,423][21195] Updated weights for policy 0, policy_version 83250 (0.0009) +[2023-10-08 19:06:31,666][21194] Updated weights for policy 1, policy_version 82610 (0.0007) +[2023-10-08 19:06:31,791][21195] Updated weights for policy 0, policy_version 83260 (0.0010) +[2023-10-08 19:06:32,028][21194] Updated weights for policy 1, policy_version 82620 (0.0009) +[2023-10-08 19:06:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 169869312. Throughput: 0: 1729.0, 1: 1721.2. Samples: 42473910. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:33,803][19739] Avg episode reward: [(0, '926.930'), (1, '979.010')] +[2023-10-08 19:06:35,766][21195] Updated weights for policy 0, policy_version 83270 (0.0009) +[2023-10-08 19:06:36,086][21194] Updated weights for policy 1, policy_version 82630 (0.0007) +[2023-10-08 19:06:36,132][21195] Updated weights for policy 0, policy_version 83280 (0.0008) +[2023-10-08 19:06:36,452][21194] Updated weights for policy 1, policy_version 82640 (0.0007) +[2023-10-08 19:06:36,499][21195] Updated weights for policy 0, policy_version 83290 (0.0007) +[2023-10-08 19:06:36,817][21194] Updated weights for policy 1, policy_version 82650 (0.0009) +[2023-10-08 19:06:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 169934848. Throughput: 0: 1710.1, 1: 1690.7. Samples: 42487834. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:38,803][19739] Avg episode reward: [(0, '926.930'), (1, '979.010')] +[2023-10-08 19:06:40,338][21195] Updated weights for policy 0, policy_version 83300 (0.0009) +[2023-10-08 19:06:40,703][21195] Updated weights for policy 0, policy_version 83310 (0.0008) +[2023-10-08 19:06:40,922][21194] Updated weights for policy 1, policy_version 82660 (0.0010) +[2023-10-08 19:06:41,064][21195] Updated weights for policy 0, policy_version 83320 (0.0008) +[2023-10-08 19:06:41,291][21194] Updated weights for policy 1, policy_version 82670 (0.0007) +[2023-10-08 19:06:41,659][21194] Updated weights for policy 1, policy_version 82680 (0.0008) +[2023-10-08 19:06:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 170000384. Throughput: 0: 1724.3, 1: 1700.4. Samples: 42509496. Policy #0 lag: (min: 28.0, avg: 30.0, max: 60.0) +[2023-10-08 19:06:43,803][19739] Avg episode reward: [(0, '957.750'), (1, '979.010')] +[2023-10-08 19:06:44,863][21195] Updated weights for policy 0, policy_version 83330 (0.0008) +[2023-10-08 19:06:45,238][21195] Updated weights for policy 0, policy_version 83340 (0.0008) +[2023-10-08 19:06:45,483][21194] Updated weights for policy 1, policy_version 82690 (0.0008) +[2023-10-08 19:06:45,603][21195] Updated weights for policy 0, policy_version 83350 (0.0009) +[2023-10-08 19:06:45,846][21194] Updated weights for policy 1, policy_version 82700 (0.0009) +[2023-10-08 19:06:45,968][21195] Updated weights for policy 0, policy_version 83360 (0.0008) +[2023-10-08 19:06:46,208][21194] Updated weights for policy 1, policy_version 82710 (0.0010) +[2023-10-08 19:06:46,575][21194] Updated weights for policy 1, policy_version 82720 (0.0008) +[2023-10-08 19:06:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 170065920. Throughput: 0: 1749.7, 1: 1711.8. Samples: 42525776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:06:48,803][19739] Avg episode reward: [(0, '957.750'), (1, '979.010')] +[2023-10-08 19:06:49,973][21195] Updated weights for policy 0, policy_version 83370 (0.0007) +[2023-10-08 19:06:50,342][21195] Updated weights for policy 0, policy_version 83380 (0.0008) +[2023-10-08 19:06:50,538][21194] Updated weights for policy 1, policy_version 82730 (0.0011) +[2023-10-08 19:06:50,701][21195] Updated weights for policy 0, policy_version 83390 (0.0008) +[2023-10-08 19:06:50,899][21194] Updated weights for policy 1, policy_version 82740 (0.0009) +[2023-10-08 19:06:51,259][21194] Updated weights for policy 1, policy_version 82750 (0.0007) +[2023-10-08 19:06:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 170131456. Throughput: 0: 1719.4, 1: 1692.7. Samples: 42540398. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:06:53,803][19739] Avg episode reward: [(0, '957.750'), (1, '979.010')] +[2023-10-08 19:06:54,701][21195] Updated weights for policy 0, policy_version 83400 (0.0007) +[2023-10-08 19:06:55,059][21195] Updated weights for policy 0, policy_version 83410 (0.0007) +[2023-10-08 19:06:55,132][21194] Updated weights for policy 1, policy_version 82760 (0.0008) +[2023-10-08 19:06:55,419][21195] Updated weights for policy 0, policy_version 83420 (0.0011) +[2023-10-08 19:06:55,499][21194] Updated weights for policy 1, policy_version 82770 (0.0009) +[2023-10-08 19:06:55,857][21194] Updated weights for policy 1, policy_version 82780 (0.0008) +[2023-10-08 19:06:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 170196992. Throughput: 0: 1745.3, 1: 1722.7. Samples: 42561930. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:06:58,803][19739] Avg episode reward: [(0, '974.710'), (1, '979.010')] +[2023-10-08 19:06:59,343][21195] Updated weights for policy 0, policy_version 83430 (0.0010) +[2023-10-08 19:06:59,716][21195] Updated weights for policy 0, policy_version 83440 (0.0010) +[2023-10-08 19:06:59,943][21194] Updated weights for policy 1, policy_version 82790 (0.0007) +[2023-10-08 19:07:00,086][21195] Updated weights for policy 0, policy_version 83450 (0.0007) +[2023-10-08 19:07:00,300][21194] Updated weights for policy 1, policy_version 82800 (0.0007) +[2023-10-08 19:07:00,663][21194] Updated weights for policy 1, policy_version 82810 (0.0008) +[2023-10-08 19:07:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 170262528. Throughput: 0: 1753.9, 1: 1699.4. Samples: 42577412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:03,803][19739] Avg episode reward: [(0, '974.710'), (1, '979.010')] +[2023-10-08 19:07:04,042][21195] Updated weights for policy 0, policy_version 83460 (0.0008) +[2023-10-08 19:07:04,408][21195] Updated weights for policy 0, policy_version 83470 (0.0010) +[2023-10-08 19:07:04,491][21194] Updated weights for policy 1, policy_version 82820 (0.0008) +[2023-10-08 19:07:04,780][21195] Updated weights for policy 0, policy_version 83480 (0.0007) +[2023-10-08 19:07:04,859][21194] Updated weights for policy 1, policy_version 82830 (0.0007) +[2023-10-08 19:07:05,219][21194] Updated weights for policy 1, policy_version 82840 (0.0010) +[2023-10-08 19:07:08,631][21195] Updated weights for policy 0, policy_version 83490 (0.0008) +[2023-10-08 19:07:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 170328064. Throughput: 0: 1737.9, 1: 1719.7. Samples: 42592972. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:08,803][19739] Avg episode reward: [(0, '974.710'), (1, '979.010')] +[2023-10-08 19:07:08,991][21195] Updated weights for policy 0, policy_version 83500 (0.0008) +[2023-10-08 19:07:09,124][21194] Updated weights for policy 1, policy_version 82850 (0.0010) +[2023-10-08 19:07:09,357][21195] Updated weights for policy 0, policy_version 83510 (0.0007) +[2023-10-08 19:07:09,490][21194] Updated weights for policy 1, policy_version 82860 (0.0008) +[2023-10-08 19:07:09,730][21195] Updated weights for policy 0, policy_version 83520 (0.0007) +[2023-10-08 19:07:09,850][21194] Updated weights for policy 1, policy_version 82870 (0.0008) +[2023-10-08 19:07:10,220][21194] Updated weights for policy 1, policy_version 82880 (0.0010) +[2023-10-08 19:07:13,697][21195] Updated weights for policy 0, policy_version 83530 (0.0007) +[2023-10-08 19:07:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 170393600. Throughput: 0: 1749.6, 1: 1741.4. Samples: 42614430. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:13,803][19739] Avg episode reward: [(0, '974.710'), (1, '979.010')] +[2023-10-08 19:07:14,028][21194] Updated weights for policy 1, policy_version 82890 (0.0010) +[2023-10-08 19:07:14,065][21195] Updated weights for policy 0, policy_version 83540 (0.0008) +[2023-10-08 19:07:14,400][21194] Updated weights for policy 1, policy_version 82900 (0.0010) +[2023-10-08 19:07:14,440][21195] Updated weights for policy 0, policy_version 83550 (0.0007) +[2023-10-08 19:07:14,510][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000083552_85557248.pth... +[2023-10-08 19:07:14,539][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000081920_83886080.pth +[2023-10-08 19:07:14,763][21194] Updated weights for policy 1, policy_version 82910 (0.0007) +[2023-10-08 19:07:14,833][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000082912_84901888.pth... +[2023-10-08 19:07:14,861][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000081280_83230720.pth +[2023-10-08 19:07:18,432][21195] Updated weights for policy 0, policy_version 83560 (0.0008) +[2023-10-08 19:07:18,730][21194] Updated weights for policy 1, policy_version 82920 (0.0008) +[2023-10-08 19:07:18,796][21195] Updated weights for policy 0, policy_version 83570 (0.0008) +[2023-10-08 19:07:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 170459136. Throughput: 0: 1731.8, 1: 1713.6. Samples: 42628950. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:18,803][19739] Avg episode reward: [(0, '974.710'), (1, '979.010')] +[2023-10-08 19:07:19,093][21194] Updated weights for policy 1, policy_version 82930 (0.0007) +[2023-10-08 19:07:19,173][21195] Updated weights for policy 0, policy_version 83580 (0.0009) +[2023-10-08 19:07:19,462][21194] Updated weights for policy 1, policy_version 82940 (0.0007) +[2023-10-08 19:07:23,203][21195] Updated weights for policy 0, policy_version 83590 (0.0008) +[2023-10-08 19:07:23,553][21194] Updated weights for policy 1, policy_version 82950 (0.0008) +[2023-10-08 19:07:23,572][21195] Updated weights for policy 0, policy_version 83600 (0.0009) +[2023-10-08 19:07:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 170524672. Throughput: 0: 1746.8, 1: 1743.4. Samples: 42644894. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:23,803][19739] Avg episode reward: [(0, '990.170'), (1, '979.010')] +[2023-10-08 19:07:23,921][21194] Updated weights for policy 1, policy_version 82960 (0.0007) +[2023-10-08 19:07:23,941][21195] Updated weights for policy 0, policy_version 83610 (0.0008) +[2023-10-08 19:07:24,275][21194] Updated weights for policy 1, policy_version 82970 (0.0010) +[2023-10-08 19:07:27,698][21195] Updated weights for policy 0, policy_version 83620 (0.0008) +[2023-10-08 19:07:28,068][21195] Updated weights for policy 0, policy_version 83630 (0.0009) +[2023-10-08 19:07:28,252][21194] Updated weights for policy 1, policy_version 82980 (0.0009) +[2023-10-08 19:07:28,437][21195] Updated weights for policy 0, policy_version 83640 (0.0009) +[2023-10-08 19:07:28,625][21194] Updated weights for policy 1, policy_version 82990 (0.0009) +[2023-10-08 19:07:28,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 170622976. Throughput: 0: 1739.5, 1: 1744.8. Samples: 42666290. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:28,803][19739] Avg episode reward: [(0, '1005.470'), (1, '994.280')] +[2023-10-08 19:07:28,986][21194] Updated weights for policy 1, policy_version 83000 (0.0008) +[2023-10-08 19:07:32,359][21195] Updated weights for policy 0, policy_version 83650 (0.0008) +[2023-10-08 19:07:32,727][21195] Updated weights for policy 0, policy_version 83660 (0.0008) +[2023-10-08 19:07:32,992][21194] Updated weights for policy 1, policy_version 83010 (0.0008) +[2023-10-08 19:07:33,101][21195] Updated weights for policy 0, policy_version 83670 (0.0009) +[2023-10-08 19:07:33,351][21194] Updated weights for policy 1, policy_version 83020 (0.0009) +[2023-10-08 19:07:33,458][21195] Updated weights for policy 0, policy_version 83680 (0.0010) +[2023-10-08 19:07:33,714][21194] Updated weights for policy 1, policy_version 83030 (0.0007) +[2023-10-08 19:07:33,802][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 170688512. Throughput: 0: 1712.6, 1: 1727.1. Samples: 42680564. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:07:33,803][19739] Avg episode reward: [(0, '1005.470'), (1, '994.280')] +[2023-10-08 19:07:34,076][21194] Updated weights for policy 1, policy_version 83040 (0.0009) +[2023-10-08 19:07:37,353][21195] Updated weights for policy 0, policy_version 83690 (0.0009) +[2023-10-08 19:07:37,716][21195] Updated weights for policy 0, policy_version 83700 (0.0008) +[2023-10-08 19:07:37,926][21194] Updated weights for policy 1, policy_version 83050 (0.0007) +[2023-10-08 19:07:38,087][21195] Updated weights for policy 0, policy_version 83710 (0.0008) +[2023-10-08 19:07:38,293][21194] Updated weights for policy 1, policy_version 83060 (0.0008) +[2023-10-08 19:07:38,661][21194] Updated weights for policy 1, policy_version 83070 (0.0008) +[2023-10-08 19:07:38,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 170786816. Throughput: 0: 1747.0, 1: 1745.5. Samples: 42697562. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:07:38,803][19739] Avg episode reward: [(0, '1005.470'), (1, '994.280')] +[2023-10-08 19:07:41,957][21195] Updated weights for policy 0, policy_version 83720 (0.0008) +[2023-10-08 19:07:42,319][21195] Updated weights for policy 0, policy_version 83730 (0.0007) +[2023-10-08 19:07:42,487][21194] Updated weights for policy 1, policy_version 83080 (0.0008) +[2023-10-08 19:07:42,696][21195] Updated weights for policy 0, policy_version 83740 (0.0009) +[2023-10-08 19:07:42,856][21194] Updated weights for policy 1, policy_version 83090 (0.0007) +[2023-10-08 19:07:43,229][21194] Updated weights for policy 1, policy_version 83100 (0.0009) +[2023-10-08 19:07:43,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 170852352. Throughput: 0: 1715.6, 1: 1729.4. Samples: 42716952. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:07:43,803][19739] Avg episode reward: [(0, '1020.760'), (1, '994.280')] +[2023-10-08 19:07:46,675][21195] Updated weights for policy 0, policy_version 83750 (0.0008) +[2023-10-08 19:07:47,072][21195] Updated weights for policy 0, policy_version 83760 (0.0009) +[2023-10-08 19:07:47,149][21194] Updated weights for policy 1, policy_version 83110 (0.0008) +[2023-10-08 19:07:47,439][21195] Updated weights for policy 0, policy_version 83770 (0.0010) +[2023-10-08 19:07:47,517][21194] Updated weights for policy 1, policy_version 83120 (0.0008) +[2023-10-08 19:07:47,873][21194] Updated weights for policy 1, policy_version 83130 (0.0009) +[2023-10-08 19:07:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 170917888. Throughput: 0: 1707.6, 1: 1745.0. Samples: 42732778. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:07:48,803][19739] Avg episode reward: [(0, '1036.380'), (1, '994.280')] +[2023-10-08 19:07:51,345][21195] Updated weights for policy 0, policy_version 83780 (0.0007) +[2023-10-08 19:07:51,720][21195] Updated weights for policy 0, policy_version 83790 (0.0008) +[2023-10-08 19:07:51,938][21194] Updated weights for policy 1, policy_version 83140 (0.0008) +[2023-10-08 19:07:52,089][21195] Updated weights for policy 0, policy_version 83800 (0.0010) +[2023-10-08 19:07:52,303][21194] Updated weights for policy 1, policy_version 83150 (0.0008) +[2023-10-08 19:07:52,671][21194] Updated weights for policy 1, policy_version 83160 (0.0007) +[2023-10-08 19:07:53,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 170983424. Throughput: 0: 1725.7, 1: 1728.5. Samples: 42748412. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:07:53,804][19739] Avg episode reward: [(0, '1051.070'), (1, '1009.100')] +[2023-10-08 19:07:56,035][21195] Updated weights for policy 0, policy_version 83810 (0.0010) +[2023-10-08 19:07:56,406][21195] Updated weights for policy 0, policy_version 83820 (0.0009) +[2023-10-08 19:07:56,653][21194] Updated weights for policy 1, policy_version 83170 (0.0007) +[2023-10-08 19:07:56,775][21195] Updated weights for policy 0, policy_version 83830 (0.0009) +[2023-10-08 19:07:57,021][21194] Updated weights for policy 1, policy_version 83180 (0.0007) +[2023-10-08 19:07:57,138][21195] Updated weights for policy 0, policy_version 83840 (0.0008) +[2023-10-08 19:07:57,379][21194] Updated weights for policy 1, policy_version 83190 (0.0009) +[2023-10-08 19:07:57,747][21194] Updated weights for policy 1, policy_version 83200 (0.0010) +[2023-10-08 19:07:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 171048960. Throughput: 0: 1707.7, 1: 1704.6. Samples: 42767984. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:07:58,803][19739] Avg episode reward: [(0, '1051.070'), (1, '1009.100')] +[2023-10-08 19:08:01,161][21195] Updated weights for policy 0, policy_version 83850 (0.0009) +[2023-10-08 19:08:01,525][21195] Updated weights for policy 0, policy_version 83860 (0.0008) +[2023-10-08 19:08:01,794][21194] Updated weights for policy 1, policy_version 83210 (0.0008) +[2023-10-08 19:08:01,894][21195] Updated weights for policy 0, policy_version 83870 (0.0007) +[2023-10-08 19:08:02,152][21194] Updated weights for policy 1, policy_version 83220 (0.0008) +[2023-10-08 19:08:02,524][21194] Updated weights for policy 1, policy_version 83230 (0.0010) +[2023-10-08 19:08:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 171114496. Throughput: 0: 1727.4, 1: 1734.2. Samples: 42784722. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:08:03,804][19739] Avg episode reward: [(0, '1051.070'), (1, '1009.100')] +[2023-10-08 19:08:05,748][21195] Updated weights for policy 0, policy_version 83880 (0.0009) +[2023-10-08 19:08:06,119][21195] Updated weights for policy 0, policy_version 83890 (0.0007) +[2023-10-08 19:08:06,406][21194] Updated weights for policy 1, policy_version 83240 (0.0007) +[2023-10-08 19:08:06,486][21195] Updated weights for policy 0, policy_version 83900 (0.0008) +[2023-10-08 19:08:06,779][21194] Updated weights for policy 1, policy_version 83250 (0.0007) +[2023-10-08 19:08:07,144][21194] Updated weights for policy 1, policy_version 83260 (0.0007) +[2023-10-08 19:08:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 171180032. Throughput: 0: 1713.3, 1: 1714.4. Samples: 42799138. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:08:08,803][19739] Avg episode reward: [(0, '1051.070'), (1, '1009.100')] +[2023-10-08 19:08:10,534][21195] Updated weights for policy 0, policy_version 83910 (0.0009) +[2023-10-08 19:08:10,902][21195] Updated weights for policy 0, policy_version 83920 (0.0007) +[2023-10-08 19:08:11,099][21194] Updated weights for policy 1, policy_version 83270 (0.0008) +[2023-10-08 19:08:11,269][21195] Updated weights for policy 0, policy_version 83930 (0.0008) +[2023-10-08 19:08:11,457][21194] Updated weights for policy 1, policy_version 83280 (0.0007) +[2023-10-08 19:08:11,813][21194] Updated weights for policy 1, policy_version 83290 (0.0007) +[2023-10-08 19:08:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 171245568. Throughput: 0: 1712.1, 1: 1707.0. Samples: 42820150. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:08:13,803][19739] Avg episode reward: [(0, '1051.070'), (1, '1039.420')] +[2023-10-08 19:08:15,099][21195] Updated weights for policy 0, policy_version 83940 (0.0009) +[2023-10-08 19:08:15,468][21195] Updated weights for policy 0, policy_version 83950 (0.0010) +[2023-10-08 19:08:15,600][21194] Updated weights for policy 1, policy_version 83300 (0.0008) +[2023-10-08 19:08:15,844][21195] Updated weights for policy 0, policy_version 83960 (0.0010) +[2023-10-08 19:08:15,962][21194] Updated weights for policy 1, policy_version 83310 (0.0008) +[2023-10-08 19:08:16,327][21194] Updated weights for policy 1, policy_version 83320 (0.0010) +[2023-10-08 19:08:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 171311104. Throughput: 0: 1733.5, 1: 1727.0. Samples: 42836288. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:08:18,804][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:19,806][21195] Updated weights for policy 0, policy_version 83970 (0.0008) +[2023-10-08 19:08:20,176][21195] Updated weights for policy 0, policy_version 83980 (0.0009) +[2023-10-08 19:08:20,230][21194] Updated weights for policy 1, policy_version 83330 (0.0008) +[2023-10-08 19:08:20,549][21195] Updated weights for policy 0, policy_version 83990 (0.0008) +[2023-10-08 19:08:20,602][21194] Updated weights for policy 1, policy_version 83340 (0.0008) +[2023-10-08 19:08:20,909][21195] Updated weights for policy 0, policy_version 84000 (0.0008) +[2023-10-08 19:08:20,960][21194] Updated weights for policy 1, policy_version 83350 (0.0009) +[2023-10-08 19:08:21,328][21194] Updated weights for policy 1, policy_version 83360 (0.0007) +[2023-10-08 19:08:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 171376640. Throughput: 0: 1698.6, 1: 1711.5. Samples: 42851018. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:08:23,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:24,996][21195] Updated weights for policy 0, policy_version 84010 (0.0008) +[2023-10-08 19:08:25,361][21195] Updated weights for policy 0, policy_version 84020 (0.0009) +[2023-10-08 19:08:25,387][21194] Updated weights for policy 1, policy_version 83370 (0.0009) +[2023-10-08 19:08:25,729][21195] Updated weights for policy 0, policy_version 84030 (0.0008) +[2023-10-08 19:08:25,756][21194] Updated weights for policy 1, policy_version 83380 (0.0007) +[2023-10-08 19:08:26,114][21194] Updated weights for policy 1, policy_version 83390 (0.0008) +[2023-10-08 19:08:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 171442176. Throughput: 0: 1729.1, 1: 1722.9. Samples: 42872292. Policy #0 lag: (min: 31.0, avg: 38.5, max: 63.0) +[2023-10-08 19:08:28,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:29,675][21195] Updated weights for policy 0, policy_version 84040 (0.0009) +[2023-10-08 19:08:30,045][21195] Updated weights for policy 0, policy_version 84050 (0.0008) +[2023-10-08 19:08:30,247][21194] Updated weights for policy 1, policy_version 83400 (0.0008) +[2023-10-08 19:08:30,411][21195] Updated weights for policy 0, policy_version 84060 (0.0009) +[2023-10-08 19:08:30,617][21194] Updated weights for policy 1, policy_version 83410 (0.0009) +[2023-10-08 19:08:30,974][21194] Updated weights for policy 1, policy_version 83420 (0.0009) +[2023-10-08 19:08:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 171507712. Throughput: 0: 1734.1, 1: 1709.8. Samples: 42887752. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:08:33,804][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:34,321][21195] Updated weights for policy 0, policy_version 84070 (0.0007) +[2023-10-08 19:08:34,699][21195] Updated weights for policy 0, policy_version 84080 (0.0008) +[2023-10-08 19:08:34,872][21194] Updated weights for policy 1, policy_version 83430 (0.0008) +[2023-10-08 19:08:35,060][21195] Updated weights for policy 0, policy_version 84090 (0.0009) +[2023-10-08 19:08:35,241][21194] Updated weights for policy 1, policy_version 83440 (0.0007) +[2023-10-08 19:08:35,602][21194] Updated weights for policy 1, policy_version 83450 (0.0008) +[2023-10-08 19:08:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 171573248. Throughput: 0: 1717.0, 1: 1718.3. Samples: 42903000. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:08:38,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:38,950][21195] Updated weights for policy 0, policy_version 84100 (0.0008) +[2023-10-08 19:08:39,322][21195] Updated weights for policy 0, policy_version 84110 (0.0008) +[2023-10-08 19:08:39,548][21194] Updated weights for policy 1, policy_version 83460 (0.0009) +[2023-10-08 19:08:39,694][21195] Updated weights for policy 0, policy_version 84120 (0.0007) +[2023-10-08 19:08:39,925][21194] Updated weights for policy 1, policy_version 83470 (0.0007) +[2023-10-08 19:08:40,290][21194] Updated weights for policy 1, policy_version 83480 (0.0008) +[2023-10-08 19:08:43,623][21195] Updated weights for policy 0, policy_version 84130 (0.0007) +[2023-10-08 19:08:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 171638784. Throughput: 0: 1735.6, 1: 1739.5. Samples: 42924366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:08:43,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:43,995][21195] Updated weights for policy 0, policy_version 84140 (0.0010) +[2023-10-08 19:08:44,320][21194] Updated weights for policy 1, policy_version 83490 (0.0008) +[2023-10-08 19:08:44,358][21195] Updated weights for policy 0, policy_version 84150 (0.0008) +[2023-10-08 19:08:44,676][21194] Updated weights for policy 1, policy_version 83500 (0.0008) +[2023-10-08 19:08:44,724][21195] Updated weights for policy 0, policy_version 84160 (0.0007) +[2023-10-08 19:08:45,039][21194] Updated weights for policy 1, policy_version 83510 (0.0009) +[2023-10-08 19:08:45,409][21194] Updated weights for policy 1, policy_version 83520 (0.0008) +[2023-10-08 19:08:48,740][21195] Updated weights for policy 0, policy_version 84170 (0.0010) +[2023-10-08 19:08:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 171704320. Throughput: 0: 1724.0, 1: 1710.3. Samples: 42939266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:08:48,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1039.420')] +[2023-10-08 19:08:49,106][21195] Updated weights for policy 0, policy_version 84180 (0.0008) +[2023-10-08 19:08:49,301][21194] Updated weights for policy 1, policy_version 83530 (0.0010) +[2023-10-08 19:08:49,469][21195] Updated weights for policy 0, policy_version 84190 (0.0009) +[2023-10-08 19:08:49,666][21194] Updated weights for policy 1, policy_version 83540 (0.0009) +[2023-10-08 19:08:50,027][21194] Updated weights for policy 1, policy_version 83550 (0.0008) +[2023-10-08 19:08:53,360][21195] Updated weights for policy 0, policy_version 84200 (0.0007) +[2023-10-08 19:08:53,715][21195] Updated weights for policy 0, policy_version 84210 (0.0007) +[2023-10-08 19:08:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 171769856. Throughput: 0: 1734.0, 1: 1727.0. Samples: 42954882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:08:53,804][19739] Avg episode reward: [(0, '1037.220'), (1, '1054.600')] +[2023-10-08 19:08:53,972][21194] Updated weights for policy 1, policy_version 83560 (0.0008) +[2023-10-08 19:08:54,084][21195] Updated weights for policy 0, policy_version 84220 (0.0008) +[2023-10-08 19:08:54,335][21194] Updated weights for policy 1, policy_version 83570 (0.0008) +[2023-10-08 19:08:54,703][21194] Updated weights for policy 1, policy_version 83580 (0.0007) +[2023-10-08 19:08:58,116][21195] Updated weights for policy 0, policy_version 84230 (0.0008) +[2023-10-08 19:08:58,475][21195] Updated weights for policy 0, policy_version 84240 (0.0008) +[2023-10-08 19:08:58,565][21194] Updated weights for policy 1, policy_version 83590 (0.0008) +[2023-10-08 19:08:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 171835392. Throughput: 0: 1737.9, 1: 1733.2. Samples: 42976348. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:08:58,804][19739] Avg episode reward: [(0, '1037.220'), (1, '1054.600')] +[2023-10-08 19:08:58,845][21195] Updated weights for policy 0, policy_version 84250 (0.0008) +[2023-10-08 19:08:58,929][21194] Updated weights for policy 1, policy_version 83600 (0.0008) +[2023-10-08 19:08:59,305][21194] Updated weights for policy 1, policy_version 83610 (0.0008) +[2023-10-08 19:09:02,628][21195] Updated weights for policy 0, policy_version 84260 (0.0008) +[2023-10-08 19:09:02,995][21195] Updated weights for policy 0, policy_version 84270 (0.0011) +[2023-10-08 19:09:03,284][21194] Updated weights for policy 1, policy_version 83620 (0.0007) +[2023-10-08 19:09:03,367][21195] Updated weights for policy 0, policy_version 84280 (0.0008) +[2023-10-08 19:09:03,655][21194] Updated weights for policy 1, policy_version 83630 (0.0008) +[2023-10-08 19:09:03,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 171933696. Throughput: 0: 1710.1, 1: 1712.8. Samples: 42990318. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:09:03,804][19739] Avg episode reward: [(0, '1037.220'), (1, '1054.600')] +[2023-10-08 19:09:04,025][21194] Updated weights for policy 1, policy_version 83640 (0.0009) +[2023-10-08 19:09:07,438][21195] Updated weights for policy 0, policy_version 84290 (0.0009) +[2023-10-08 19:09:07,803][21195] Updated weights for policy 0, policy_version 84300 (0.0007) +[2023-10-08 19:09:07,951][21194] Updated weights for policy 1, policy_version 83650 (0.0009) +[2023-10-08 19:09:08,170][21195] Updated weights for policy 0, policy_version 84310 (0.0008) +[2023-10-08 19:09:08,315][21194] Updated weights for policy 1, policy_version 83660 (0.0007) +[2023-10-08 19:09:08,527][21195] Updated weights for policy 0, policy_version 84320 (0.0008) +[2023-10-08 19:09:08,687][21194] Updated weights for policy 1, policy_version 83670 (0.0010) +[2023-10-08 19:09:08,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 171999232. Throughput: 0: 1742.3, 1: 1725.2. Samples: 43007058. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:09:08,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1069.080')] +[2023-10-08 19:09:09,050][21194] Updated weights for policy 1, policy_version 83680 (0.0011) +[2023-10-08 19:09:12,397][21195] Updated weights for policy 0, policy_version 84330 (0.0008) +[2023-10-08 19:09:12,755][21195] Updated weights for policy 0, policy_version 84340 (0.0009) +[2023-10-08 19:09:13,117][21195] Updated weights for policy 0, policy_version 84350 (0.0009) +[2023-10-08 19:09:13,131][21194] Updated weights for policy 1, policy_version 83690 (0.0008) +[2023-10-08 19:09:13,494][21194] Updated weights for policy 1, policy_version 83700 (0.0007) +[2023-10-08 19:09:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 172064768. Throughput: 0: 1721.7, 1: 1725.9. Samples: 43027432. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:09:13,803][19739] Avg episode reward: [(0, '1037.220'), (1, '1069.080')] +[2023-10-08 19:09:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000084352_86376448.pth... +[2023-10-08 19:09:13,847][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000082720_84705280.pth +[2023-10-08 19:09:13,856][21194] Updated weights for policy 1, policy_version 83710 (0.0010) +[2023-10-08 19:09:13,921][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000083712_85721088.pth... +[2023-10-08 19:09:13,964][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000082080_84049920.pth +[2023-10-08 19:09:16,940][21195] Updated weights for policy 0, policy_version 84360 (0.0010) +[2023-10-08 19:09:17,305][21195] Updated weights for policy 0, policy_version 84370 (0.0009) +[2023-10-08 19:09:17,689][21195] Updated weights for policy 0, policy_version 84380 (0.0009) +[2023-10-08 19:09:17,919][21194] Updated weights for policy 1, policy_version 83720 (0.0010) +[2023-10-08 19:09:18,288][21194] Updated weights for policy 1, policy_version 83730 (0.0008) +[2023-10-08 19:09:18,645][21194] Updated weights for policy 1, policy_version 83740 (0.0009) +[2023-10-08 19:09:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 172163072. Throughput: 0: 1716.5, 1: 1724.3. Samples: 43042588. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:09:18,803][19739] Avg episode reward: [(0, '1052.840'), (1, '1084.280')] +[2023-10-08 19:09:21,778][21195] Updated weights for policy 0, policy_version 84390 (0.0010) +[2023-10-08 19:09:22,140][21195] Updated weights for policy 0, policy_version 84400 (0.0008) +[2023-10-08 19:09:22,515][21195] Updated weights for policy 0, policy_version 84410 (0.0007) +[2023-10-08 19:09:22,671][21194] Updated weights for policy 1, policy_version 83750 (0.0009) +[2023-10-08 19:09:23,041][21194] Updated weights for policy 1, policy_version 83760 (0.0007) +[2023-10-08 19:09:23,403][21194] Updated weights for policy 1, policy_version 83770 (0.0011) +[2023-10-08 19:09:23,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 172228608. Throughput: 0: 1739.2, 1: 1719.5. Samples: 43058640. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:23,803][19739] Avg episode reward: [(0, '1052.840'), (1, '1084.280')] +[2023-10-08 19:09:26,320][21195] Updated weights for policy 0, policy_version 84420 (0.0008) +[2023-10-08 19:09:26,687][21195] Updated weights for policy 0, policy_version 84430 (0.0007) +[2023-10-08 19:09:27,053][21195] Updated weights for policy 0, policy_version 84440 (0.0008) +[2023-10-08 19:09:27,353][21194] Updated weights for policy 1, policy_version 83780 (0.0007) +[2023-10-08 19:09:27,719][21194] Updated weights for policy 1, policy_version 83790 (0.0007) +[2023-10-08 19:09:28,077][21194] Updated weights for policy 1, policy_version 83800 (0.0007) +[2023-10-08 19:09:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 172294144. Throughput: 0: 1718.3, 1: 1703.0. Samples: 43078326. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:28,804][19739] Avg episode reward: [(0, '1052.840'), (1, '1084.280')] +[2023-10-08 19:09:30,954][21195] Updated weights for policy 0, policy_version 84450 (0.0011) +[2023-10-08 19:09:31,325][21195] Updated weights for policy 0, policy_version 84460 (0.0011) +[2023-10-08 19:09:31,687][21195] Updated weights for policy 0, policy_version 84470 (0.0010) +[2023-10-08 19:09:32,058][21195] Updated weights for policy 0, policy_version 84480 (0.0010) +[2023-10-08 19:09:32,148][21194] Updated weights for policy 1, policy_version 83810 (0.0008) +[2023-10-08 19:09:32,522][21194] Updated weights for policy 1, policy_version 83820 (0.0008) +[2023-10-08 19:09:32,903][21194] Updated weights for policy 1, policy_version 83830 (0.0008) +[2023-10-08 19:09:33,264][21194] Updated weights for policy 1, policy_version 83840 (0.0008) +[2023-10-08 19:09:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 172359680. Throughput: 0: 1731.6, 1: 1722.0. Samples: 43094678. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:33,803][19739] Avg episode reward: [(0, '1052.840'), (1, '1084.280')] +[2023-10-08 19:09:35,954][21195] Updated weights for policy 0, policy_version 84490 (0.0010) +[2023-10-08 19:09:36,326][21195] Updated weights for policy 0, policy_version 84500 (0.0008) +[2023-10-08 19:09:36,698][21195] Updated weights for policy 0, policy_version 84510 (0.0007) +[2023-10-08 19:09:37,231][21194] Updated weights for policy 1, policy_version 83850 (0.0009) +[2023-10-08 19:09:37,596][21194] Updated weights for policy 1, policy_version 83860 (0.0009) +[2023-10-08 19:09:37,970][21194] Updated weights for policy 1, policy_version 83870 (0.0008) +[2023-10-08 19:09:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 172425216. Throughput: 0: 1723.6, 1: 1721.1. Samples: 43109894. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:38,804][19739] Avg episode reward: [(0, '1083.710'), (1, '1109.640')] +[2023-10-08 19:09:40,645][21195] Updated weights for policy 0, policy_version 84520 (0.0009) +[2023-10-08 19:09:41,013][21195] Updated weights for policy 0, policy_version 84530 (0.0008) +[2023-10-08 19:09:41,377][21195] Updated weights for policy 0, policy_version 84540 (0.0008) +[2023-10-08 19:09:41,783][21194] Updated weights for policy 1, policy_version 83880 (0.0010) +[2023-10-08 19:09:42,155][21194] Updated weights for policy 1, policy_version 83890 (0.0008) +[2023-10-08 19:09:42,517][21194] Updated weights for policy 1, policy_version 83900 (0.0008) +[2023-10-08 19:09:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 172490752. Throughput: 0: 1722.0, 1: 1695.6. Samples: 43130136. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:43,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1109.640')] +[2023-10-08 19:09:45,204][21195] Updated weights for policy 0, policy_version 84550 (0.0007) +[2023-10-08 19:09:45,569][21195] Updated weights for policy 0, policy_version 84560 (0.0009) +[2023-10-08 19:09:45,942][21195] Updated weights for policy 0, policy_version 84570 (0.0008) +[2023-10-08 19:09:46,550][21194] Updated weights for policy 1, policy_version 83910 (0.0007) +[2023-10-08 19:09:46,921][21194] Updated weights for policy 1, policy_version 83920 (0.0011) +[2023-10-08 19:09:47,278][21194] Updated weights for policy 1, policy_version 83930 (0.0009) +[2023-10-08 19:09:48,803][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 172556288. Throughput: 0: 1755.2, 1: 1725.1. Samples: 43146930. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:48,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1124.890')] +[2023-10-08 19:09:49,894][21195] Updated weights for policy 0, policy_version 84580 (0.0008) +[2023-10-08 19:09:50,253][21195] Updated weights for policy 0, policy_version 84590 (0.0008) +[2023-10-08 19:09:50,620][21195] Updated weights for policy 0, policy_version 84600 (0.0007) +[2023-10-08 19:09:51,426][21194] Updated weights for policy 1, policy_version 83940 (0.0008) +[2023-10-08 19:09:51,779][21194] Updated weights for policy 1, policy_version 83950 (0.0010) +[2023-10-08 19:09:52,141][21194] Updated weights for policy 1, policy_version 83960 (0.0010) +[2023-10-08 19:09:53,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 172621824. Throughput: 0: 1723.2, 1: 1704.0. Samples: 43161282. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:53,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1124.890')] +[2023-10-08 19:09:54,591][21195] Updated weights for policy 0, policy_version 84610 (0.0010) +[2023-10-08 19:09:54,965][21195] Updated weights for policy 0, policy_version 84620 (0.0009) +[2023-10-08 19:09:55,329][21195] Updated weights for policy 0, policy_version 84630 (0.0009) +[2023-10-08 19:09:55,688][21195] Updated weights for policy 0, policy_version 84640 (0.0008) +[2023-10-08 19:09:56,132][21194] Updated weights for policy 1, policy_version 83970 (0.0009) +[2023-10-08 19:09:56,499][21194] Updated weights for policy 1, policy_version 83980 (0.0010) +[2023-10-08 19:09:56,863][21194] Updated weights for policy 1, policy_version 83990 (0.0010) +[2023-10-08 19:09:57,238][21194] Updated weights for policy 1, policy_version 84000 (0.0010) +[2023-10-08 19:09:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 172687360. Throughput: 0: 1742.5, 1: 1690.1. Samples: 43181898. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:09:58,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1140.120')] +[2023-10-08 19:09:59,557][21195] Updated weights for policy 0, policy_version 84650 (0.0008) +[2023-10-08 19:09:59,923][21195] Updated weights for policy 0, policy_version 84660 (0.0007) +[2023-10-08 19:10:00,296][21195] Updated weights for policy 0, policy_version 84670 (0.0008) +[2023-10-08 19:10:01,192][21194] Updated weights for policy 1, policy_version 84010 (0.0009) +[2023-10-08 19:10:01,560][21194] Updated weights for policy 1, policy_version 84020 (0.0010) +[2023-10-08 19:10:01,915][21194] Updated weights for policy 1, policy_version 84030 (0.0008) +[2023-10-08 19:10:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 172752896. Throughput: 0: 1751.2, 1: 1711.5. Samples: 43198410. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:10:03,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1140.000')] +[2023-10-08 19:10:04,084][21195] Updated weights for policy 0, policy_version 84680 (0.0007) +[2023-10-08 19:10:04,451][21195] Updated weights for policy 0, policy_version 84690 (0.0008) +[2023-10-08 19:10:04,824][21195] Updated weights for policy 0, policy_version 84700 (0.0008) +[2023-10-08 19:10:05,653][21194] Updated weights for policy 1, policy_version 84040 (0.0008) +[2023-10-08 19:10:06,024][21194] Updated weights for policy 1, policy_version 84050 (0.0009) +[2023-10-08 19:10:06,385][21194] Updated weights for policy 1, policy_version 84060 (0.0008) +[2023-10-08 19:10:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 172818432. Throughput: 0: 1728.4, 1: 1698.3. Samples: 43212844. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:10:08,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1114.740')] +[2023-10-08 19:10:08,806][21195] Updated weights for policy 0, policy_version 84710 (0.0009) +[2023-10-08 19:10:09,181][21195] Updated weights for policy 0, policy_version 84720 (0.0007) +[2023-10-08 19:10:09,552][21195] Updated weights for policy 0, policy_version 84730 (0.0008) +[2023-10-08 19:10:10,431][21194] Updated weights for policy 1, policy_version 84070 (0.0007) +[2023-10-08 19:10:10,801][21194] Updated weights for policy 1, policy_version 84080 (0.0008) +[2023-10-08 19:10:11,170][21194] Updated weights for policy 1, policy_version 84090 (0.0009) +[2023-10-08 19:10:13,481][21195] Updated weights for policy 0, policy_version 84740 (0.0010) +[2023-10-08 19:10:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 172883968. Throughput: 0: 1747.7, 1: 1717.6. Samples: 43234264. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:10:13,804][19739] Avg episode reward: [(0, '1098.860'), (1, '1114.740')] +[2023-10-08 19:10:13,854][21195] Updated weights for policy 0, policy_version 84750 (0.0009) +[2023-10-08 19:10:14,226][21195] Updated weights for policy 0, policy_version 84760 (0.0008) +[2023-10-08 19:10:15,114][21194] Updated weights for policy 1, policy_version 84100 (0.0009) +[2023-10-08 19:10:15,480][21194] Updated weights for policy 1, policy_version 84110 (0.0010) +[2023-10-08 19:10:15,843][21194] Updated weights for policy 1, policy_version 84120 (0.0010) +[2023-10-08 19:10:18,085][21195] Updated weights for policy 0, policy_version 84770 (0.0010) +[2023-10-08 19:10:18,451][21195] Updated weights for policy 0, policy_version 84780 (0.0008) +[2023-10-08 19:10:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 172949504. Throughput: 0: 1729.6, 1: 1702.8. Samples: 43249140. Policy #0 lag: (min: 19.0, avg: 19.1, max: 27.0) +[2023-10-08 19:10:18,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1114.740')] +[2023-10-08 19:10:18,821][21195] Updated weights for policy 0, policy_version 84790 (0.0009) +[2023-10-08 19:10:19,181][21195] Updated weights for policy 0, policy_version 84800 (0.0010) +[2023-10-08 19:10:19,908][21194] Updated weights for policy 1, policy_version 84130 (0.0009) +[2023-10-08 19:10:20,280][21194] Updated weights for policy 1, policy_version 84140 (0.0009) +[2023-10-08 19:10:20,645][21194] Updated weights for policy 1, policy_version 84150 (0.0007) +[2023-10-08 19:10:21,000][21194] Updated weights for policy 1, policy_version 84160 (0.0009) +[2023-10-08 19:10:23,236][21195] Updated weights for policy 0, policy_version 84810 (0.0010) +[2023-10-08 19:10:23,593][21195] Updated weights for policy 0, policy_version 84820 (0.0008) +[2023-10-08 19:10:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 173015040. Throughput: 0: 1746.3, 1: 1699.4. Samples: 43264950. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:23,803][19739] Avg episode reward: [(0, '1098.860'), (1, '1114.740')] +[2023-10-08 19:10:23,968][21195] Updated weights for policy 0, policy_version 84830 (0.0009) +[2023-10-08 19:10:25,160][21194] Updated weights for policy 1, policy_version 84170 (0.0007) +[2023-10-08 19:10:25,538][21194] Updated weights for policy 1, policy_version 84180 (0.0008) +[2023-10-08 19:10:25,897][21194] Updated weights for policy 1, policy_version 84190 (0.0009) +[2023-10-08 19:10:27,938][21195] Updated weights for policy 0, policy_version 84840 (0.0010) +[2023-10-08 19:10:28,313][21195] Updated weights for policy 0, policy_version 84850 (0.0009) +[2023-10-08 19:10:28,679][21195] Updated weights for policy 0, policy_version 84860 (0.0010) +[2023-10-08 19:10:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 173080576. Throughput: 0: 1740.5, 1: 1717.2. Samples: 43285734. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:28,803][19739] Avg episode reward: [(0, '1098.630'), (1, '1107.940')] +[2023-10-08 19:10:29,872][21194] Updated weights for policy 1, policy_version 84200 (0.0008) +[2023-10-08 19:10:30,243][21194] Updated weights for policy 1, policy_version 84210 (0.0008) +[2023-10-08 19:10:30,609][21194] Updated weights for policy 1, policy_version 84220 (0.0007) +[2023-10-08 19:10:32,561][21195] Updated weights for policy 0, policy_version 84870 (0.0009) +[2023-10-08 19:10:32,928][21195] Updated weights for policy 0, policy_version 84880 (0.0009) +[2023-10-08 19:10:33,296][21195] Updated weights for policy 0, policy_version 84890 (0.0008) +[2023-10-08 19:10:33,803][19739] Fps is (10 sec: 16383.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 173178880. Throughput: 0: 1713.1, 1: 1689.6. Samples: 43300054. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:33,804][19739] Avg episode reward: [(0, '1098.630'), (1, '1100.160')] +[2023-10-08 19:10:34,440][21194] Updated weights for policy 1, policy_version 84230 (0.0007) +[2023-10-08 19:10:34,804][21194] Updated weights for policy 1, policy_version 84240 (0.0007) +[2023-10-08 19:10:35,167][21194] Updated weights for policy 1, policy_version 84250 (0.0007) +[2023-10-08 19:10:37,304][21195] Updated weights for policy 0, policy_version 84900 (0.0009) +[2023-10-08 19:10:37,684][21195] Updated weights for policy 0, policy_version 84910 (0.0010) +[2023-10-08 19:10:38,054][21195] Updated weights for policy 0, policy_version 84920 (0.0010) +[2023-10-08 19:10:38,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 173244416. Throughput: 0: 1744.8, 1: 1714.0. Samples: 43316928. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:38,803][19739] Avg episode reward: [(0, '1099.180'), (1, '1100.160')] +[2023-10-08 19:10:39,125][21194] Updated weights for policy 1, policy_version 84260 (0.0007) +[2023-10-08 19:10:39,485][21194] Updated weights for policy 1, policy_version 84270 (0.0009) +[2023-10-08 19:10:39,847][21194] Updated weights for policy 1, policy_version 84280 (0.0009) +[2023-10-08 19:10:41,883][21195] Updated weights for policy 0, policy_version 84930 (0.0008) +[2023-10-08 19:10:42,256][21195] Updated weights for policy 0, policy_version 84940 (0.0009) +[2023-10-08 19:10:42,632][21195] Updated weights for policy 0, policy_version 84950 (0.0009) +[2023-10-08 19:10:42,997][21195] Updated weights for policy 0, policy_version 84960 (0.0007) +[2023-10-08 19:10:43,754][21194] Updated weights for policy 1, policy_version 84290 (0.0008) +[2023-10-08 19:10:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 173309952. Throughput: 0: 1722.3, 1: 1732.9. Samples: 43337384. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:43,803][19739] Avg episode reward: [(0, '1071.960'), (1, '1100.160')] +[2023-10-08 19:10:44,114][21194] Updated weights for policy 1, policy_version 84300 (0.0009) +[2023-10-08 19:10:44,491][21194] Updated weights for policy 1, policy_version 84310 (0.0007) +[2023-10-08 19:10:44,859][21194] Updated weights for policy 1, policy_version 84320 (0.0007) +[2023-10-08 19:10:46,902][21195] Updated weights for policy 0, policy_version 84970 (0.0008) +[2023-10-08 19:10:47,276][21195] Updated weights for policy 0, policy_version 84980 (0.0008) +[2023-10-08 19:10:47,651][21195] Updated weights for policy 0, policy_version 84990 (0.0009) +[2023-10-08 19:10:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 173375488. Throughput: 0: 1716.9, 1: 1710.4. Samples: 43352638. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:48,803][19739] Avg episode reward: [(0, '1071.860'), (1, '1104.560')] +[2023-10-08 19:10:48,970][21194] Updated weights for policy 1, policy_version 84330 (0.0008) +[2023-10-08 19:10:49,334][21194] Updated weights for policy 1, policy_version 84340 (0.0011) +[2023-10-08 19:10:49,706][21194] Updated weights for policy 1, policy_version 84350 (0.0009) +[2023-10-08 19:10:51,670][21195] Updated weights for policy 0, policy_version 85000 (0.0008) +[2023-10-08 19:10:52,027][21195] Updated weights for policy 0, policy_version 85010 (0.0009) +[2023-10-08 19:10:52,398][21195] Updated weights for policy 0, policy_version 85020 (0.0009) +[2023-10-08 19:10:53,468][21194] Updated weights for policy 1, policy_version 84360 (0.0008) +[2023-10-08 19:10:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 173441024. Throughput: 0: 1735.4, 1: 1727.9. Samples: 43368692. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:53,803][19739] Avg episode reward: [(0, '1070.110'), (1, '1104.560')] +[2023-10-08 19:10:53,829][21194] Updated weights for policy 1, policy_version 84370 (0.0010) +[2023-10-08 19:10:54,194][21194] Updated weights for policy 1, policy_version 84380 (0.0008) +[2023-10-08 19:10:56,229][21195] Updated weights for policy 0, policy_version 85030 (0.0008) +[2023-10-08 19:10:56,614][21195] Updated weights for policy 0, policy_version 85040 (0.0007) +[2023-10-08 19:10:56,979][21195] Updated weights for policy 0, policy_version 85050 (0.0007) +[2023-10-08 19:10:58,093][21194] Updated weights for policy 1, policy_version 84390 (0.0008) +[2023-10-08 19:10:58,466][21194] Updated weights for policy 1, policy_version 84400 (0.0009) +[2023-10-08 19:10:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 173506560. Throughput: 0: 1715.8, 1: 1723.7. Samples: 43389042. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:10:58,803][19739] Avg episode reward: [(0, '1070.110'), (1, '1104.560')] +[2023-10-08 19:10:58,834][21194] Updated weights for policy 1, policy_version 84410 (0.0008) +[2023-10-08 19:11:00,859][21195] Updated weights for policy 0, policy_version 85060 (0.0008) +[2023-10-08 19:11:01,223][21195] Updated weights for policy 0, policy_version 85070 (0.0009) +[2023-10-08 19:11:01,598][21195] Updated weights for policy 0, policy_version 85080 (0.0008) +[2023-10-08 19:11:02,771][21194] Updated weights for policy 1, policy_version 84420 (0.0008) +[2023-10-08 19:11:03,138][21194] Updated weights for policy 1, policy_version 84430 (0.0009) +[2023-10-08 19:11:03,496][21194] Updated weights for policy 1, policy_version 84440 (0.0007) +[2023-10-08 19:11:03,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 173604864. Throughput: 0: 1735.2, 1: 1721.7. Samples: 43404698. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:11:03,803][19739] Avg episode reward: [(0, '1070.110'), (1, '1104.560')] +[2023-10-08 19:11:05,515][21195] Updated weights for policy 0, policy_version 85090 (0.0009) +[2023-10-08 19:11:05,882][21195] Updated weights for policy 0, policy_version 85100 (0.0010) +[2023-10-08 19:11:06,251][21195] Updated weights for policy 0, policy_version 85110 (0.0010) +[2023-10-08 19:11:06,613][21195] Updated weights for policy 0, policy_version 85120 (0.0008) +[2023-10-08 19:11:07,578][21194] Updated weights for policy 1, policy_version 84450 (0.0010) +[2023-10-08 19:11:07,943][21194] Updated weights for policy 1, policy_version 84460 (0.0010) +[2023-10-08 19:11:08,305][21194] Updated weights for policy 1, policy_version 84470 (0.0008) +[2023-10-08 19:11:08,668][21194] Updated weights for policy 1, policy_version 84480 (0.0007) +[2023-10-08 19:11:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 173670400. Throughput: 0: 1717.8, 1: 1730.3. Samples: 43420116. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 19:11:08,803][19739] Avg episode reward: [(0, '1070.110'), (1, '1104.560')] +[2023-10-08 19:11:10,461][21195] Updated weights for policy 0, policy_version 85130 (0.0009) +[2023-10-08 19:11:10,828][21195] Updated weights for policy 0, policy_version 85140 (0.0009) +[2023-10-08 19:11:11,202][21195] Updated weights for policy 0, policy_version 85150 (0.0009) +[2023-10-08 19:11:12,693][21194] Updated weights for policy 1, policy_version 84490 (0.0009) +[2023-10-08 19:11:13,066][21194] Updated weights for policy 1, policy_version 84500 (0.0009) +[2023-10-08 19:11:13,430][21194] Updated weights for policy 1, policy_version 84510 (0.0009) +[2023-10-08 19:11:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 173735936. Throughput: 0: 1729.7, 1: 1716.3. Samples: 43440806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:13,804][19739] Avg episode reward: [(0, '1101.340'), (1, '1104.560')] +[2023-10-08 19:11:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000085152_87195648.pth... +[2023-10-08 19:11:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000084512_86540288.pth... +[2023-10-08 19:11:13,849][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000082912_84901888.pth +[2023-10-08 19:11:13,853][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000083552_85557248.pth +[2023-10-08 19:11:15,101][21195] Updated weights for policy 0, policy_version 85160 (0.0008) +[2023-10-08 19:11:15,464][21195] Updated weights for policy 0, policy_version 85170 (0.0010) +[2023-10-08 19:11:15,834][21195] Updated weights for policy 0, policy_version 85180 (0.0009) +[2023-10-08 19:11:17,414][21194] Updated weights for policy 1, policy_version 84520 (0.0008) +[2023-10-08 19:11:17,779][21194] Updated weights for policy 1, policy_version 84530 (0.0008) +[2023-10-08 19:11:18,137][21194] Updated weights for policy 1, policy_version 84540 (0.0008) +[2023-10-08 19:11:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 173801472. Throughput: 0: 1757.3, 1: 1730.1. Samples: 43456986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:18,803][19739] Avg episode reward: [(0, '1101.340'), (1, '1104.560')] +[2023-10-08 19:11:19,560][21195] Updated weights for policy 0, policy_version 85190 (0.0009) +[2023-10-08 19:11:19,927][21195] Updated weights for policy 0, policy_version 85200 (0.0010) +[2023-10-08 19:11:20,308][21195] Updated weights for policy 0, policy_version 85210 (0.0008) +[2023-10-08 19:11:22,288][21194] Updated weights for policy 1, policy_version 84550 (0.0009) +[2023-10-08 19:11:22,666][21194] Updated weights for policy 1, policy_version 84560 (0.0008) +[2023-10-08 19:11:23,030][21194] Updated weights for policy 1, policy_version 84570 (0.0008) +[2023-10-08 19:11:23,802][19739] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 173867008. Throughput: 0: 1727.2, 1: 1724.4. Samples: 43472252. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:23,803][19739] Avg episode reward: [(0, '1101.340'), (1, '1104.560')] +[2023-10-08 19:11:24,253][21195] Updated weights for policy 0, policy_version 85220 (0.0008) +[2023-10-08 19:11:24,624][21195] Updated weights for policy 0, policy_version 85230 (0.0009) +[2023-10-08 19:11:24,992][21195] Updated weights for policy 0, policy_version 85240 (0.0008) +[2023-10-08 19:11:26,992][21194] Updated weights for policy 1, policy_version 84580 (0.0010) +[2023-10-08 19:11:27,359][21194] Updated weights for policy 1, policy_version 84590 (0.0009) +[2023-10-08 19:11:27,725][21194] Updated weights for policy 1, policy_version 84600 (0.0009) +[2023-10-08 19:11:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 173932544. Throughput: 0: 1758.2, 1: 1692.0. Samples: 43492646. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:28,803][19739] Avg episode reward: [(0, '1115.990'), (1, '1104.560')] +[2023-10-08 19:11:28,816][21195] Updated weights for policy 0, policy_version 85250 (0.0008) +[2023-10-08 19:11:29,182][21195] Updated weights for policy 0, policy_version 85260 (0.0010) +[2023-10-08 19:11:29,540][21195] Updated weights for policy 0, policy_version 85270 (0.0011) +[2023-10-08 19:11:29,907][21195] Updated weights for policy 0, policy_version 85280 (0.0011) +[2023-10-08 19:11:31,690][21194] Updated weights for policy 1, policy_version 84610 (0.0009) +[2023-10-08 19:11:32,052][21194] Updated weights for policy 1, policy_version 84620 (0.0009) +[2023-10-08 19:11:32,418][21194] Updated weights for policy 1, policy_version 84630 (0.0009) +[2023-10-08 19:11:32,784][21194] Updated weights for policy 1, policy_version 84640 (0.0008) +[2023-10-08 19:11:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 173998080. Throughput: 0: 1753.8, 1: 1718.4. Samples: 43508886. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:33,803][19739] Avg episode reward: [(0, '1115.990'), (1, '1104.560')] +[2023-10-08 19:11:33,860][21195] Updated weights for policy 0, policy_version 85290 (0.0007) +[2023-10-08 19:11:34,229][21195] Updated weights for policy 0, policy_version 85300 (0.0010) +[2023-10-08 19:11:34,598][21195] Updated weights for policy 0, policy_version 85310 (0.0008) +[2023-10-08 19:11:36,767][21194] Updated weights for policy 1, policy_version 84650 (0.0008) +[2023-10-08 19:11:37,134][21194] Updated weights for policy 1, policy_version 84660 (0.0007) +[2023-10-08 19:11:37,499][21194] Updated weights for policy 1, policy_version 84670 (0.0007) +[2023-10-08 19:11:38,569][21195] Updated weights for policy 0, policy_version 85320 (0.0009) +[2023-10-08 19:11:38,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 174063616. Throughput: 0: 1742.1, 1: 1708.2. Samples: 43523954. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:38,804][19739] Avg episode reward: [(0, '1102.120'), (1, '1104.560')] +[2023-10-08 19:11:38,946][21195] Updated weights for policy 0, policy_version 85330 (0.0010) +[2023-10-08 19:11:39,306][21195] Updated weights for policy 0, policy_version 85340 (0.0008) +[2023-10-08 19:11:41,434][21194] Updated weights for policy 1, policy_version 84680 (0.0007) +[2023-10-08 19:11:41,795][21194] Updated weights for policy 1, policy_version 84690 (0.0008) +[2023-10-08 19:11:42,157][21194] Updated weights for policy 1, policy_version 84700 (0.0008) +[2023-10-08 19:11:43,251][21195] Updated weights for policy 0, policy_version 85350 (0.0008) +[2023-10-08 19:11:43,636][21195] Updated weights for policy 0, policy_version 85360 (0.0008) +[2023-10-08 19:11:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 174129152. Throughput: 0: 1766.3, 1: 1695.3. Samples: 43544814. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:43,803][19739] Avg episode reward: [(0, '1102.120'), (1, '1119.370')] +[2023-10-08 19:11:44,000][21195] Updated weights for policy 0, policy_version 85370 (0.0010) +[2023-10-08 19:11:46,015][21194] Updated weights for policy 1, policy_version 84710 (0.0008) +[2023-10-08 19:11:46,374][21194] Updated weights for policy 1, policy_version 84720 (0.0007) +[2023-10-08 19:11:46,740][21194] Updated weights for policy 1, policy_version 84730 (0.0009) +[2023-10-08 19:11:47,819][21195] Updated weights for policy 0, policy_version 85380 (0.0008) +[2023-10-08 19:11:48,183][21195] Updated weights for policy 0, policy_version 85390 (0.0008) +[2023-10-08 19:11:48,555][21195] Updated weights for policy 0, policy_version 85400 (0.0007) +[2023-10-08 19:11:48,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 174194688. Throughput: 0: 1735.0, 1: 1720.4. Samples: 43560192. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:48,803][19739] Avg episode reward: [(0, '1116.760'), (1, '1133.580')] +[2023-10-08 19:11:50,700][21194] Updated weights for policy 1, policy_version 84740 (0.0010) +[2023-10-08 19:11:51,071][21194] Updated weights for policy 1, policy_version 84750 (0.0008) +[2023-10-08 19:11:51,435][21194] Updated weights for policy 1, policy_version 84760 (0.0009) +[2023-10-08 19:11:52,471][21195] Updated weights for policy 0, policy_version 85410 (0.0009) +[2023-10-08 19:11:52,836][21195] Updated weights for policy 0, policy_version 85420 (0.0008) +[2023-10-08 19:11:53,199][21195] Updated weights for policy 0, policy_version 85430 (0.0008) +[2023-10-08 19:11:53,567][21195] Updated weights for policy 0, policy_version 85440 (0.0008) +[2023-10-08 19:11:53,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 174292992. Throughput: 0: 1763.6, 1: 1695.3. Samples: 43575766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:53,803][19739] Avg episode reward: [(0, '1116.760'), (1, '1133.580')] +[2023-10-08 19:11:55,427][21194] Updated weights for policy 1, policy_version 84770 (0.0010) +[2023-10-08 19:11:55,801][21194] Updated weights for policy 1, policy_version 84780 (0.0008) +[2023-10-08 19:11:56,165][21194] Updated weights for policy 1, policy_version 84790 (0.0007) +[2023-10-08 19:11:56,535][21194] Updated weights for policy 1, policy_version 84800 (0.0008) +[2023-10-08 19:11:57,520][21195] Updated weights for policy 0, policy_version 85450 (0.0009) +[2023-10-08 19:11:57,885][21195] Updated weights for policy 0, policy_version 85460 (0.0009) +[2023-10-08 19:11:58,252][21195] Updated weights for policy 0, policy_version 85470 (0.0008) +[2023-10-08 19:11:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 174358528. Throughput: 0: 1744.8, 1: 1715.3. Samples: 43596512. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:11:58,803][19739] Avg episode reward: [(0, '1116.760'), (1, '1133.580')] +[2023-10-08 19:12:00,475][21194] Updated weights for policy 1, policy_version 84810 (0.0008) +[2023-10-08 19:12:00,850][21194] Updated weights for policy 1, policy_version 84820 (0.0009) +[2023-10-08 19:12:01,215][21194] Updated weights for policy 1, policy_version 84830 (0.0009) +[2023-10-08 19:12:02,139][21195] Updated weights for policy 0, policy_version 85480 (0.0010) +[2023-10-08 19:12:02,510][21195] Updated weights for policy 0, policy_version 85490 (0.0008) +[2023-10-08 19:12:02,886][21195] Updated weights for policy 0, policy_version 85500 (0.0008) +[2023-10-08 19:12:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 174424064. Throughput: 0: 1727.5, 1: 1709.5. Samples: 43611650. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:12:03,804][19739] Avg episode reward: [(0, '1130.450'), (1, '1134.320')] +[2023-10-08 19:12:03,805][20740] Saving new best policy, reward=1130.450! +[2023-10-08 19:12:05,281][21194] Updated weights for policy 1, policy_version 84840 (0.0009) +[2023-10-08 19:12:05,654][21194] Updated weights for policy 1, policy_version 84850 (0.0012) +[2023-10-08 19:12:06,014][21194] Updated weights for policy 1, policy_version 84860 (0.0010) +[2023-10-08 19:12:06,634][21195] Updated weights for policy 0, policy_version 85510 (0.0010) +[2023-10-08 19:12:06,998][21195] Updated weights for policy 0, policy_version 85520 (0.0008) +[2023-10-08 19:12:07,375][21195] Updated weights for policy 0, policy_version 85530 (0.0008) +[2023-10-08 19:12:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 174489600. Throughput: 0: 1754.5, 1: 1704.8. Samples: 43627922. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:08,803][19739] Avg episode reward: [(0, '1115.170'), (1, '1104.790')] +[2023-10-08 19:12:09,903][21194] Updated weights for policy 1, policy_version 84870 (0.0009) +[2023-10-08 19:12:10,264][21194] Updated weights for policy 1, policy_version 84880 (0.0010) +[2023-10-08 19:12:10,642][21194] Updated weights for policy 1, policy_version 84890 (0.0010) +[2023-10-08 19:12:11,086][21195] Updated weights for policy 0, policy_version 85540 (0.0007) +[2023-10-08 19:12:11,448][21195] Updated weights for policy 0, policy_version 85550 (0.0007) +[2023-10-08 19:12:11,827][21195] Updated weights for policy 0, policy_version 85560 (0.0008) +[2023-10-08 19:12:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 174555136. Throughput: 0: 1729.9, 1: 1737.0. Samples: 43648654. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:13,804][19739] Avg episode reward: [(0, '1069.560'), (1, '1109.440')] +[2023-10-08 19:12:14,564][21194] Updated weights for policy 1, policy_version 84900 (0.0009) +[2023-10-08 19:12:14,926][21194] Updated weights for policy 1, policy_version 84910 (0.0008) +[2023-10-08 19:12:15,291][21194] Updated weights for policy 1, policy_version 84920 (0.0009) +[2023-10-08 19:12:15,724][21195] Updated weights for policy 0, policy_version 85570 (0.0008) +[2023-10-08 19:12:16,104][21195] Updated weights for policy 0, policy_version 85580 (0.0007) +[2023-10-08 19:12:16,477][21195] Updated weights for policy 0, policy_version 85590 (0.0010) +[2023-10-08 19:12:16,848][21195] Updated weights for policy 0, policy_version 85600 (0.0010) +[2023-10-08 19:12:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 174620672. Throughput: 0: 1739.1, 1: 1707.7. Samples: 43663994. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:18,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1110.000')] +[2023-10-08 19:12:19,244][21194] Updated weights for policy 1, policy_version 84930 (0.0009) +[2023-10-08 19:12:19,602][21194] Updated weights for policy 1, policy_version 84940 (0.0007) +[2023-10-08 19:12:19,969][21194] Updated weights for policy 1, policy_version 84950 (0.0007) +[2023-10-08 19:12:20,329][21194] Updated weights for policy 1, policy_version 84960 (0.0007) +[2023-10-08 19:12:20,823][21195] Updated weights for policy 0, policy_version 85610 (0.0011) +[2023-10-08 19:12:21,181][21195] Updated weights for policy 0, policy_version 85620 (0.0009) +[2023-10-08 19:12:21,562][21195] Updated weights for policy 0, policy_version 85630 (0.0009) +[2023-10-08 19:12:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 174686208. Throughput: 0: 1730.7, 1: 1729.0. Samples: 43679638. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:23,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:24,282][21194] Updated weights for policy 1, policy_version 84970 (0.0009) +[2023-10-08 19:12:24,656][21194] Updated weights for policy 1, policy_version 84980 (0.0008) +[2023-10-08 19:12:25,022][21194] Updated weights for policy 1, policy_version 84990 (0.0007) +[2023-10-08 19:12:25,458][21195] Updated weights for policy 0, policy_version 85640 (0.0008) +[2023-10-08 19:12:25,824][21195] Updated weights for policy 0, policy_version 85650 (0.0008) +[2023-10-08 19:12:26,186][21195] Updated weights for policy 0, policy_version 85660 (0.0007) +[2023-10-08 19:12:28,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 174751744. Throughput: 0: 1732.1, 1: 1745.5. Samples: 43701308. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:28,804][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:28,884][21194] Updated weights for policy 1, policy_version 85000 (0.0009) +[2023-10-08 19:12:29,257][21194] Updated weights for policy 1, policy_version 85010 (0.0008) +[2023-10-08 19:12:29,616][21194] Updated weights for policy 1, policy_version 85020 (0.0008) +[2023-10-08 19:12:30,025][21195] Updated weights for policy 0, policy_version 85670 (0.0009) +[2023-10-08 19:12:30,409][21195] Updated weights for policy 0, policy_version 85680 (0.0008) +[2023-10-08 19:12:30,779][21195] Updated weights for policy 0, policy_version 85690 (0.0008) +[2023-10-08 19:12:33,435][21194] Updated weights for policy 1, policy_version 85030 (0.0009) +[2023-10-08 19:12:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 174817280. Throughput: 0: 1760.5, 1: 1719.6. Samples: 43716798. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:33,804][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:33,810][21194] Updated weights for policy 1, policy_version 85040 (0.0011) +[2023-10-08 19:12:34,168][21194] Updated weights for policy 1, policy_version 85050 (0.0011) +[2023-10-08 19:12:34,814][21195] Updated weights for policy 0, policy_version 85700 (0.0008) +[2023-10-08 19:12:35,190][21195] Updated weights for policy 0, policy_version 85710 (0.0011) +[2023-10-08 19:12:35,553][21195] Updated weights for policy 0, policy_version 85720 (0.0008) +[2023-10-08 19:12:37,968][21194] Updated weights for policy 1, policy_version 85060 (0.0009) +[2023-10-08 19:12:38,338][21194] Updated weights for policy 1, policy_version 85070 (0.0009) +[2023-10-08 19:12:38,700][21194] Updated weights for policy 1, policy_version 85080 (0.0008) +[2023-10-08 19:12:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13662.6). Total num frames: 174882816. Throughput: 0: 1733.0, 1: 1747.2. Samples: 43732378. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:38,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:39,337][21195] Updated weights for policy 0, policy_version 85730 (0.0008) +[2023-10-08 19:12:39,705][21195] Updated weights for policy 0, policy_version 85740 (0.0008) +[2023-10-08 19:12:40,076][21195] Updated weights for policy 0, policy_version 85750 (0.0008) +[2023-10-08 19:12:40,443][21195] Updated weights for policy 0, policy_version 85760 (0.0008) +[2023-10-08 19:12:42,652][21194] Updated weights for policy 1, policy_version 85090 (0.0009) +[2023-10-08 19:12:43,030][21194] Updated weights for policy 1, policy_version 85100 (0.0008) +[2023-10-08 19:12:43,400][21194] Updated weights for policy 1, policy_version 85110 (0.0007) +[2023-10-08 19:12:43,761][21194] Updated weights for policy 1, policy_version 85120 (0.0008) +[2023-10-08 19:12:43,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 174981120. Throughput: 0: 1747.9, 1: 1735.2. Samples: 43753254. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:43,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:44,408][21195] Updated weights for policy 0, policy_version 85770 (0.0007) +[2023-10-08 19:12:44,769][21195] Updated weights for policy 0, policy_version 85780 (0.0009) +[2023-10-08 19:12:45,137][21195] Updated weights for policy 0, policy_version 85790 (0.0008) +[2023-10-08 19:12:47,775][21194] Updated weights for policy 1, policy_version 85130 (0.0009) +[2023-10-08 19:12:48,139][21194] Updated weights for policy 1, policy_version 85140 (0.0009) +[2023-10-08 19:12:48,499][21194] Updated weights for policy 1, policy_version 85150 (0.0010) +[2023-10-08 19:12:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 175046656. Throughput: 0: 1765.7, 1: 1738.5. Samples: 43769342. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:48,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:49,006][21195] Updated weights for policy 0, policy_version 85800 (0.0009) +[2023-10-08 19:12:49,385][21195] Updated weights for policy 0, policy_version 85810 (0.0007) +[2023-10-08 19:12:49,758][21195] Updated weights for policy 0, policy_version 85820 (0.0008) +[2023-10-08 19:12:52,287][21194] Updated weights for policy 1, policy_version 85160 (0.0008) +[2023-10-08 19:12:52,643][21194] Updated weights for policy 1, policy_version 85170 (0.0007) +[2023-10-08 19:12:53,018][21194] Updated weights for policy 1, policy_version 85180 (0.0008) +[2023-10-08 19:12:53,538][21195] Updated weights for policy 0, policy_version 85830 (0.0010) +[2023-10-08 19:12:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 175112192. Throughput: 0: 1739.6, 1: 1744.6. Samples: 43784712. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:53,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.990')] +[2023-10-08 19:12:53,911][21195] Updated weights for policy 0, policy_version 85840 (0.0010) +[2023-10-08 19:12:54,277][21195] Updated weights for policy 0, policy_version 85850 (0.0010) +[2023-10-08 19:12:57,232][21194] Updated weights for policy 1, policy_version 85190 (0.0008) +[2023-10-08 19:12:57,602][21194] Updated weights for policy 1, policy_version 85200 (0.0007) +[2023-10-08 19:12:57,973][21194] Updated weights for policy 1, policy_version 85210 (0.0008) +[2023-10-08 19:12:58,295][21195] Updated weights for policy 0, policy_version 85860 (0.0009) +[2023-10-08 19:12:58,662][21195] Updated weights for policy 0, policy_version 85870 (0.0010) +[2023-10-08 19:12:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 175177728. Throughput: 0: 1758.5, 1: 1716.7. Samples: 43805036. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:12:58,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1101.950')] +[2023-10-08 19:12:59,030][21195] Updated weights for policy 0, policy_version 85880 (0.0009) +[2023-10-08 19:13:01,892][21194] Updated weights for policy 1, policy_version 85220 (0.0008) +[2023-10-08 19:13:02,250][21194] Updated weights for policy 1, policy_version 85230 (0.0007) +[2023-10-08 19:13:02,620][21194] Updated weights for policy 1, policy_version 85240 (0.0008) +[2023-10-08 19:13:02,924][21195] Updated weights for policy 0, policy_version 85890 (0.0010) +[2023-10-08 19:13:03,302][21195] Updated weights for policy 0, policy_version 85900 (0.0008) +[2023-10-08 19:13:03,665][21195] Updated weights for policy 0, policy_version 85910 (0.0009) +[2023-10-08 19:13:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 175243264. Throughput: 0: 1736.3, 1: 1740.3. Samples: 43820438. Policy #0 lag: (min: 22.0, avg: 37.8, max: 54.0) +[2023-10-08 19:13:03,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1102.180')] +[2023-10-08 19:13:04,030][21195] Updated weights for policy 0, policy_version 85920 (0.0008) +[2023-10-08 19:13:06,738][21194] Updated weights for policy 1, policy_version 85250 (0.0008) +[2023-10-08 19:13:07,098][21194] Updated weights for policy 1, policy_version 85260 (0.0010) +[2023-10-08 19:13:07,464][21194] Updated weights for policy 1, policy_version 85270 (0.0008) +[2023-10-08 19:13:07,795][21195] Updated weights for policy 0, policy_version 85930 (0.0008) +[2023-10-08 19:13:07,828][21194] Updated weights for policy 1, policy_version 85280 (0.0009) +[2023-10-08 19:13:08,168][21195] Updated weights for policy 0, policy_version 85940 (0.0008) +[2023-10-08 19:13:08,539][21195] Updated weights for policy 0, policy_version 85950 (0.0008) +[2023-10-08 19:13:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 175341568. Throughput: 0: 1763.6, 1: 1718.7. Samples: 43836340. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:08,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1102.180')] +[2023-10-08 19:13:11,739][21194] Updated weights for policy 1, policy_version 85290 (0.0007) +[2023-10-08 19:13:12,100][21194] Updated weights for policy 1, policy_version 85300 (0.0007) +[2023-10-08 19:13:12,461][21194] Updated weights for policy 1, policy_version 85310 (0.0009) +[2023-10-08 19:13:12,522][21195] Updated weights for policy 0, policy_version 85960 (0.0009) +[2023-10-08 19:13:12,888][21195] Updated weights for policy 0, policy_version 85970 (0.0008) +[2023-10-08 19:13:13,264][21195] Updated weights for policy 0, policy_version 85980 (0.0008) +[2023-10-08 19:13:13,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 175407104. Throughput: 0: 1743.6, 1: 1699.6. Samples: 43856252. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:13,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1102.180')] +[2023-10-08 19:13:13,813][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000085312_87359488.pth... +[2023-10-08 19:13:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000085984_88047616.pth... +[2023-10-08 19:13:13,850][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000084352_86376448.pth +[2023-10-08 19:13:13,852][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000083712_85721088.pth +[2023-10-08 19:13:16,549][21194] Updated weights for policy 1, policy_version 85320 (0.0008) +[2023-10-08 19:13:16,917][21194] Updated weights for policy 1, policy_version 85330 (0.0007) +[2023-10-08 19:13:17,281][21194] Updated weights for policy 1, policy_version 85340 (0.0008) +[2023-10-08 19:13:17,337][21195] Updated weights for policy 0, policy_version 85990 (0.0008) +[2023-10-08 19:13:17,726][21195] Updated weights for policy 0, policy_version 86000 (0.0008) +[2023-10-08 19:13:18,086][21195] Updated weights for policy 0, policy_version 86010 (0.0009) +[2023-10-08 19:13:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 175472640. Throughput: 0: 1722.0, 1: 1728.0. Samples: 43872044. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:18,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1102.180')] +[2023-10-08 19:13:21,334][21194] Updated weights for policy 1, policy_version 85350 (0.0009) +[2023-10-08 19:13:21,697][21194] Updated weights for policy 1, policy_version 85360 (0.0009) +[2023-10-08 19:13:21,983][21195] Updated weights for policy 0, policy_version 86020 (0.0007) +[2023-10-08 19:13:22,064][21194] Updated weights for policy 1, policy_version 85370 (0.0009) +[2023-10-08 19:13:22,344][21195] Updated weights for policy 0, policy_version 86030 (0.0009) +[2023-10-08 19:13:22,709][21195] Updated weights for policy 0, policy_version 86040 (0.0010) +[2023-10-08 19:13:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 175538176. Throughput: 0: 1750.9, 1: 1699.4. Samples: 43887642. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:23,803][19739] Avg episode reward: [(0, '1069.560'), (1, '1103.270')] +[2023-10-08 19:13:26,022][21194] Updated weights for policy 1, policy_version 85380 (0.0008) +[2023-10-08 19:13:26,381][21194] Updated weights for policy 1, policy_version 85390 (0.0010) +[2023-10-08 19:13:26,656][21195] Updated weights for policy 0, policy_version 86050 (0.0010) +[2023-10-08 19:13:26,737][21194] Updated weights for policy 1, policy_version 85400 (0.0010) +[2023-10-08 19:13:27,016][21195] Updated weights for policy 0, policy_version 86060 (0.0007) +[2023-10-08 19:13:27,381][21195] Updated weights for policy 0, policy_version 86070 (0.0011) +[2023-10-08 19:13:27,750][21195] Updated weights for policy 0, policy_version 86080 (0.0009) +[2023-10-08 19:13:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 175603712. Throughput: 0: 1717.3, 1: 1711.2. Samples: 43907536. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:28,803][19739] Avg episode reward: [(0, '1069.570'), (1, '1103.270')] +[2023-10-08 19:13:30,531][21194] Updated weights for policy 1, policy_version 85410 (0.0009) +[2023-10-08 19:13:30,895][21194] Updated weights for policy 1, policy_version 85420 (0.0007) +[2023-10-08 19:13:31,260][21194] Updated weights for policy 1, policy_version 85430 (0.0007) +[2023-10-08 19:13:31,622][21194] Updated weights for policy 1, policy_version 85440 (0.0007) +[2023-10-08 19:13:31,744][21195] Updated weights for policy 0, policy_version 86090 (0.0010) +[2023-10-08 19:13:32,112][21195] Updated weights for policy 0, policy_version 86100 (0.0010) +[2023-10-08 19:13:32,471][21195] Updated weights for policy 0, policy_version 86110 (0.0008) +[2023-10-08 19:13:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 175669248. Throughput: 0: 1715.9, 1: 1713.3. Samples: 43923656. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:33,803][19739] Avg episode reward: [(0, '1069.570'), (1, '1103.270')] +[2023-10-08 19:13:35,661][21194] Updated weights for policy 1, policy_version 85450 (0.0010) +[2023-10-08 19:13:36,024][21194] Updated weights for policy 1, policy_version 85460 (0.0011) +[2023-10-08 19:13:36,391][21194] Updated weights for policy 1, policy_version 85470 (0.0008) +[2023-10-08 19:13:36,448][21195] Updated weights for policy 0, policy_version 86120 (0.0007) +[2023-10-08 19:13:36,818][21195] Updated weights for policy 0, policy_version 86130 (0.0008) +[2023-10-08 19:13:37,186][21195] Updated weights for policy 0, policy_version 86140 (0.0007) +[2023-10-08 19:13:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 175734784. Throughput: 0: 1728.2, 1: 1695.3. Samples: 43938768. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:38,803][19739] Avg episode reward: [(0, '1069.570'), (1, '1103.270')] +[2023-10-08 19:13:40,326][21194] Updated weights for policy 1, policy_version 85480 (0.0010) +[2023-10-08 19:13:40,687][21194] Updated weights for policy 1, policy_version 85490 (0.0010) +[2023-10-08 19:13:41,061][21194] Updated weights for policy 1, policy_version 85500 (0.0010) +[2023-10-08 19:13:41,135][21195] Updated weights for policy 0, policy_version 86150 (0.0007) +[2023-10-08 19:13:41,508][21195] Updated weights for policy 0, policy_version 86160 (0.0007) +[2023-10-08 19:13:41,874][21195] Updated weights for policy 0, policy_version 86170 (0.0007) +[2023-10-08 19:13:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 175800320. Throughput: 0: 1713.0, 1: 1720.2. Samples: 43959530. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:43,804][19739] Avg episode reward: [(0, '1069.570'), (1, '1103.270')] +[2023-10-08 19:13:45,017][21194] Updated weights for policy 1, policy_version 85510 (0.0007) +[2023-10-08 19:13:45,382][21194] Updated weights for policy 1, policy_version 85520 (0.0008) +[2023-10-08 19:13:45,747][21194] Updated weights for policy 1, policy_version 85530 (0.0010) +[2023-10-08 19:13:45,783][21195] Updated weights for policy 0, policy_version 86180 (0.0008) +[2023-10-08 19:13:46,141][21195] Updated weights for policy 0, policy_version 86190 (0.0009) +[2023-10-08 19:13:46,516][21195] Updated weights for policy 0, policy_version 86200 (0.0009) +[2023-10-08 19:13:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 175865856. Throughput: 0: 1727.6, 1: 1700.6. Samples: 43974710. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:48,803][19739] Avg episode reward: [(0, '1069.480'), (1, '1103.200')] +[2023-10-08 19:13:49,698][21194] Updated weights for policy 1, policy_version 85540 (0.0008) +[2023-10-08 19:13:50,052][21194] Updated weights for policy 1, policy_version 85550 (0.0009) +[2023-10-08 19:13:50,412][21194] Updated weights for policy 1, policy_version 85560 (0.0007) +[2023-10-08 19:13:50,561][21195] Updated weights for policy 0, policy_version 86210 (0.0010) +[2023-10-08 19:13:50,926][21195] Updated weights for policy 0, policy_version 86220 (0.0009) +[2023-10-08 19:13:51,303][21195] Updated weights for policy 0, policy_version 86230 (0.0009) +[2023-10-08 19:13:51,673][21195] Updated weights for policy 0, policy_version 86240 (0.0007) +[2023-10-08 19:13:53,802][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 175931392. Throughput: 0: 1699.8, 1: 1715.6. Samples: 43990036. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:53,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1059.190')] +[2023-10-08 19:13:54,268][21194] Updated weights for policy 1, policy_version 85570 (0.0008) +[2023-10-08 19:13:54,642][21194] Updated weights for policy 1, policy_version 85580 (0.0010) +[2023-10-08 19:13:55,002][21194] Updated weights for policy 1, policy_version 85590 (0.0007) +[2023-10-08 19:13:55,333][21195] Updated weights for policy 0, policy_version 86250 (0.0007) +[2023-10-08 19:13:55,368][21194] Updated weights for policy 1, policy_version 85600 (0.0009) +[2023-10-08 19:13:55,701][21195] Updated weights for policy 0, policy_version 86260 (0.0007) +[2023-10-08 19:13:56,070][21195] Updated weights for policy 0, policy_version 86270 (0.0007) +[2023-10-08 19:13:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 175996928. Throughput: 0: 1719.6, 1: 1736.9. Samples: 44011794. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 19:13:58,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1041.600')] +[2023-10-08 19:13:59,277][21194] Updated weights for policy 1, policy_version 85610 (0.0008) +[2023-10-08 19:13:59,640][21194] Updated weights for policy 1, policy_version 85620 (0.0007) +[2023-10-08 19:13:59,956][21195] Updated weights for policy 0, policy_version 86280 (0.0009) +[2023-10-08 19:14:00,012][21194] Updated weights for policy 1, policy_version 85630 (0.0007) +[2023-10-08 19:14:00,323][21195] Updated weights for policy 0, policy_version 86290 (0.0009) +[2023-10-08 19:14:00,682][21195] Updated weights for policy 0, policy_version 86300 (0.0007) +[2023-10-08 19:14:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 176062464. Throughput: 0: 1740.6, 1: 1706.5. Samples: 44027164. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:03,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1041.600')] +[2023-10-08 19:14:03,982][21194] Updated weights for policy 1, policy_version 85640 (0.0010) +[2023-10-08 19:14:04,345][21194] Updated weights for policy 1, policy_version 85650 (0.0011) +[2023-10-08 19:14:04,706][21194] Updated weights for policy 1, policy_version 85660 (0.0009) +[2023-10-08 19:14:04,757][21195] Updated weights for policy 0, policy_version 86310 (0.0008) +[2023-10-08 19:14:05,142][21195] Updated weights for policy 0, policy_version 86320 (0.0008) +[2023-10-08 19:14:05,502][21195] Updated weights for policy 0, policy_version 86330 (0.0009) +[2023-10-08 19:14:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 176128000. Throughput: 0: 1709.5, 1: 1728.7. Samples: 44042360. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:08,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1041.600')] +[2023-10-08 19:14:08,824][21194] Updated weights for policy 1, policy_version 85670 (0.0009) +[2023-10-08 19:14:09,178][21194] Updated weights for policy 1, policy_version 85680 (0.0007) +[2023-10-08 19:14:09,247][21195] Updated weights for policy 0, policy_version 86340 (0.0009) +[2023-10-08 19:14:09,542][21194] Updated weights for policy 1, policy_version 85690 (0.0007) +[2023-10-08 19:14:09,616][21195] Updated weights for policy 0, policy_version 86350 (0.0010) +[2023-10-08 19:14:09,987][21195] Updated weights for policy 0, policy_version 86360 (0.0008) +[2023-10-08 19:14:13,654][21194] Updated weights for policy 1, policy_version 85700 (0.0008) +[2023-10-08 19:14:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 176193536. Throughput: 0: 1745.2, 1: 1728.7. Samples: 44063860. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:13,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1041.990')] +[2023-10-08 19:14:13,864][21195] Updated weights for policy 0, policy_version 86370 (0.0010) +[2023-10-08 19:14:14,018][21194] Updated weights for policy 1, policy_version 85710 (0.0008) +[2023-10-08 19:14:14,230][21195] Updated weights for policy 0, policy_version 86380 (0.0009) +[2023-10-08 19:14:14,377][21194] Updated weights for policy 1, policy_version 85720 (0.0008) +[2023-10-08 19:14:14,595][21195] Updated weights for policy 0, policy_version 86390 (0.0007) +[2023-10-08 19:14:14,963][21195] Updated weights for policy 0, policy_version 86400 (0.0007) +[2023-10-08 19:14:18,263][21194] Updated weights for policy 1, policy_version 85730 (0.0007) +[2023-10-08 19:14:18,636][21194] Updated weights for policy 1, policy_version 85740 (0.0009) +[2023-10-08 19:14:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 176259072. Throughput: 0: 1737.2, 1: 1713.7. Samples: 44078948. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:18,804][19739] Avg episode reward: [(0, '1069.230'), (1, '1042.050')] +[2023-10-08 19:14:18,908][21195] Updated weights for policy 0, policy_version 86410 (0.0009) +[2023-10-08 19:14:19,001][21194] Updated weights for policy 1, policy_version 85750 (0.0008) +[2023-10-08 19:14:19,276][21195] Updated weights for policy 0, policy_version 86420 (0.0008) +[2023-10-08 19:14:19,361][21194] Updated weights for policy 1, policy_version 85760 (0.0010) +[2023-10-08 19:14:19,636][21195] Updated weights for policy 0, policy_version 86430 (0.0009) +[2023-10-08 19:14:23,407][21194] Updated weights for policy 1, policy_version 85770 (0.0009) +[2023-10-08 19:14:23,673][21195] Updated weights for policy 0, policy_version 86440 (0.0010) +[2023-10-08 19:14:23,777][21194] Updated weights for policy 1, policy_version 85780 (0.0008) +[2023-10-08 19:14:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 176324608. Throughput: 0: 1724.4, 1: 1732.6. Samples: 44094336. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:23,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1034.790')] +[2023-10-08 19:14:24,040][21195] Updated weights for policy 0, policy_version 86450 (0.0008) +[2023-10-08 19:14:24,142][21194] Updated weights for policy 1, policy_version 85790 (0.0009) +[2023-10-08 19:14:24,405][21195] Updated weights for policy 0, policy_version 86460 (0.0007) +[2023-10-08 19:14:28,129][21194] Updated weights for policy 1, policy_version 85800 (0.0008) +[2023-10-08 19:14:28,356][21195] Updated weights for policy 0, policy_version 86470 (0.0007) +[2023-10-08 19:14:28,489][21194] Updated weights for policy 1, policy_version 85810 (0.0008) +[2023-10-08 19:14:28,721][21195] Updated weights for policy 0, policy_version 86480 (0.0009) +[2023-10-08 19:14:28,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 176390144. Throughput: 0: 1745.2, 1: 1724.9. Samples: 44115684. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:28,803][19739] Avg episode reward: [(0, '1069.230'), (1, '1034.790')] +[2023-10-08 19:14:28,856][21194] Updated weights for policy 1, policy_version 85820 (0.0008) +[2023-10-08 19:14:29,082][21195] Updated weights for policy 0, policy_version 86490 (0.0009) +[2023-10-08 19:14:32,767][21194] Updated weights for policy 1, policy_version 85830 (0.0008) +[2023-10-08 19:14:33,012][21195] Updated weights for policy 0, policy_version 86500 (0.0008) +[2023-10-08 19:14:33,137][21194] Updated weights for policy 1, policy_version 85840 (0.0008) +[2023-10-08 19:14:33,378][21195] Updated weights for policy 0, policy_version 86510 (0.0009) +[2023-10-08 19:14:33,505][21194] Updated weights for policy 1, policy_version 85850 (0.0009) +[2023-10-08 19:14:33,755][21195] Updated weights for policy 0, policy_version 86520 (0.0008) +[2023-10-08 19:14:33,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 176488448. Throughput: 0: 1728.6, 1: 1731.1. Samples: 44130394. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:33,804][19739] Avg episode reward: [(0, '1077.900'), (1, '1034.790')] +[2023-10-08 19:14:37,554][21194] Updated weights for policy 1, policy_version 85860 (0.0008) +[2023-10-08 19:14:37,582][21195] Updated weights for policy 0, policy_version 86530 (0.0008) +[2023-10-08 19:14:37,925][21194] Updated weights for policy 1, policy_version 85870 (0.0008) +[2023-10-08 19:14:37,947][21195] Updated weights for policy 0, policy_version 86540 (0.0008) +[2023-10-08 19:14:38,293][21194] Updated weights for policy 1, policy_version 85880 (0.0008) +[2023-10-08 19:14:38,324][21195] Updated weights for policy 0, policy_version 86550 (0.0010) +[2023-10-08 19:14:38,685][21195] Updated weights for policy 0, policy_version 86560 (0.0010) +[2023-10-08 19:14:38,802][19739] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 176586752. Throughput: 0: 1754.2, 1: 1726.0. Samples: 44146644. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:38,803][19739] Avg episode reward: [(0, '1077.900'), (1, '1045.010')] +[2023-10-08 19:14:42,350][21194] Updated weights for policy 1, policy_version 85890 (0.0008) +[2023-10-08 19:14:42,664][21195] Updated weights for policy 0, policy_version 86570 (0.0007) +[2023-10-08 19:14:42,715][21194] Updated weights for policy 1, policy_version 85900 (0.0008) +[2023-10-08 19:14:43,037][21195] Updated weights for policy 0, policy_version 86580 (0.0007) +[2023-10-08 19:14:43,072][21194] Updated weights for policy 1, policy_version 85910 (0.0008) +[2023-10-08 19:14:43,406][21195] Updated weights for policy 0, policy_version 86590 (0.0008) +[2023-10-08 19:14:43,444][21194] Updated weights for policy 1, policy_version 85920 (0.0009) +[2023-10-08 19:14:43,802][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 176652288. Throughput: 0: 1734.1, 1: 1699.0. Samples: 44166282. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:43,803][19739] Avg episode reward: [(0, '1084.290'), (1, '1045.010')] +[2023-10-08 19:14:47,402][21195] Updated weights for policy 0, policy_version 86600 (0.0007) +[2023-10-08 19:14:47,413][21194] Updated weights for policy 1, policy_version 85930 (0.0010) +[2023-10-08 19:14:47,769][21194] Updated weights for policy 1, policy_version 85940 (0.0008) +[2023-10-08 19:14:47,773][21195] Updated weights for policy 0, policy_version 86610 (0.0008) +[2023-10-08 19:14:48,138][21194] Updated weights for policy 1, policy_version 85950 (0.0007) +[2023-10-08 19:14:48,140][21195] Updated weights for policy 0, policy_version 86620 (0.0009) +[2023-10-08 19:14:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 176717824. Throughput: 0: 1714.2, 1: 1719.5. Samples: 44181680. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:48,803][19739] Avg episode reward: [(0, '1064.680'), (1, '1045.010')] +[2023-10-08 19:14:51,971][21194] Updated weights for policy 1, policy_version 85960 (0.0009) +[2023-10-08 19:14:52,005][21195] Updated weights for policy 0, policy_version 86630 (0.0009) +[2023-10-08 19:14:52,337][21194] Updated weights for policy 1, policy_version 85970 (0.0008) +[2023-10-08 19:14:52,388][21195] Updated weights for policy 0, policy_version 86640 (0.0007) +[2023-10-08 19:14:52,700][21194] Updated weights for policy 1, policy_version 85980 (0.0008) +[2023-10-08 19:14:52,747][21195] Updated weights for policy 0, policy_version 86650 (0.0008) +[2023-10-08 19:14:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 176783360. Throughput: 0: 1741.2, 1: 1715.2. Samples: 44197898. Policy #0 lag: (min: 15.0, avg: 22.1, max: 47.0) +[2023-10-08 19:14:53,804][19739] Avg episode reward: [(0, '1042.210'), (1, '1045.010')] +[2023-10-08 19:14:56,628][21194] Updated weights for policy 1, policy_version 85990 (0.0009) +[2023-10-08 19:14:56,758][21195] Updated weights for policy 0, policy_version 86660 (0.0007) +[2023-10-08 19:14:56,998][21194] Updated weights for policy 1, policy_version 86000 (0.0007) +[2023-10-08 19:14:57,117][21195] Updated weights for policy 0, policy_version 86670 (0.0008) +[2023-10-08 19:14:57,365][21194] Updated weights for policy 1, policy_version 86010 (0.0008) +[2023-10-08 19:14:57,493][21195] Updated weights for policy 0, policy_version 86680 (0.0009) +[2023-10-08 19:14:58,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 176848896. Throughput: 0: 1708.2, 1: 1695.6. Samples: 44217028. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:14:58,804][19739] Avg episode reward: [(0, '1057.740'), (1, '1044.820')] +[2023-10-08 19:15:01,267][21194] Updated weights for policy 1, policy_version 86020 (0.0007) +[2023-10-08 19:15:01,469][21195] Updated weights for policy 0, policy_version 86690 (0.0008) +[2023-10-08 19:15:01,642][21194] Updated weights for policy 1, policy_version 86030 (0.0008) +[2023-10-08 19:15:01,842][21195] Updated weights for policy 0, policy_version 86700 (0.0008) +[2023-10-08 19:15:02,010][21194] Updated weights for policy 1, policy_version 86040 (0.0008) +[2023-10-08 19:15:02,206][21195] Updated weights for policy 0, policy_version 86710 (0.0008) +[2023-10-08 19:15:02,573][21195] Updated weights for policy 0, policy_version 86720 (0.0007) +[2023-10-08 19:15:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 176914432. Throughput: 0: 1710.9, 1: 1727.8. Samples: 44233688. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:03,804][19739] Avg episode reward: [(0, '1073.120'), (1, '1044.820')] +[2023-10-08 19:15:06,075][21194] Updated weights for policy 1, policy_version 86050 (0.0009) +[2023-10-08 19:15:06,439][21194] Updated weights for policy 1, policy_version 86060 (0.0008) +[2023-10-08 19:15:06,557][21195] Updated weights for policy 0, policy_version 86730 (0.0008) +[2023-10-08 19:15:06,799][21194] Updated weights for policy 1, policy_version 86070 (0.0008) +[2023-10-08 19:15:06,929][21195] Updated weights for policy 0, policy_version 86740 (0.0009) +[2023-10-08 19:15:07,164][21194] Updated weights for policy 1, policy_version 86080 (0.0009) +[2023-10-08 19:15:07,294][21195] Updated weights for policy 0, policy_version 86750 (0.0009) +[2023-10-08 19:15:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 176979968. Throughput: 0: 1721.8, 1: 1698.0. Samples: 44248226. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:08,805][19739] Avg episode reward: [(0, '1073.120'), (1, '1044.820')] +[2023-10-08 19:15:11,127][21195] Updated weights for policy 0, policy_version 86760 (0.0009) +[2023-10-08 19:15:11,220][21194] Updated weights for policy 1, policy_version 86090 (0.0009) +[2023-10-08 19:15:11,492][21195] Updated weights for policy 0, policy_version 86770 (0.0008) +[2023-10-08 19:15:11,584][21194] Updated weights for policy 1, policy_version 86100 (0.0009) +[2023-10-08 19:15:11,858][21195] Updated weights for policy 0, policy_version 86780 (0.0008) +[2023-10-08 19:15:11,947][21194] Updated weights for policy 1, policy_version 86110 (0.0009) +[2023-10-08 19:15:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 177045504. Throughput: 0: 1705.4, 1: 1696.9. Samples: 44268788. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:13,803][19739] Avg episode reward: [(0, '1073.120'), (1, '1044.820')] +[2023-10-08 19:15:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000086112_88178688.pth... +[2023-10-08 19:15:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000086784_88866816.pth... +[2023-10-08 19:15:13,842][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000084512_86540288.pth +[2023-10-08 19:15:13,850][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000085152_87195648.pth +[2023-10-08 19:15:15,820][21194] Updated weights for policy 1, policy_version 86120 (0.0009) +[2023-10-08 19:15:15,972][21195] Updated weights for policy 0, policy_version 86790 (0.0008) +[2023-10-08 19:15:16,189][21194] Updated weights for policy 1, policy_version 86130 (0.0007) +[2023-10-08 19:15:16,333][21195] Updated weights for policy 0, policy_version 86800 (0.0008) +[2023-10-08 19:15:16,545][21194] Updated weights for policy 1, policy_version 86140 (0.0009) +[2023-10-08 19:15:16,701][21195] Updated weights for policy 0, policy_version 86810 (0.0009) +[2023-10-08 19:15:18,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 177111040. Throughput: 0: 1727.4, 1: 1707.5. Samples: 44284962. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:18,803][19739] Avg episode reward: [(0, '1073.120'), (1, '1044.820')] +[2023-10-08 19:15:20,606][21194] Updated weights for policy 1, policy_version 86150 (0.0008) +[2023-10-08 19:15:20,703][21195] Updated weights for policy 0, policy_version 86820 (0.0008) +[2023-10-08 19:15:20,978][21194] Updated weights for policy 1, policy_version 86160 (0.0007) +[2023-10-08 19:15:21,066][21195] Updated weights for policy 0, policy_version 86830 (0.0007) +[2023-10-08 19:15:21,338][21194] Updated weights for policy 1, policy_version 86170 (0.0009) +[2023-10-08 19:15:21,436][21195] Updated weights for policy 0, policy_version 86840 (0.0007) +[2023-10-08 19:15:23,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 177176576. Throughput: 0: 1702.8, 1: 1695.2. Samples: 44299556. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:23,803][19739] Avg episode reward: [(0, '1071.650'), (1, '1044.820')] +[2023-10-08 19:15:25,311][21194] Updated weights for policy 1, policy_version 86180 (0.0008) +[2023-10-08 19:15:25,379][21195] Updated weights for policy 0, policy_version 86850 (0.0009) +[2023-10-08 19:15:25,673][21194] Updated weights for policy 1, policy_version 86190 (0.0008) +[2023-10-08 19:15:25,748][21195] Updated weights for policy 0, policy_version 86860 (0.0010) +[2023-10-08 19:15:26,038][21194] Updated weights for policy 1, policy_version 86200 (0.0010) +[2023-10-08 19:15:26,114][21195] Updated weights for policy 0, policy_version 86870 (0.0007) +[2023-10-08 19:15:26,483][21195] Updated weights for policy 0, policy_version 86880 (0.0008) +[2023-10-08 19:15:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 177242112. Throughput: 0: 1718.0, 1: 1717.1. Samples: 44320860. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:28,803][19739] Avg episode reward: [(0, '1071.650'), (1, '1044.820')] +[2023-10-08 19:15:30,031][21194] Updated weights for policy 1, policy_version 86210 (0.0007) +[2023-10-08 19:15:30,383][21194] Updated weights for policy 1, policy_version 86220 (0.0007) +[2023-10-08 19:15:30,493][21195] Updated weights for policy 0, policy_version 86890 (0.0009) +[2023-10-08 19:15:30,749][21194] Updated weights for policy 1, policy_version 86230 (0.0008) +[2023-10-08 19:15:30,859][21195] Updated weights for policy 0, policy_version 86900 (0.0008) +[2023-10-08 19:15:31,112][21194] Updated weights for policy 1, policy_version 86240 (0.0007) +[2023-10-08 19:15:31,224][21195] Updated weights for policy 0, policy_version 86910 (0.0008) +[2023-10-08 19:15:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 177307648. Throughput: 0: 1732.6, 1: 1697.2. Samples: 44336022. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:33,804][19739] Avg episode reward: [(0, '1071.650'), (1, '1044.820')] +[2023-10-08 19:15:35,022][21194] Updated weights for policy 1, policy_version 86250 (0.0009) +[2023-10-08 19:15:35,266][21195] Updated weights for policy 0, policy_version 86920 (0.0007) +[2023-10-08 19:15:35,386][21194] Updated weights for policy 1, policy_version 86260 (0.0008) +[2023-10-08 19:15:35,630][21195] Updated weights for policy 0, policy_version 86930 (0.0008) +[2023-10-08 19:15:35,752][21194] Updated weights for policy 1, policy_version 86270 (0.0009) +[2023-10-08 19:15:35,998][21195] Updated weights for policy 0, policy_version 86940 (0.0007) +[2023-10-08 19:15:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 177373184. Throughput: 0: 1704.1, 1: 1704.1. Samples: 44351268. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:38,804][19739] Avg episode reward: [(0, '1071.720'), (1, '1044.820')] +[2023-10-08 19:15:39,772][21194] Updated weights for policy 1, policy_version 86280 (0.0009) +[2023-10-08 19:15:39,975][21195] Updated weights for policy 0, policy_version 86950 (0.0007) +[2023-10-08 19:15:40,130][21194] Updated weights for policy 1, policy_version 86290 (0.0009) +[2023-10-08 19:15:40,362][21195] Updated weights for policy 0, policy_version 86960 (0.0009) +[2023-10-08 19:15:40,502][21194] Updated weights for policy 1, policy_version 86300 (0.0008) +[2023-10-08 19:15:40,735][21195] Updated weights for policy 0, policy_version 86970 (0.0008) +[2023-10-08 19:15:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 177438720. Throughput: 0: 1735.0, 1: 1724.8. Samples: 44372720. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:43,803][19739] Avg episode reward: [(0, '1059.820'), (1, '1044.820')] +[2023-10-08 19:15:44,500][21195] Updated weights for policy 0, policy_version 86980 (0.0009) +[2023-10-08 19:15:44,520][21194] Updated weights for policy 1, policy_version 86310 (0.0009) +[2023-10-08 19:15:44,865][21195] Updated weights for policy 0, policy_version 86990 (0.0007) +[2023-10-08 19:15:44,890][21194] Updated weights for policy 1, policy_version 86320 (0.0008) +[2023-10-08 19:15:45,245][21195] Updated weights for policy 0, policy_version 87000 (0.0007) +[2023-10-08 19:15:45,254][21194] Updated weights for policy 1, policy_version 86330 (0.0008) +[2023-10-08 19:15:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 177504256. Throughput: 0: 1733.5, 1: 1694.1. Samples: 44387928. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:48,803][19739] Avg episode reward: [(0, '1059.820'), (1, '1044.820')] +[2023-10-08 19:15:49,255][21195] Updated weights for policy 0, policy_version 87010 (0.0008) +[2023-10-08 19:15:49,378][21194] Updated weights for policy 1, policy_version 86340 (0.0009) +[2023-10-08 19:15:49,630][21195] Updated weights for policy 0, policy_version 87020 (0.0008) +[2023-10-08 19:15:49,745][21194] Updated weights for policy 1, policy_version 86350 (0.0008) +[2023-10-08 19:15:49,995][21195] Updated weights for policy 0, policy_version 87030 (0.0010) +[2023-10-08 19:15:50,118][21194] Updated weights for policy 1, policy_version 86360 (0.0008) +[2023-10-08 19:15:50,366][21195] Updated weights for policy 0, policy_version 87040 (0.0008) +[2023-10-08 19:15:53,746][21194] Updated weights for policy 1, policy_version 86370 (0.0008) +[2023-10-08 19:15:53,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 177569792. Throughput: 0: 1720.1, 1: 1718.1. Samples: 44402944. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:53,803][19739] Avg episode reward: [(0, '1059.820'), (1, '1044.820')] +[2023-10-08 19:15:54,121][21194] Updated weights for policy 1, policy_version 86380 (0.0008) +[2023-10-08 19:15:54,343][21195] Updated weights for policy 0, policy_version 87050 (0.0007) +[2023-10-08 19:15:54,473][21194] Updated weights for policy 1, policy_version 86390 (0.0007) +[2023-10-08 19:15:54,721][21195] Updated weights for policy 0, policy_version 87060 (0.0007) +[2023-10-08 19:15:54,842][21194] Updated weights for policy 1, policy_version 86400 (0.0007) +[2023-10-08 19:15:55,088][21195] Updated weights for policy 0, policy_version 87070 (0.0007) +[2023-10-08 19:15:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 177635328. Throughput: 0: 1721.5, 1: 1734.9. Samples: 44424326. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:15:58,803][19739] Avg episode reward: [(0, '1059.960'), (1, '1029.540')] +[2023-10-08 19:15:58,920][21194] Updated weights for policy 1, policy_version 86410 (0.0008) +[2023-10-08 19:15:58,988][21195] Updated weights for policy 0, policy_version 87080 (0.0007) +[2023-10-08 19:15:59,287][21194] Updated weights for policy 1, policy_version 86420 (0.0008) +[2023-10-08 19:15:59,350][21195] Updated weights for policy 0, policy_version 87090 (0.0007) +[2023-10-08 19:15:59,648][21194] Updated weights for policy 1, policy_version 86430 (0.0009) +[2023-10-08 19:15:59,722][21195] Updated weights for policy 0, policy_version 87100 (0.0008) +[2023-10-08 19:16:03,711][21194] Updated weights for policy 1, policy_version 86440 (0.0008) +[2023-10-08 19:16:03,727][21195] Updated weights for policy 0, policy_version 87110 (0.0007) +[2023-10-08 19:16:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.3, 300 sec: 13662.6). Total num frames: 177700864. Throughput: 0: 1718.4, 1: 1712.5. Samples: 44439350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:03,803][19739] Avg episode reward: [(0, '1059.960'), (1, '1029.540')] +[2023-10-08 19:16:04,078][21194] Updated weights for policy 1, policy_version 86450 (0.0008) +[2023-10-08 19:16:04,095][21195] Updated weights for policy 0, policy_version 87120 (0.0007) +[2023-10-08 19:16:04,435][21194] Updated weights for policy 1, policy_version 86460 (0.0010) +[2023-10-08 19:16:04,467][21195] Updated weights for policy 0, policy_version 87130 (0.0007) +[2023-10-08 19:16:08,326][21194] Updated weights for policy 1, policy_version 86470 (0.0008) +[2023-10-08 19:16:08,378][21195] Updated weights for policy 0, policy_version 87140 (0.0007) +[2023-10-08 19:16:08,689][21194] Updated weights for policy 1, policy_version 86480 (0.0007) +[2023-10-08 19:16:08,749][21195] Updated weights for policy 0, policy_version 87150 (0.0009) +[2023-10-08 19:16:08,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 177766400. Throughput: 0: 1729.8, 1: 1726.4. Samples: 44455086. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:08,803][19739] Avg episode reward: [(0, '1059.960'), (1, '1029.540')] +[2023-10-08 19:16:09,055][21194] Updated weights for policy 1, policy_version 86490 (0.0010) +[2023-10-08 19:16:09,113][21195] Updated weights for policy 0, policy_version 87160 (0.0007) +[2023-10-08 19:16:12,918][21194] Updated weights for policy 1, policy_version 86500 (0.0008) +[2023-10-08 19:16:13,020][21195] Updated weights for policy 0, policy_version 87170 (0.0010) +[2023-10-08 19:16:13,282][21194] Updated weights for policy 1, policy_version 86510 (0.0008) +[2023-10-08 19:16:13,397][21195] Updated weights for policy 0, policy_version 87180 (0.0008) +[2023-10-08 19:16:13,640][21194] Updated weights for policy 1, policy_version 86520 (0.0008) +[2023-10-08 19:16:13,771][21195] Updated weights for policy 0, policy_version 87190 (0.0008) +[2023-10-08 19:16:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 177831936. Throughput: 0: 1730.0, 1: 1723.5. Samples: 44476266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:13,804][19739] Avg episode reward: [(0, '1060.200'), (1, '1029.310')] +[2023-10-08 19:16:14,131][21195] Updated weights for policy 0, policy_version 87200 (0.0008) +[2023-10-08 19:16:17,566][21194] Updated weights for policy 1, policy_version 86530 (0.0010) +[2023-10-08 19:16:17,935][21194] Updated weights for policy 1, policy_version 86540 (0.0009) +[2023-10-08 19:16:18,025][21195] Updated weights for policy 0, policy_version 87210 (0.0009) +[2023-10-08 19:16:18,295][21194] Updated weights for policy 1, policy_version 86550 (0.0007) +[2023-10-08 19:16:18,388][21195] Updated weights for policy 0, policy_version 87220 (0.0008) +[2023-10-08 19:16:18,661][21194] Updated weights for policy 1, policy_version 86560 (0.0007) +[2023-10-08 19:16:18,754][21195] Updated weights for policy 0, policy_version 87230 (0.0010) +[2023-10-08 19:16:18,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 177930240. Throughput: 0: 1708.0, 1: 1734.2. Samples: 44490918. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:18,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1029.310')] +[2023-10-08 19:16:22,572][21194] Updated weights for policy 1, policy_version 86570 (0.0010) +[2023-10-08 19:16:22,887][21195] Updated weights for policy 0, policy_version 87240 (0.0009) +[2023-10-08 19:16:22,925][21194] Updated weights for policy 1, policy_version 86580 (0.0007) +[2023-10-08 19:16:23,251][21195] Updated weights for policy 0, policy_version 87250 (0.0010) +[2023-10-08 19:16:23,289][21194] Updated weights for policy 1, policy_version 86590 (0.0009) +[2023-10-08 19:16:23,615][21195] Updated weights for policy 0, policy_version 87260 (0.0008) +[2023-10-08 19:16:23,803][19739] Fps is (10 sec: 19661.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 178028544. Throughput: 0: 1734.5, 1: 1739.9. Samples: 44507616. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:23,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1013.790')] +[2023-10-08 19:16:27,482][21194] Updated weights for policy 1, policy_version 86600 (0.0008) +[2023-10-08 19:16:27,556][21195] Updated weights for policy 0, policy_version 87270 (0.0008) +[2023-10-08 19:16:27,835][21194] Updated weights for policy 1, policy_version 86610 (0.0008) +[2023-10-08 19:16:27,946][21195] Updated weights for policy 0, policy_version 87280 (0.0009) +[2023-10-08 19:16:28,207][21194] Updated weights for policy 1, policy_version 86620 (0.0010) +[2023-10-08 19:16:28,315][21195] Updated weights for policy 0, policy_version 87290 (0.0008) +[2023-10-08 19:16:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 178094080. Throughput: 0: 1719.7, 1: 1714.1. Samples: 44527242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:28,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1023.460')] +[2023-10-08 19:16:32,102][21194] Updated weights for policy 1, policy_version 86630 (0.0010) +[2023-10-08 19:16:32,269][21195] Updated weights for policy 0, policy_version 87300 (0.0007) +[2023-10-08 19:16:32,465][21194] Updated weights for policy 1, policy_version 86640 (0.0009) +[2023-10-08 19:16:32,640][21195] Updated weights for policy 0, policy_version 87310 (0.0007) +[2023-10-08 19:16:32,829][21194] Updated weights for policy 1, policy_version 86650 (0.0009) +[2023-10-08 19:16:32,999][21195] Updated weights for policy 0, policy_version 87320 (0.0007) +[2023-10-08 19:16:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 178159616. Throughput: 0: 1706.3, 1: 1735.8. Samples: 44542822. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:33,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1023.430')] +[2023-10-08 19:16:36,662][21194] Updated weights for policy 1, policy_version 86660 (0.0008) +[2023-10-08 19:16:36,923][21195] Updated weights for policy 0, policy_version 87330 (0.0008) +[2023-10-08 19:16:37,018][21194] Updated weights for policy 1, policy_version 86670 (0.0007) +[2023-10-08 19:16:37,295][21195] Updated weights for policy 0, policy_version 87340 (0.0010) +[2023-10-08 19:16:37,381][21194] Updated weights for policy 1, policy_version 86680 (0.0007) +[2023-10-08 19:16:37,656][21195] Updated weights for policy 0, policy_version 87350 (0.0009) +[2023-10-08 19:16:38,017][21195] Updated weights for policy 0, policy_version 87360 (0.0008) +[2023-10-08 19:16:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 178225152. Throughput: 0: 1740.8, 1: 1732.6. Samples: 44559248. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:38,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1023.430')] +[2023-10-08 19:16:41,309][21194] Updated weights for policy 1, policy_version 86690 (0.0008) +[2023-10-08 19:16:41,679][21194] Updated weights for policy 1, policy_version 86700 (0.0007) +[2023-10-08 19:16:41,989][21195] Updated weights for policy 0, policy_version 87370 (0.0007) +[2023-10-08 19:16:42,040][21194] Updated weights for policy 1, policy_version 86710 (0.0007) +[2023-10-08 19:16:42,357][21195] Updated weights for policy 0, policy_version 87380 (0.0007) +[2023-10-08 19:16:42,412][21194] Updated weights for policy 1, policy_version 86720 (0.0007) +[2023-10-08 19:16:42,727][21195] Updated weights for policy 0, policy_version 87390 (0.0009) +[2023-10-08 19:16:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 178290688. Throughput: 0: 1716.3, 1: 1706.9. Samples: 44578370. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:43,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1023.430')] +[2023-10-08 19:16:46,479][21194] Updated weights for policy 1, policy_version 86730 (0.0007) +[2023-10-08 19:16:46,683][21195] Updated weights for policy 0, policy_version 87400 (0.0008) +[2023-10-08 19:16:46,832][21194] Updated weights for policy 1, policy_version 86740 (0.0008) +[2023-10-08 19:16:47,046][21195] Updated weights for policy 0, policy_version 87410 (0.0007) +[2023-10-08 19:16:47,202][21194] Updated weights for policy 1, policy_version 86750 (0.0008) +[2023-10-08 19:16:47,409][21195] Updated weights for policy 0, policy_version 87420 (0.0007) +[2023-10-08 19:16:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 178356224. Throughput: 0: 1720.8, 1: 1738.0. Samples: 44594998. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:16:48,804][19739] Avg episode reward: [(0, '1059.730'), (1, '1009.080')] +[2023-10-08 19:16:51,245][21195] Updated weights for policy 0, policy_version 87430 (0.0007) +[2023-10-08 19:16:51,286][21194] Updated weights for policy 1, policy_version 86760 (0.0007) +[2023-10-08 19:16:51,618][21195] Updated weights for policy 0, policy_version 87440 (0.0007) +[2023-10-08 19:16:51,648][21194] Updated weights for policy 1, policy_version 86770 (0.0008) +[2023-10-08 19:16:51,973][21195] Updated weights for policy 0, policy_version 87450 (0.0007) +[2023-10-08 19:16:52,024][21194] Updated weights for policy 1, policy_version 86780 (0.0009) +[2023-10-08 19:16:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 178421760. Throughput: 0: 1721.6, 1: 1709.0. Samples: 44609460. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:16:53,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1009.080')] +[2023-10-08 19:16:55,787][21194] Updated weights for policy 1, policy_version 86790 (0.0007) +[2023-10-08 19:16:55,793][21195] Updated weights for policy 0, policy_version 87460 (0.0008) +[2023-10-08 19:16:56,144][21194] Updated weights for policy 1, policy_version 86800 (0.0007) +[2023-10-08 19:16:56,158][21195] Updated weights for policy 0, policy_version 87470 (0.0007) +[2023-10-08 19:16:56,507][21194] Updated weights for policy 1, policy_version 86810 (0.0009) +[2023-10-08 19:16:56,527][21195] Updated weights for policy 0, policy_version 87480 (0.0008) +[2023-10-08 19:16:58,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 178487296. Throughput: 0: 1713.7, 1: 1714.2. Samples: 44630520. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:16:58,803][19739] Avg episode reward: [(0, '1059.730'), (1, '1009.080')] +[2023-10-08 19:17:00,327][21195] Updated weights for policy 0, policy_version 87490 (0.0008) +[2023-10-08 19:17:00,657][21194] Updated weights for policy 1, policy_version 86820 (0.0007) +[2023-10-08 19:17:00,681][21195] Updated weights for policy 0, policy_version 87500 (0.0008) +[2023-10-08 19:17:01,023][21194] Updated weights for policy 1, policy_version 86830 (0.0008) +[2023-10-08 19:17:01,044][21195] Updated weights for policy 0, policy_version 87510 (0.0008) +[2023-10-08 19:17:01,386][21194] Updated weights for policy 1, policy_version 86840 (0.0008) +[2023-10-08 19:17:01,414][21195] Updated weights for policy 0, policy_version 87520 (0.0008) +[2023-10-08 19:17:03,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 178552832. Throughput: 0: 1745.8, 1: 1716.6. Samples: 44646724. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:03,804][19739] Avg episode reward: [(0, '1059.730'), (1, '1004.460')] +[2023-10-08 19:17:05,203][21195] Updated weights for policy 0, policy_version 87530 (0.0008) +[2023-10-08 19:17:05,244][21194] Updated weights for policy 1, policy_version 86850 (0.0008) +[2023-10-08 19:17:05,572][21195] Updated weights for policy 0, policy_version 87540 (0.0008) +[2023-10-08 19:17:05,603][21194] Updated weights for policy 1, policy_version 86860 (0.0007) +[2023-10-08 19:17:05,928][21195] Updated weights for policy 0, policy_version 87550 (0.0009) +[2023-10-08 19:17:05,967][21194] Updated weights for policy 1, policy_version 86870 (0.0007) +[2023-10-08 19:17:06,337][21194] Updated weights for policy 1, policy_version 86880 (0.0009) +[2023-10-08 19:17:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 178618368. Throughput: 0: 1721.3, 1: 1696.8. Samples: 44661434. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:08,803][19739] Avg episode reward: [(0, '1059.730'), (1, '991.100')] +[2023-10-08 19:17:09,822][21195] Updated weights for policy 0, policy_version 87560 (0.0008) +[2023-10-08 19:17:10,195][21195] Updated weights for policy 0, policy_version 87570 (0.0008) +[2023-10-08 19:17:10,356][21194] Updated weights for policy 1, policy_version 86890 (0.0008) +[2023-10-08 19:17:10,550][21195] Updated weights for policy 0, policy_version 87580 (0.0008) +[2023-10-08 19:17:10,713][21194] Updated weights for policy 1, policy_version 86900 (0.0008) +[2023-10-08 19:17:11,077][21194] Updated weights for policy 1, policy_version 86910 (0.0008) +[2023-10-08 19:17:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 178683904. Throughput: 0: 1736.2, 1: 1720.7. Samples: 44682802. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:13,804][19739] Avg episode reward: [(0, '1059.730'), (1, '991.100')] +[2023-10-08 19:17:13,817][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000087584_89686016.pth... +[2023-10-08 19:17:13,817][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000086912_88997888.pth... +[2023-10-08 19:17:13,853][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000085312_87359488.pth +[2023-10-08 19:17:13,854][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000085984_88047616.pth +[2023-10-08 19:17:14,581][21195] Updated weights for policy 0, policy_version 87590 (0.0008) +[2023-10-08 19:17:14,970][21195] Updated weights for policy 0, policy_version 87600 (0.0008) +[2023-10-08 19:17:15,096][21194] Updated weights for policy 1, policy_version 86920 (0.0008) +[2023-10-08 19:17:15,336][21195] Updated weights for policy 0, policy_version 87610 (0.0009) +[2023-10-08 19:17:15,467][21194] Updated weights for policy 1, policy_version 86930 (0.0008) +[2023-10-08 19:17:15,833][21194] Updated weights for policy 1, policy_version 86940 (0.0011) +[2023-10-08 19:17:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 178749440. Throughput: 0: 1751.7, 1: 1699.0. Samples: 44698104. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:18,803][19739] Avg episode reward: [(0, '1059.730'), (1, '991.100')] +[2023-10-08 19:17:19,366][21195] Updated weights for policy 0, policy_version 87620 (0.0008) +[2023-10-08 19:17:19,659][21194] Updated weights for policy 1, policy_version 86950 (0.0009) +[2023-10-08 19:17:19,739][21195] Updated weights for policy 0, policy_version 87630 (0.0007) +[2023-10-08 19:17:20,030][21194] Updated weights for policy 1, policy_version 86960 (0.0009) +[2023-10-08 19:17:20,099][21195] Updated weights for policy 0, policy_version 87640 (0.0007) +[2023-10-08 19:17:20,400][21194] Updated weights for policy 1, policy_version 86970 (0.0008) +[2023-10-08 19:17:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 178814976. Throughput: 0: 1715.2, 1: 1710.2. Samples: 44713390. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:23,804][19739] Avg episode reward: [(0, '1059.730'), (1, '991.100')] +[2023-10-08 19:17:24,064][21195] Updated weights for policy 0, policy_version 87650 (0.0008) +[2023-10-08 19:17:24,329][21194] Updated weights for policy 1, policy_version 86980 (0.0008) +[2023-10-08 19:17:24,434][21195] Updated weights for policy 0, policy_version 87660 (0.0007) +[2023-10-08 19:17:24,699][21194] Updated weights for policy 1, policy_version 86990 (0.0007) +[2023-10-08 19:17:24,809][21195] Updated weights for policy 0, policy_version 87670 (0.0007) +[2023-10-08 19:17:25,068][21194] Updated weights for policy 1, policy_version 87000 (0.0007) +[2023-10-08 19:17:25,170][21195] Updated weights for policy 0, policy_version 87680 (0.0009) +[2023-10-08 19:17:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 178880512. Throughput: 0: 1739.0, 1: 1732.4. Samples: 44734582. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:28,804][19739] Avg episode reward: [(0, '1059.730'), (1, '950.660')] +[2023-10-08 19:17:29,001][21194] Updated weights for policy 1, policy_version 87010 (0.0010) +[2023-10-08 19:17:29,171][21195] Updated weights for policy 0, policy_version 87690 (0.0010) +[2023-10-08 19:17:29,369][21194] Updated weights for policy 1, policy_version 87020 (0.0008) +[2023-10-08 19:17:29,535][21195] Updated weights for policy 0, policy_version 87700 (0.0008) +[2023-10-08 19:17:29,730][21194] Updated weights for policy 1, policy_version 87030 (0.0009) +[2023-10-08 19:17:29,905][21195] Updated weights for policy 0, policy_version 87710 (0.0007) +[2023-10-08 19:17:30,094][21194] Updated weights for policy 1, policy_version 87040 (0.0008) +[2023-10-08 19:17:33,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 178946048. Throughput: 0: 1730.7, 1: 1705.0. Samples: 44749606. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:33,803][19739] Avg episode reward: [(0, '1059.730'), (1, '906.950')] +[2023-10-08 19:17:33,803][21195] Updated weights for policy 0, policy_version 87720 (0.0008) +[2023-10-08 19:17:34,170][21194] Updated weights for policy 1, policy_version 87050 (0.0008) +[2023-10-08 19:17:34,182][21195] Updated weights for policy 0, policy_version 87730 (0.0008) +[2023-10-08 19:17:34,541][21194] Updated weights for policy 1, policy_version 87060 (0.0008) +[2023-10-08 19:17:34,552][21195] Updated weights for policy 0, policy_version 87740 (0.0008) +[2023-10-08 19:17:34,910][21194] Updated weights for policy 1, policy_version 87070 (0.0009) +[2023-10-08 19:17:38,498][21195] Updated weights for policy 0, policy_version 87750 (0.0009) +[2023-10-08 19:17:38,709][21194] Updated weights for policy 1, policy_version 87080 (0.0007) +[2023-10-08 19:17:38,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 179011584. Throughput: 0: 1725.5, 1: 1737.1. Samples: 44765276. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:38,803][19739] Avg episode reward: [(0, '1075.080'), (1, '920.800')] +[2023-10-08 19:17:38,863][21195] Updated weights for policy 0, policy_version 87760 (0.0009) +[2023-10-08 19:17:39,072][21194] Updated weights for policy 1, policy_version 87090 (0.0008) +[2023-10-08 19:17:39,225][21195] Updated weights for policy 0, policy_version 87770 (0.0007) +[2023-10-08 19:17:39,445][21194] Updated weights for policy 1, policy_version 87100 (0.0008) +[2023-10-08 19:17:43,390][21195] Updated weights for policy 0, policy_version 87780 (0.0009) +[2023-10-08 19:17:43,514][21194] Updated weights for policy 1, policy_version 87110 (0.0008) +[2023-10-08 19:17:43,754][21195] Updated weights for policy 0, policy_version 87790 (0.0008) +[2023-10-08 19:17:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 179077120. Throughput: 0: 1731.4, 1: 1737.9. Samples: 44786640. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:43,804][19739] Avg episode reward: [(0, '1075.080'), (1, '920.800')] +[2023-10-08 19:17:43,875][21194] Updated weights for policy 1, policy_version 87120 (0.0009) +[2023-10-08 19:17:44,128][21195] Updated weights for policy 0, policy_version 87800 (0.0007) +[2023-10-08 19:17:44,238][21194] Updated weights for policy 1, policy_version 87130 (0.0010) +[2023-10-08 19:17:47,885][21195] Updated weights for policy 0, policy_version 87810 (0.0008) +[2023-10-08 19:17:48,231][21194] Updated weights for policy 1, policy_version 87140 (0.0010) +[2023-10-08 19:17:48,248][21195] Updated weights for policy 0, policy_version 87820 (0.0008) +[2023-10-08 19:17:48,603][21194] Updated weights for policy 1, policy_version 87150 (0.0007) +[2023-10-08 19:17:48,607][21195] Updated weights for policy 0, policy_version 87830 (0.0008) +[2023-10-08 19:17:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 179142656. Throughput: 0: 1707.4, 1: 1723.1. Samples: 44801094. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 19:17:48,803][19739] Avg episode reward: [(0, '1075.080'), (1, '920.800')] +[2023-10-08 19:17:48,962][21194] Updated weights for policy 1, policy_version 87160 (0.0007) +[2023-10-08 19:17:48,983][21195] Updated weights for policy 0, policy_version 87840 (0.0008) +[2023-10-08 19:17:52,777][21194] Updated weights for policy 1, policy_version 87170 (0.0008) +[2023-10-08 19:17:53,071][21195] Updated weights for policy 0, policy_version 87850 (0.0009) +[2023-10-08 19:17:53,142][21194] Updated weights for policy 1, policy_version 87180 (0.0008) +[2023-10-08 19:17:53,445][21195] Updated weights for policy 0, policy_version 87860 (0.0009) +[2023-10-08 19:17:53,505][21194] Updated weights for policy 1, policy_version 87190 (0.0008) +[2023-10-08 19:17:53,803][21195] Updated weights for policy 0, policy_version 87870 (0.0009) +[2023-10-08 19:17:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 179208192. Throughput: 0: 1729.2, 1: 1743.3. Samples: 44817698. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:17:53,804][19739] Avg episode reward: [(0, '1075.080'), (1, '920.800')] +[2023-10-08 19:17:53,865][21194] Updated weights for policy 1, policy_version 87200 (0.0009) +[2023-10-08 19:17:57,711][21194] Updated weights for policy 1, policy_version 87210 (0.0007) +[2023-10-08 19:17:57,823][21195] Updated weights for policy 0, policy_version 87880 (0.0009) +[2023-10-08 19:17:58,073][21194] Updated weights for policy 1, policy_version 87220 (0.0007) +[2023-10-08 19:17:58,190][21195] Updated weights for policy 0, policy_version 87890 (0.0010) +[2023-10-08 19:17:58,436][21194] Updated weights for policy 1, policy_version 87230 (0.0007) +[2023-10-08 19:17:58,552][21195] Updated weights for policy 0, policy_version 87900 (0.0009) +[2023-10-08 19:17:58,802][19739] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 179339264. Throughput: 0: 1716.9, 1: 1734.1. Samples: 44838100. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:17:58,803][19739] Avg episode reward: [(0, '1099.580'), (1, '920.800')] +[2023-10-08 19:18:02,505][21194] Updated weights for policy 1, policy_version 87240 (0.0008) +[2023-10-08 19:18:02,732][21195] Updated weights for policy 0, policy_version 87910 (0.0008) +[2023-10-08 19:18:02,865][21194] Updated weights for policy 1, policy_version 87250 (0.0008) +[2023-10-08 19:18:03,101][21195] Updated weights for policy 0, policy_version 87920 (0.0008) +[2023-10-08 19:18:03,235][21194] Updated weights for policy 1, policy_version 87260 (0.0007) +[2023-10-08 19:18:03,465][21195] Updated weights for policy 0, policy_version 87930 (0.0008) +[2023-10-08 19:18:03,803][19739] Fps is (10 sec: 19661.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179404800. Throughput: 0: 1687.9, 1: 1746.7. Samples: 44852660. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:03,803][19739] Avg episode reward: [(0, '1099.580'), (1, '935.730')] +[2023-10-08 19:18:06,912][21194] Updated weights for policy 1, policy_version 87270 (0.0009) +[2023-10-08 19:18:07,277][21194] Updated weights for policy 1, policy_version 87280 (0.0007) +[2023-10-08 19:18:07,456][21195] Updated weights for policy 0, policy_version 87940 (0.0008) +[2023-10-08 19:18:07,647][21194] Updated weights for policy 1, policy_version 87290 (0.0008) +[2023-10-08 19:18:07,824][21195] Updated weights for policy 0, policy_version 87950 (0.0008) +[2023-10-08 19:18:08,195][21195] Updated weights for policy 0, policy_version 87960 (0.0009) +[2023-10-08 19:18:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179470336. Throughput: 0: 1719.3, 1: 1737.7. Samples: 44868952. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:08,803][19739] Avg episode reward: [(0, '1099.580'), (1, '950.170')] +[2023-10-08 19:18:11,708][21194] Updated weights for policy 1, policy_version 87300 (0.0007) +[2023-10-08 19:18:12,081][21194] Updated weights for policy 1, policy_version 87310 (0.0008) +[2023-10-08 19:18:12,131][21195] Updated weights for policy 0, policy_version 87970 (0.0008) +[2023-10-08 19:18:12,445][21194] Updated weights for policy 1, policy_version 87320 (0.0007) +[2023-10-08 19:18:12,496][21195] Updated weights for policy 0, policy_version 87980 (0.0008) +[2023-10-08 19:18:12,866][21195] Updated weights for policy 0, policy_version 87990 (0.0008) +[2023-10-08 19:18:13,241][21195] Updated weights for policy 0, policy_version 88000 (0.0011) +[2023-10-08 19:18:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179535872. Throughput: 0: 1708.8, 1: 1714.0. Samples: 44888612. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:13,804][19739] Avg episode reward: [(0, '1099.580'), (1, '950.170')] +[2023-10-08 19:18:16,443][21194] Updated weights for policy 1, policy_version 87330 (0.0008) +[2023-10-08 19:18:16,814][21194] Updated weights for policy 1, policy_version 87340 (0.0007) +[2023-10-08 19:18:17,086][21195] Updated weights for policy 0, policy_version 88010 (0.0008) +[2023-10-08 19:18:17,177][21194] Updated weights for policy 1, policy_version 87350 (0.0007) +[2023-10-08 19:18:17,456][21195] Updated weights for policy 0, policy_version 88020 (0.0008) +[2023-10-08 19:18:17,539][21194] Updated weights for policy 1, policy_version 87360 (0.0007) +[2023-10-08 19:18:17,824][21195] Updated weights for policy 0, policy_version 88030 (0.0008) +[2023-10-08 19:18:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179601408. Throughput: 0: 1703.4, 1: 1743.2. Samples: 44904702. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:18,803][19739] Avg episode reward: [(0, '1099.580'), (1, '938.760')] +[2023-10-08 19:18:21,398][21194] Updated weights for policy 1, policy_version 87370 (0.0010) +[2023-10-08 19:18:21,755][21194] Updated weights for policy 1, policy_version 87380 (0.0009) +[2023-10-08 19:18:21,757][21195] Updated weights for policy 0, policy_version 88040 (0.0007) +[2023-10-08 19:18:22,120][21194] Updated weights for policy 1, policy_version 87390 (0.0007) +[2023-10-08 19:18:22,126][21195] Updated weights for policy 0, policy_version 88050 (0.0008) +[2023-10-08 19:18:22,502][21195] Updated weights for policy 0, policy_version 88060 (0.0010) +[2023-10-08 19:18:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179666944. Throughput: 0: 1718.8, 1: 1719.5. Samples: 44920000. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:23,804][19739] Avg episode reward: [(0, '1099.580'), (1, '939.320')] +[2023-10-08 19:18:26,320][21194] Updated weights for policy 1, policy_version 87400 (0.0007) +[2023-10-08 19:18:26,390][21195] Updated weights for policy 0, policy_version 88070 (0.0008) +[2023-10-08 19:18:26,695][21194] Updated weights for policy 1, policy_version 87410 (0.0007) +[2023-10-08 19:18:26,749][21195] Updated weights for policy 0, policy_version 88080 (0.0009) +[2023-10-08 19:18:27,060][21194] Updated weights for policy 1, policy_version 87420 (0.0007) +[2023-10-08 19:18:27,110][21195] Updated weights for policy 0, policy_version 88090 (0.0007) +[2023-10-08 19:18:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179732480. Throughput: 0: 1699.4, 1: 1711.2. Samples: 44940114. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:28,803][19739] Avg episode reward: [(0, '1099.580'), (1, '939.300')] +[2023-10-08 19:18:30,960][21195] Updated weights for policy 0, policy_version 88100 (0.0007) +[2023-10-08 19:18:31,121][21194] Updated weights for policy 1, policy_version 87430 (0.0008) +[2023-10-08 19:18:31,331][21195] Updated weights for policy 0, policy_version 88110 (0.0007) +[2023-10-08 19:18:31,490][21194] Updated weights for policy 1, policy_version 87440 (0.0009) +[2023-10-08 19:18:31,690][21195] Updated weights for policy 0, policy_version 88120 (0.0008) +[2023-10-08 19:18:31,853][21194] Updated weights for policy 1, policy_version 87450 (0.0008) +[2023-10-08 19:18:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 179798016. Throughput: 0: 1721.7, 1: 1732.6. Samples: 44956538. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:33,804][19739] Avg episode reward: [(0, '1099.580'), (1, '909.070')] +[2023-10-08 19:18:35,674][21195] Updated weights for policy 0, policy_version 88130 (0.0008) +[2023-10-08 19:18:35,787][21194] Updated weights for policy 1, policy_version 87460 (0.0009) +[2023-10-08 19:18:36,040][21195] Updated weights for policy 0, policy_version 88140 (0.0007) +[2023-10-08 19:18:36,153][21194] Updated weights for policy 1, policy_version 87470 (0.0009) +[2023-10-08 19:18:36,415][21195] Updated weights for policy 0, policy_version 88150 (0.0007) +[2023-10-08 19:18:36,526][21194] Updated weights for policy 1, policy_version 87480 (0.0008) +[2023-10-08 19:18:36,779][21195] Updated weights for policy 0, policy_version 88160 (0.0009) +[2023-10-08 19:18:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 179863552. Throughput: 0: 1702.4, 1: 1699.9. Samples: 44970804. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:38,804][19739] Avg episode reward: [(0, '1099.580'), (1, '909.070')] +[2023-10-08 19:18:40,414][21194] Updated weights for policy 1, policy_version 87490 (0.0007) +[2023-10-08 19:18:40,632][21195] Updated weights for policy 0, policy_version 88170 (0.0008) +[2023-10-08 19:18:40,778][21194] Updated weights for policy 1, policy_version 87500 (0.0010) +[2023-10-08 19:18:40,991][21195] Updated weights for policy 0, policy_version 88180 (0.0007) +[2023-10-08 19:18:41,141][21194] Updated weights for policy 1, policy_version 87510 (0.0008) +[2023-10-08 19:18:41,354][21195] Updated weights for policy 0, policy_version 88190 (0.0008) +[2023-10-08 19:18:41,500][21194] Updated weights for policy 1, policy_version 87520 (0.0009) +[2023-10-08 19:18:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 179929088. Throughput: 0: 1720.3, 1: 1715.2. Samples: 44992698. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:43,804][19739] Avg episode reward: [(0, '1095.320'), (1, '923.980')] +[2023-10-08 19:18:45,197][21195] Updated weights for policy 0, policy_version 88200 (0.0007) +[2023-10-08 19:18:45,404][21194] Updated weights for policy 1, policy_version 87530 (0.0009) +[2023-10-08 19:18:45,560][21195] Updated weights for policy 0, policy_version 88210 (0.0010) +[2023-10-08 19:18:45,757][21194] Updated weights for policy 1, policy_version 87540 (0.0010) +[2023-10-08 19:18:45,928][21195] Updated weights for policy 0, policy_version 88220 (0.0008) +[2023-10-08 19:18:46,124][21194] Updated weights for policy 1, policy_version 87550 (0.0009) +[2023-10-08 19:18:48,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 179994624. Throughput: 0: 1748.2, 1: 1706.7. Samples: 45008130. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:48,803][19739] Avg episode reward: [(0, '1109.680'), (1, '924.130')] +[2023-10-08 19:18:49,928][21195] Updated weights for policy 0, policy_version 88230 (0.0007) +[2023-10-08 19:18:50,177][21194] Updated weights for policy 1, policy_version 87560 (0.0008) +[2023-10-08 19:18:50,293][21195] Updated weights for policy 0, policy_version 88240 (0.0008) +[2023-10-08 19:18:50,539][21194] Updated weights for policy 1, policy_version 87570 (0.0007) +[2023-10-08 19:18:50,655][21195] Updated weights for policy 0, policy_version 88250 (0.0008) +[2023-10-08 19:18:50,898][21194] Updated weights for policy 1, policy_version 87580 (0.0008) +[2023-10-08 19:18:53,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 180060160. Throughput: 0: 1720.6, 1: 1702.5. Samples: 45022994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:53,803][19739] Avg episode reward: [(0, '1109.680'), (1, '924.130')] +[2023-10-08 19:18:54,363][21195] Updated weights for policy 0, policy_version 88260 (0.0008) +[2023-10-08 19:18:54,740][21195] Updated weights for policy 0, policy_version 88270 (0.0010) +[2023-10-08 19:18:54,860][21194] Updated weights for policy 1, policy_version 87590 (0.0007) +[2023-10-08 19:18:55,112][21195] Updated weights for policy 0, policy_version 88280 (0.0009) +[2023-10-08 19:18:55,214][21194] Updated weights for policy 1, policy_version 87600 (0.0009) +[2023-10-08 19:18:55,578][21194] Updated weights for policy 1, policy_version 87610 (0.0008) +[2023-10-08 19:18:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 180125696. Throughput: 0: 1743.6, 1: 1723.7. Samples: 45044640. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:18:58,803][19739] Avg episode reward: [(0, '1109.680'), (1, '924.130')] +[2023-10-08 19:18:59,235][21195] Updated weights for policy 0, policy_version 88290 (0.0009) +[2023-10-08 19:18:59,510][21194] Updated weights for policy 1, policy_version 87620 (0.0007) +[2023-10-08 19:18:59,604][21195] Updated weights for policy 0, policy_version 88300 (0.0007) +[2023-10-08 19:18:59,869][21194] Updated weights for policy 1, policy_version 87630 (0.0007) +[2023-10-08 19:18:59,976][21195] Updated weights for policy 0, policy_version 88310 (0.0008) +[2023-10-08 19:19:00,238][21194] Updated weights for policy 1, policy_version 87640 (0.0008) +[2023-10-08 19:19:00,342][21195] Updated weights for policy 0, policy_version 88320 (0.0009) +[2023-10-08 19:19:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 180191232. Throughput: 0: 1752.0, 1: 1692.9. Samples: 45059724. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:03,803][19739] Avg episode reward: [(0, '1109.880'), (1, '924.130')] +[2023-10-08 19:19:04,235][21194] Updated weights for policy 1, policy_version 87650 (0.0011) +[2023-10-08 19:19:04,402][21195] Updated weights for policy 0, policy_version 88330 (0.0008) +[2023-10-08 19:19:04,595][21194] Updated weights for policy 1, policy_version 87660 (0.0008) +[2023-10-08 19:19:04,777][21195] Updated weights for policy 0, policy_version 88340 (0.0007) +[2023-10-08 19:19:04,961][21194] Updated weights for policy 1, policy_version 87670 (0.0007) +[2023-10-08 19:19:05,135][21195] Updated weights for policy 0, policy_version 88350 (0.0009) +[2023-10-08 19:19:05,326][21194] Updated weights for policy 1, policy_version 87680 (0.0007) +[2023-10-08 19:19:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 180256768. Throughput: 0: 1731.9, 1: 1715.4. Samples: 45075128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:08,803][19739] Avg episode reward: [(0, '1109.880'), (1, '924.130')] +[2023-10-08 19:19:09,057][21195] Updated weights for policy 0, policy_version 88360 (0.0007) +[2023-10-08 19:19:09,187][21194] Updated weights for policy 1, policy_version 87690 (0.0009) +[2023-10-08 19:19:09,421][21195] Updated weights for policy 0, policy_version 88370 (0.0007) +[2023-10-08 19:19:09,549][21194] Updated weights for policy 1, policy_version 87700 (0.0008) +[2023-10-08 19:19:09,793][21195] Updated weights for policy 0, policy_version 88380 (0.0009) +[2023-10-08 19:19:09,920][21194] Updated weights for policy 1, policy_version 87710 (0.0007) +[2023-10-08 19:19:13,607][21195] Updated weights for policy 0, policy_version 88390 (0.0008) +[2023-10-08 19:19:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 180322304. Throughput: 0: 1748.0, 1: 1722.7. Samples: 45096294. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:13,803][19739] Avg episode reward: [(0, '1125.550'), (1, '939.330')] +[2023-10-08 19:19:13,977][21195] Updated weights for policy 0, policy_version 88400 (0.0007) +[2023-10-08 19:19:14,057][21194] Updated weights for policy 1, policy_version 87720 (0.0007) +[2023-10-08 19:19:14,338][21195] Updated weights for policy 0, policy_version 88410 (0.0008) +[2023-10-08 19:19:14,429][21194] Updated weights for policy 1, policy_version 87730 (0.0007) +[2023-10-08 19:19:14,560][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000088416_90537984.pth... +[2023-10-08 19:19:14,594][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000086784_88866816.pth +[2023-10-08 19:19:14,797][21194] Updated weights for policy 1, policy_version 87740 (0.0007) +[2023-10-08 19:19:14,943][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000087744_89849856.pth... +[2023-10-08 19:19:14,982][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000086112_88178688.pth +[2023-10-08 19:19:18,272][21195] Updated weights for policy 0, policy_version 88420 (0.0009) +[2023-10-08 19:19:18,645][21195] Updated weights for policy 0, policy_version 88430 (0.0009) +[2023-10-08 19:19:18,666][21194] Updated weights for policy 1, policy_version 87750 (0.0008) +[2023-10-08 19:19:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 180387840. Throughput: 0: 1726.6, 1: 1702.7. Samples: 45110854. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:18,803][19739] Avg episode reward: [(0, '1125.550'), (1, '939.330')] +[2023-10-08 19:19:19,005][21195] Updated weights for policy 0, policy_version 88440 (0.0008) +[2023-10-08 19:19:19,036][21194] Updated weights for policy 1, policy_version 87760 (0.0007) +[2023-10-08 19:19:19,394][21194] Updated weights for policy 1, policy_version 87770 (0.0008) +[2023-10-08 19:19:22,980][21195] Updated weights for policy 0, policy_version 88450 (0.0009) +[2023-10-08 19:19:23,304][21194] Updated weights for policy 1, policy_version 87780 (0.0009) +[2023-10-08 19:19:23,349][21195] Updated weights for policy 0, policy_version 88460 (0.0008) +[2023-10-08 19:19:23,673][21194] Updated weights for policy 1, policy_version 87790 (0.0009) +[2023-10-08 19:19:23,719][21195] Updated weights for policy 0, policy_version 88470 (0.0009) +[2023-10-08 19:19:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 180453376. Throughput: 0: 1737.9, 1: 1730.1. Samples: 45126862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:23,803][19739] Avg episode reward: [(0, '1125.550'), (1, '939.330')] +[2023-10-08 19:19:24,038][21194] Updated weights for policy 1, policy_version 87800 (0.0010) +[2023-10-08 19:19:24,078][21195] Updated weights for policy 0, policy_version 88480 (0.0007) +[2023-10-08 19:19:28,027][21195] Updated weights for policy 0, policy_version 88490 (0.0008) +[2023-10-08 19:19:28,045][21194] Updated weights for policy 1, policy_version 87810 (0.0009) +[2023-10-08 19:19:28,397][21195] Updated weights for policy 0, policy_version 88500 (0.0009) +[2023-10-08 19:19:28,412][21194] Updated weights for policy 1, policy_version 87820 (0.0009) +[2023-10-08 19:19:28,759][21195] Updated weights for policy 0, policy_version 88510 (0.0008) +[2023-10-08 19:19:28,773][21194] Updated weights for policy 1, policy_version 87830 (0.0007) +[2023-10-08 19:19:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 180518912. Throughput: 0: 1727.4, 1: 1724.7. Samples: 45148042. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:28,803][19739] Avg episode reward: [(0, '1125.550'), (1, '939.330')] +[2023-10-08 19:19:29,136][21194] Updated weights for policy 1, policy_version 87840 (0.0007) +[2023-10-08 19:19:32,691][21195] Updated weights for policy 0, policy_version 88520 (0.0009) +[2023-10-08 19:19:32,980][21194] Updated weights for policy 1, policy_version 87850 (0.0007) +[2023-10-08 19:19:33,058][21195] Updated weights for policy 0, policy_version 88530 (0.0007) +[2023-10-08 19:19:33,351][21194] Updated weights for policy 1, policy_version 87860 (0.0007) +[2023-10-08 19:19:33,442][21195] Updated weights for policy 0, policy_version 88540 (0.0008) +[2023-10-08 19:19:33,711][21194] Updated weights for policy 1, policy_version 87870 (0.0008) +[2023-10-08 19:19:33,802][19739] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 180649984. Throughput: 0: 1702.8, 1: 1724.8. Samples: 45162372. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:33,803][19739] Avg episode reward: [(0, '1156.570'), (1, '939.330')] +[2023-10-08 19:19:33,804][20740] Saving new best policy, reward=1156.570! +[2023-10-08 19:19:37,297][21195] Updated weights for policy 0, policy_version 88550 (0.0008) +[2023-10-08 19:19:37,627][21194] Updated weights for policy 1, policy_version 87880 (0.0009) +[2023-10-08 19:19:37,655][21195] Updated weights for policy 0, policy_version 88560 (0.0009) +[2023-10-08 19:19:37,992][21194] Updated weights for policy 1, policy_version 87890 (0.0008) +[2023-10-08 19:19:38,026][21195] Updated weights for policy 0, policy_version 88570 (0.0008) +[2023-10-08 19:19:38,354][21194] Updated weights for policy 1, policy_version 87900 (0.0008) +[2023-10-08 19:19:38,803][19739] Fps is (10 sec: 19660.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 180715520. Throughput: 0: 1733.6, 1: 1740.7. Samples: 45179336. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:19:38,804][19739] Avg episode reward: [(0, '1156.570'), (1, '939.330')] +[2023-10-08 19:19:42,078][21195] Updated weights for policy 0, policy_version 88580 (0.0010) +[2023-10-08 19:19:42,460][21195] Updated weights for policy 0, policy_version 88590 (0.0009) +[2023-10-08 19:19:42,467][21194] Updated weights for policy 1, policy_version 87910 (0.0007) +[2023-10-08 19:19:42,823][21194] Updated weights for policy 1, policy_version 87920 (0.0008) +[2023-10-08 19:19:42,829][21195] Updated weights for policy 0, policy_version 88600 (0.0010) +[2023-10-08 19:19:43,192][21194] Updated weights for policy 1, policy_version 87930 (0.0008) +[2023-10-08 19:19:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 180781056. Throughput: 0: 1707.9, 1: 1716.0. Samples: 45198718. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:19:43,804][19739] Avg episode reward: [(0, '1156.570'), (1, '939.330')] +[2023-10-08 19:19:46,821][21195] Updated weights for policy 0, policy_version 88610 (0.0008) +[2023-10-08 19:19:47,124][21194] Updated weights for policy 1, policy_version 87940 (0.0009) +[2023-10-08 19:19:47,194][21195] Updated weights for policy 0, policy_version 88620 (0.0009) +[2023-10-08 19:19:47,481][21194] Updated weights for policy 1, policy_version 87950 (0.0008) +[2023-10-08 19:19:47,557][21195] Updated weights for policy 0, policy_version 88630 (0.0008) +[2023-10-08 19:19:47,856][21194] Updated weights for policy 1, policy_version 87960 (0.0008) +[2023-10-08 19:19:47,920][21195] Updated weights for policy 0, policy_version 88640 (0.0008) +[2023-10-08 19:19:48,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 180846592. Throughput: 0: 1694.6, 1: 1740.5. Samples: 45214304. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:19:48,803][19739] Avg episode reward: [(0, '1172.210'), (1, '939.330')] +[2023-10-08 19:19:48,804][20740] Saving new best policy, reward=1172.210! +[2023-10-08 19:19:51,735][21194] Updated weights for policy 1, policy_version 87970 (0.0010) +[2023-10-08 19:19:51,995][21195] Updated weights for policy 0, policy_version 88650 (0.0009) +[2023-10-08 19:19:52,103][21194] Updated weights for policy 1, policy_version 87980 (0.0008) +[2023-10-08 19:19:52,362][21195] Updated weights for policy 0, policy_version 88660 (0.0009) +[2023-10-08 19:19:52,466][21194] Updated weights for policy 1, policy_version 87990 (0.0008) +[2023-10-08 19:19:52,734][21195] Updated weights for policy 0, policy_version 88670 (0.0008) +[2023-10-08 19:19:52,824][21194] Updated weights for policy 1, policy_version 88000 (0.0007) +[2023-10-08 19:19:53,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 180912128. Throughput: 0: 1719.0, 1: 1731.1. Samples: 45230380. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:19:53,803][19739] Avg episode reward: [(0, '1172.490'), (1, '939.330')] +[2023-10-08 19:19:53,804][20740] Saving new best policy, reward=1172.490! +[2023-10-08 19:19:56,401][21195] Updated weights for policy 0, policy_version 88680 (0.0007) +[2023-10-08 19:19:56,767][21195] Updated weights for policy 0, policy_version 88690 (0.0008) +[2023-10-08 19:19:56,876][21194] Updated weights for policy 1, policy_version 88010 (0.0008) +[2023-10-08 19:19:57,144][21195] Updated weights for policy 0, policy_version 88700 (0.0009) +[2023-10-08 19:19:57,237][21194] Updated weights for policy 1, policy_version 88020 (0.0008) +[2023-10-08 19:19:57,593][21194] Updated weights for policy 1, policy_version 88030 (0.0011) +[2023-10-08 19:19:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 180977664. Throughput: 0: 1704.7, 1: 1711.3. Samples: 45250016. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:19:58,803][19739] Avg episode reward: [(0, '1172.490'), (1, '939.330')] +[2023-10-08 19:20:00,954][21195] Updated weights for policy 0, policy_version 88710 (0.0009) +[2023-10-08 19:20:01,322][21195] Updated weights for policy 0, policy_version 88720 (0.0008) +[2023-10-08 19:20:01,655][21194] Updated weights for policy 1, policy_version 88040 (0.0009) +[2023-10-08 19:20:01,698][21195] Updated weights for policy 0, policy_version 88730 (0.0007) +[2023-10-08 19:20:02,016][21194] Updated weights for policy 1, policy_version 88050 (0.0009) +[2023-10-08 19:20:02,380][21194] Updated weights for policy 1, policy_version 88060 (0.0008) +[2023-10-08 19:20:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 181043200. Throughput: 0: 1729.4, 1: 1740.4. Samples: 45266998. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:03,804][19739] Avg episode reward: [(0, '1173.350'), (1, '939.330')] +[2023-10-08 19:20:03,805][20740] Saving new best policy, reward=1173.350! +[2023-10-08 19:20:05,780][21195] Updated weights for policy 0, policy_version 88740 (0.0009) +[2023-10-08 19:20:06,147][21195] Updated weights for policy 0, policy_version 88750 (0.0009) +[2023-10-08 19:20:06,323][21194] Updated weights for policy 1, policy_version 88070 (0.0008) +[2023-10-08 19:20:06,528][21195] Updated weights for policy 0, policy_version 88760 (0.0008) +[2023-10-08 19:20:06,677][21194] Updated weights for policy 1, policy_version 88080 (0.0007) +[2023-10-08 19:20:07,038][21194] Updated weights for policy 1, policy_version 88090 (0.0010) +[2023-10-08 19:20:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 181108736. Throughput: 0: 1716.6, 1: 1715.7. Samples: 45281318. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:08,803][19739] Avg episode reward: [(0, '1172.610'), (1, '939.330')] +[2023-10-08 19:20:10,393][21195] Updated weights for policy 0, policy_version 88770 (0.0009) +[2023-10-08 19:20:10,779][21195] Updated weights for policy 0, policy_version 88780 (0.0010) +[2023-10-08 19:20:11,012][21194] Updated weights for policy 1, policy_version 88100 (0.0009) +[2023-10-08 19:20:11,137][21195] Updated weights for policy 0, policy_version 88790 (0.0009) +[2023-10-08 19:20:11,363][21194] Updated weights for policy 1, policy_version 88110 (0.0008) +[2023-10-08 19:20:11,504][21195] Updated weights for policy 0, policy_version 88800 (0.0007) +[2023-10-08 19:20:11,726][21194] Updated weights for policy 1, policy_version 88120 (0.0008) +[2023-10-08 19:20:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 181174272. Throughput: 0: 1719.7, 1: 1711.3. Samples: 45302438. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:13,803][19739] Avg episode reward: [(0, '1172.610'), (1, '939.600')] +[2023-10-08 19:20:15,484][21195] Updated weights for policy 0, policy_version 88810 (0.0008) +[2023-10-08 19:20:15,559][21194] Updated weights for policy 1, policy_version 88130 (0.0009) +[2023-10-08 19:20:15,848][21195] Updated weights for policy 0, policy_version 88820 (0.0007) +[2023-10-08 19:20:15,928][21194] Updated weights for policy 1, policy_version 88140 (0.0009) +[2023-10-08 19:20:16,210][21195] Updated weights for policy 0, policy_version 88830 (0.0007) +[2023-10-08 19:20:16,290][21194] Updated weights for policy 1, policy_version 88150 (0.0007) +[2023-10-08 19:20:16,661][21194] Updated weights for policy 1, policy_version 88160 (0.0007) +[2023-10-08 19:20:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 181239808. Throughput: 0: 1749.1, 1: 1723.1. Samples: 45318620. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:18,803][19739] Avg episode reward: [(0, '1172.610'), (1, '939.600')] +[2023-10-08 19:20:20,232][21195] Updated weights for policy 0, policy_version 88840 (0.0009) +[2023-10-08 19:20:20,596][21195] Updated weights for policy 0, policy_version 88850 (0.0008) +[2023-10-08 19:20:20,601][21194] Updated weights for policy 1, policy_version 88170 (0.0008) +[2023-10-08 19:20:20,965][21194] Updated weights for policy 1, policy_version 88180 (0.0008) +[2023-10-08 19:20:20,966][21195] Updated weights for policy 0, policy_version 88860 (0.0010) +[2023-10-08 19:20:21,332][21194] Updated weights for policy 1, policy_version 88190 (0.0008) +[2023-10-08 19:20:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 181305344. Throughput: 0: 1717.2, 1: 1703.1. Samples: 45333250. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:23,803][19739] Avg episode reward: [(0, '1172.610'), (1, '939.140')] +[2023-10-08 19:20:24,907][21195] Updated weights for policy 0, policy_version 88870 (0.0008) +[2023-10-08 19:20:25,196][21194] Updated weights for policy 1, policy_version 88200 (0.0008) +[2023-10-08 19:20:25,278][21195] Updated weights for policy 0, policy_version 88880 (0.0009) +[2023-10-08 19:20:25,560][21194] Updated weights for policy 1, policy_version 88210 (0.0010) +[2023-10-08 19:20:25,647][21195] Updated weights for policy 0, policy_version 88890 (0.0009) +[2023-10-08 19:20:25,929][21194] Updated weights for policy 1, policy_version 88220 (0.0010) +[2023-10-08 19:20:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 181370880. Throughput: 0: 1740.2, 1: 1725.2. Samples: 45354658. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:28,804][19739] Avg episode reward: [(0, '1158.300'), (1, '924.740')] +[2023-10-08 19:20:29,571][21195] Updated weights for policy 0, policy_version 88900 (0.0007) +[2023-10-08 19:20:29,951][21195] Updated weights for policy 0, policy_version 88910 (0.0008) +[2023-10-08 19:20:30,163][21194] Updated weights for policy 1, policy_version 88230 (0.0007) +[2023-10-08 19:20:30,314][21195] Updated weights for policy 0, policy_version 88920 (0.0008) +[2023-10-08 19:20:30,528][21194] Updated weights for policy 1, policy_version 88240 (0.0010) +[2023-10-08 19:20:30,891][21194] Updated weights for policy 1, policy_version 88250 (0.0010) +[2023-10-08 19:20:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 181436416. Throughput: 0: 1756.2, 1: 1703.6. Samples: 45369996. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:33,803][19739] Avg episode reward: [(0, '1158.380'), (1, '924.740')] +[2023-10-08 19:20:34,275][21195] Updated weights for policy 0, policy_version 88930 (0.0008) +[2023-10-08 19:20:34,649][21195] Updated weights for policy 0, policy_version 88940 (0.0007) +[2023-10-08 19:20:34,832][21194] Updated weights for policy 1, policy_version 88260 (0.0008) +[2023-10-08 19:20:35,014][21195] Updated weights for policy 0, policy_version 88950 (0.0008) +[2023-10-08 19:20:35,202][21194] Updated weights for policy 1, policy_version 88270 (0.0008) +[2023-10-08 19:20:35,371][21195] Updated weights for policy 0, policy_version 88960 (0.0009) +[2023-10-08 19:20:35,575][21194] Updated weights for policy 1, policy_version 88280 (0.0009) +[2023-10-08 19:20:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 181501952. Throughput: 0: 1730.5, 1: 1704.7. Samples: 45384964. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:38,803][19739] Avg episode reward: [(0, '1158.380'), (1, '938.870')] +[2023-10-08 19:20:39,246][21195] Updated weights for policy 0, policy_version 88970 (0.0008) +[2023-10-08 19:20:39,542][21194] Updated weights for policy 1, policy_version 88290 (0.0007) +[2023-10-08 19:20:39,619][21195] Updated weights for policy 0, policy_version 88980 (0.0007) +[2023-10-08 19:20:39,919][21194] Updated weights for policy 1, policy_version 88300 (0.0007) +[2023-10-08 19:20:39,977][21195] Updated weights for policy 0, policy_version 88990 (0.0010) +[2023-10-08 19:20:40,283][21194] Updated weights for policy 1, policy_version 88310 (0.0009) +[2023-10-08 19:20:40,640][21194] Updated weights for policy 1, policy_version 88320 (0.0011) +[2023-10-08 19:20:43,770][21195] Updated weights for policy 0, policy_version 89000 (0.0007) +[2023-10-08 19:20:43,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 181567488. Throughput: 0: 1757.0, 1: 1721.2. Samples: 45406534. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:43,803][19739] Avg episode reward: [(0, '1158.380'), (1, '947.910')] +[2023-10-08 19:20:44,151][21195] Updated weights for policy 0, policy_version 89010 (0.0008) +[2023-10-08 19:20:44,526][21195] Updated weights for policy 0, policy_version 89020 (0.0009) +[2023-10-08 19:20:44,663][21194] Updated weights for policy 1, policy_version 88330 (0.0008) +[2023-10-08 19:20:45,025][21194] Updated weights for policy 1, policy_version 88340 (0.0009) +[2023-10-08 19:20:45,396][21194] Updated weights for policy 1, policy_version 88350 (0.0007) +[2023-10-08 19:20:48,593][21195] Updated weights for policy 0, policy_version 89030 (0.0009) +[2023-10-08 19:20:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 181633024. Throughput: 0: 1737.2, 1: 1692.5. Samples: 45421334. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:48,803][19739] Avg episode reward: [(0, '1158.380'), (1, '947.910')] +[2023-10-08 19:20:48,962][21195] Updated weights for policy 0, policy_version 89040 (0.0007) +[2023-10-08 19:20:49,324][21195] Updated weights for policy 0, policy_version 89050 (0.0007) +[2023-10-08 19:20:49,436][21194] Updated weights for policy 1, policy_version 88360 (0.0009) +[2023-10-08 19:20:49,808][21194] Updated weights for policy 1, policy_version 88370 (0.0008) +[2023-10-08 19:20:50,173][21194] Updated weights for policy 1, policy_version 88380 (0.0009) +[2023-10-08 19:20:53,046][21195] Updated weights for policy 0, policy_version 89060 (0.0009) +[2023-10-08 19:20:53,416][21195] Updated weights for policy 0, policy_version 89070 (0.0011) +[2023-10-08 19:20:53,792][21195] Updated weights for policy 0, policy_version 89080 (0.0008) +[2023-10-08 19:20:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 181698560. Throughput: 0: 1747.4, 1: 1711.0. Samples: 45436946. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:53,803][19739] Avg episode reward: [(0, '1158.380'), (1, '947.910')] +[2023-10-08 19:20:54,140][21194] Updated weights for policy 1, policy_version 88390 (0.0007) +[2023-10-08 19:20:54,510][21194] Updated weights for policy 1, policy_version 88400 (0.0007) +[2023-10-08 19:20:54,884][21194] Updated weights for policy 1, policy_version 88410 (0.0010) +[2023-10-08 19:20:57,666][21195] Updated weights for policy 0, policy_version 89090 (0.0008) +[2023-10-08 19:20:58,037][21195] Updated weights for policy 0, policy_version 89100 (0.0012) +[2023-10-08 19:20:58,405][21195] Updated weights for policy 0, policy_version 89110 (0.0010) +[2023-10-08 19:20:58,770][21195] Updated weights for policy 0, policy_version 89120 (0.0009) +[2023-10-08 19:20:58,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 181796864. Throughput: 0: 1747.6, 1: 1715.8. Samples: 45458290. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:20:58,803][19739] Avg episode reward: [(0, '1138.190'), (1, '947.910')] +[2023-10-08 19:20:58,904][21194] Updated weights for policy 1, policy_version 88420 (0.0007) +[2023-10-08 19:20:59,272][21194] Updated weights for policy 1, policy_version 88430 (0.0007) +[2023-10-08 19:20:59,640][21194] Updated weights for policy 1, policy_version 88440 (0.0008) +[2023-10-08 19:21:02,589][21195] Updated weights for policy 0, policy_version 89130 (0.0008) +[2023-10-08 19:21:02,954][21195] Updated weights for policy 0, policy_version 89140 (0.0008) +[2023-10-08 19:21:03,321][21195] Updated weights for policy 0, policy_version 89150 (0.0009) +[2023-10-08 19:21:03,600][21194] Updated weights for policy 1, policy_version 88450 (0.0009) +[2023-10-08 19:21:03,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 181862400. Throughput: 0: 1726.1, 1: 1702.0. Samples: 45472886. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:03,803][19739] Avg episode reward: [(0, '1138.190'), (1, '947.910')] +[2023-10-08 19:21:03,958][21194] Updated weights for policy 1, policy_version 88460 (0.0009) +[2023-10-08 19:21:04,329][21194] Updated weights for policy 1, policy_version 88470 (0.0007) +[2023-10-08 19:21:04,695][21194] Updated weights for policy 1, policy_version 88480 (0.0007) +[2023-10-08 19:21:07,239][21195] Updated weights for policy 0, policy_version 89160 (0.0008) +[2023-10-08 19:21:07,597][21195] Updated weights for policy 0, policy_version 89170 (0.0009) +[2023-10-08 19:21:07,972][21195] Updated weights for policy 0, policy_version 89180 (0.0007) +[2023-10-08 19:21:08,584][21194] Updated weights for policy 1, policy_version 88490 (0.0010) +[2023-10-08 19:21:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13884.8). Total num frames: 181927936. Throughput: 0: 1756.1, 1: 1723.4. Samples: 45489828. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:08,803][19739] Avg episode reward: [(0, '1138.190'), (1, '947.910')] +[2023-10-08 19:21:08,944][21194] Updated weights for policy 1, policy_version 88500 (0.0007) +[2023-10-08 19:21:09,315][21194] Updated weights for policy 1, policy_version 88510 (0.0008) +[2023-10-08 19:21:11,893][21195] Updated weights for policy 0, policy_version 89190 (0.0009) +[2023-10-08 19:21:12,270][21195] Updated weights for policy 0, policy_version 89200 (0.0008) +[2023-10-08 19:21:12,641][21195] Updated weights for policy 0, policy_version 89210 (0.0007) +[2023-10-08 19:21:13,147][21194] Updated weights for policy 1, policy_version 88520 (0.0007) +[2023-10-08 19:21:13,508][21194] Updated weights for policy 1, policy_version 88530 (0.0008) +[2023-10-08 19:21:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 181993472. Throughput: 0: 1726.4, 1: 1720.9. Samples: 45509788. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:13,803][19739] Avg episode reward: [(0, '1138.190'), (1, '962.080')] +[2023-10-08 19:21:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000089216_91357184.pth... +[2023-10-08 19:21:13,845][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000087584_89686016.pth +[2023-10-08 19:21:13,849][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000089216_91357184.pth +[2023-10-08 19:21:13,879][21194] Updated weights for policy 1, policy_version 88540 (0.0008) +[2023-10-08 19:21:14,027][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000088544_90669056.pth... +[2023-10-08 19:21:14,066][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000086912_88997888.pth +[2023-10-08 19:21:14,073][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000088544_90669056.pth +[2023-10-08 19:21:16,668][21195] Updated weights for policy 0, policy_version 89220 (0.0008) +[2023-10-08 19:21:17,046][21195] Updated weights for policy 0, policy_version 89230 (0.0009) +[2023-10-08 19:21:17,415][21195] Updated weights for policy 0, policy_version 89240 (0.0007) +[2023-10-08 19:21:17,901][21194] Updated weights for policy 1, policy_version 88550 (0.0010) +[2023-10-08 19:21:18,263][21194] Updated weights for policy 1, policy_version 88560 (0.0010) +[2023-10-08 19:21:18,622][21194] Updated weights for policy 1, policy_version 88570 (0.0007) +[2023-10-08 19:21:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 182059008. Throughput: 0: 1721.8, 1: 1720.2. Samples: 45524888. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:18,803][19739] Avg episode reward: [(0, '1138.190'), (1, '962.080')] +[2023-10-08 19:21:21,196][21195] Updated weights for policy 0, policy_version 89250 (0.0007) +[2023-10-08 19:21:21,564][21195] Updated weights for policy 0, policy_version 89260 (0.0009) +[2023-10-08 19:21:21,936][21195] Updated weights for policy 0, policy_version 89270 (0.0009) +[2023-10-08 19:21:22,304][21195] Updated weights for policy 0, policy_version 89280 (0.0009) +[2023-10-08 19:21:22,631][21194] Updated weights for policy 1, policy_version 88580 (0.0009) +[2023-10-08 19:21:23,003][21194] Updated weights for policy 1, policy_version 88590 (0.0008) +[2023-10-08 19:21:23,361][21194] Updated weights for policy 1, policy_version 88600 (0.0009) +[2023-10-08 19:21:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 182157312. Throughput: 0: 1737.8, 1: 1727.8. Samples: 45540916. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:23,803][19739] Avg episode reward: [(0, '1138.190'), (1, '969.600')] +[2023-10-08 19:21:26,247][21195] Updated weights for policy 0, policy_version 89290 (0.0009) +[2023-10-08 19:21:26,618][21195] Updated weights for policy 0, policy_version 89300 (0.0009) +[2023-10-08 19:21:26,993][21195] Updated weights for policy 0, policy_version 89310 (0.0007) +[2023-10-08 19:21:27,172][21194] Updated weights for policy 1, policy_version 88610 (0.0008) +[2023-10-08 19:21:27,550][21194] Updated weights for policy 1, policy_version 88620 (0.0009) +[2023-10-08 19:21:27,914][21194] Updated weights for policy 1, policy_version 88630 (0.0008) +[2023-10-08 19:21:28,274][21194] Updated weights for policy 1, policy_version 88640 (0.0010) +[2023-10-08 19:21:28,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 182222848. Throughput: 0: 1719.2, 1: 1715.3. Samples: 45561090. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:28,803][19739] Avg episode reward: [(0, '1138.190'), (1, '969.600')] +[2023-10-08 19:21:30,866][21195] Updated weights for policy 0, policy_version 89320 (0.0008) +[2023-10-08 19:21:31,234][21195] Updated weights for policy 0, policy_version 89330 (0.0008) +[2023-10-08 19:21:31,600][21195] Updated weights for policy 0, policy_version 89340 (0.0007) +[2023-10-08 19:21:32,337][21194] Updated weights for policy 1, policy_version 88650 (0.0008) +[2023-10-08 19:21:32,701][21194] Updated weights for policy 1, policy_version 88660 (0.0007) +[2023-10-08 19:21:33,060][21194] Updated weights for policy 1, policy_version 88670 (0.0008) +[2023-10-08 19:21:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 182288384. Throughput: 0: 1739.2, 1: 1735.5. Samples: 45577696. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:21:33,803][19739] Avg episode reward: [(0, '1138.190'), (1, '969.600')] +[2023-10-08 19:21:35,368][21195] Updated weights for policy 0, policy_version 89350 (0.0008) +[2023-10-08 19:21:35,739][21195] Updated weights for policy 0, policy_version 89360 (0.0009) +[2023-10-08 19:21:36,103][21195] Updated weights for policy 0, policy_version 89370 (0.0009) +[2023-10-08 19:21:37,037][21194] Updated weights for policy 1, policy_version 88680 (0.0011) +[2023-10-08 19:21:37,416][21194] Updated weights for policy 1, policy_version 88690 (0.0011) +[2023-10-08 19:21:37,781][21194] Updated weights for policy 1, policy_version 88700 (0.0008) +[2023-10-08 19:21:38,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 182353920. Throughput: 0: 1728.0, 1: 1732.9. Samples: 45592688. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:21:38,803][19739] Avg episode reward: [(0, '1138.190'), (1, '984.160')] +[2023-10-08 19:21:40,031][21195] Updated weights for policy 0, policy_version 89380 (0.0010) +[2023-10-08 19:21:40,391][21195] Updated weights for policy 0, policy_version 89390 (0.0009) +[2023-10-08 19:21:40,769][21195] Updated weights for policy 0, policy_version 89400 (0.0008) +[2023-10-08 19:21:41,786][21194] Updated weights for policy 1, policy_version 88710 (0.0010) +[2023-10-08 19:21:42,152][21194] Updated weights for policy 1, policy_version 88720 (0.0010) +[2023-10-08 19:21:42,514][21194] Updated weights for policy 1, policy_version 88730 (0.0008) +[2023-10-08 19:21:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 182419456. Throughput: 0: 1728.2, 1: 1712.1. Samples: 45613102. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:21:43,803][19739] Avg episode reward: [(0, '1138.190'), (1, '984.160')] +[2023-10-08 19:21:44,696][21195] Updated weights for policy 0, policy_version 89410 (0.0009) +[2023-10-08 19:21:45,064][21195] Updated weights for policy 0, policy_version 89420 (0.0008) +[2023-10-08 19:21:45,423][21195] Updated weights for policy 0, policy_version 89430 (0.0009) +[2023-10-08 19:21:45,800][21195] Updated weights for policy 0, policy_version 89440 (0.0010) +[2023-10-08 19:21:46,526][21194] Updated weights for policy 1, policy_version 88740 (0.0010) +[2023-10-08 19:21:46,894][21194] Updated weights for policy 1, policy_version 88750 (0.0009) +[2023-10-08 19:21:47,256][21194] Updated weights for policy 1, policy_version 88760 (0.0008) +[2023-10-08 19:21:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 182484992. Throughput: 0: 1747.1, 1: 1736.9. Samples: 45629664. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:21:48,803][19739] Avg episode reward: [(0, '1138.030'), (1, '984.160')] +[2023-10-08 19:21:49,885][21195] Updated weights for policy 0, policy_version 89450 (0.0007) +[2023-10-08 19:21:50,258][21195] Updated weights for policy 0, policy_version 89460 (0.0009) +[2023-10-08 19:21:50,620][21195] Updated weights for policy 0, policy_version 89470 (0.0008) +[2023-10-08 19:21:51,219][21194] Updated weights for policy 1, policy_version 88770 (0.0010) +[2023-10-08 19:21:51,582][21194] Updated weights for policy 1, policy_version 88780 (0.0007) +[2023-10-08 19:21:51,953][21194] Updated weights for policy 1, policy_version 88790 (0.0007) +[2023-10-08 19:21:52,325][21194] Updated weights for policy 1, policy_version 88800 (0.0009) +[2023-10-08 19:21:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 182550528. Throughput: 0: 1716.8, 1: 1710.5. Samples: 45644054. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:21:53,803][19739] Avg episode reward: [(0, '1138.030'), (1, '984.120')] +[2023-10-08 19:21:54,673][21195] Updated weights for policy 0, policy_version 89480 (0.0008) +[2023-10-08 19:21:55,052][21195] Updated weights for policy 0, policy_version 89490 (0.0010) +[2023-10-08 19:21:55,417][21195] Updated weights for policy 0, policy_version 89500 (0.0012) +[2023-10-08 19:21:56,277][21194] Updated weights for policy 1, policy_version 88810 (0.0007) +[2023-10-08 19:21:56,637][21194] Updated weights for policy 1, policy_version 88820 (0.0008) +[2023-10-08 19:21:57,002][21194] Updated weights for policy 1, policy_version 88830 (0.0007) +[2023-10-08 19:21:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 182616064. Throughput: 0: 1746.5, 1: 1708.5. Samples: 45665264. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:21:58,803][19739] Avg episode reward: [(0, '1138.030'), (1, '984.120')] +[2023-10-08 19:21:59,367][21195] Updated weights for policy 0, policy_version 89510 (0.0009) +[2023-10-08 19:21:59,732][21195] Updated weights for policy 0, policy_version 89520 (0.0009) +[2023-10-08 19:22:00,096][21195] Updated weights for policy 0, policy_version 89530 (0.0009) +[2023-10-08 19:22:00,983][21194] Updated weights for policy 1, policy_version 88840 (0.0009) +[2023-10-08 19:22:01,358][21194] Updated weights for policy 1, policy_version 88850 (0.0008) +[2023-10-08 19:22:01,717][21194] Updated weights for policy 1, policy_version 88860 (0.0009) +[2023-10-08 19:22:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 182681600. Throughput: 0: 1749.4, 1: 1727.0. Samples: 45681328. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:22:03,803][19739] Avg episode reward: [(0, '1111.470'), (1, '984.120')] +[2023-10-08 19:22:04,082][21195] Updated weights for policy 0, policy_version 89540 (0.0008) +[2023-10-08 19:22:04,475][21195] Updated weights for policy 0, policy_version 89550 (0.0009) +[2023-10-08 19:22:04,847][21195] Updated weights for policy 0, policy_version 89560 (0.0008) +[2023-10-08 19:22:05,574][21194] Updated weights for policy 1, policy_version 88870 (0.0008) +[2023-10-08 19:22:05,934][21194] Updated weights for policy 1, policy_version 88880 (0.0008) +[2023-10-08 19:22:06,308][21194] Updated weights for policy 1, policy_version 88890 (0.0007) +[2023-10-08 19:22:08,665][21195] Updated weights for policy 0, policy_version 89570 (0.0007) +[2023-10-08 19:22:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 182747136. Throughput: 0: 1731.6, 1: 1712.2. Samples: 45695886. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:22:08,803][19739] Avg episode reward: [(0, '1086.330'), (1, '984.120')] +[2023-10-08 19:22:09,033][21195] Updated weights for policy 0, policy_version 89580 (0.0007) +[2023-10-08 19:22:09,396][21195] Updated weights for policy 0, policy_version 89590 (0.0007) +[2023-10-08 19:22:09,762][21195] Updated weights for policy 0, policy_version 89600 (0.0007) +[2023-10-08 19:22:10,071][21194] Updated weights for policy 1, policy_version 88900 (0.0007) +[2023-10-08 19:22:10,435][21194] Updated weights for policy 1, policy_version 88910 (0.0010) +[2023-10-08 19:22:10,800][21194] Updated weights for policy 1, policy_version 88920 (0.0010) +[2023-10-08 19:22:13,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 182812672. Throughput: 0: 1740.7, 1: 1731.3. Samples: 45717330. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:22:13,803][19739] Avg episode reward: [(0, '1101.800'), (1, '984.120')] +[2023-10-08 19:22:13,811][21195] Updated weights for policy 0, policy_version 89610 (0.0009) +[2023-10-08 19:22:14,174][21195] Updated weights for policy 0, policy_version 89620 (0.0008) +[2023-10-08 19:22:14,542][21195] Updated weights for policy 0, policy_version 89630 (0.0008) +[2023-10-08 19:22:14,724][21194] Updated weights for policy 1, policy_version 88930 (0.0010) +[2023-10-08 19:22:15,084][21194] Updated weights for policy 1, policy_version 88940 (0.0011) +[2023-10-08 19:22:15,450][21194] Updated weights for policy 1, policy_version 88950 (0.0010) +[2023-10-08 19:22:15,816][21194] Updated weights for policy 1, policy_version 88960 (0.0008) +[2023-10-08 19:22:18,329][21195] Updated weights for policy 0, policy_version 89640 (0.0010) +[2023-10-08 19:22:18,702][21195] Updated weights for policy 0, policy_version 89650 (0.0009) +[2023-10-08 19:22:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 182878208. Throughput: 0: 1719.6, 1: 1710.7. Samples: 45732060. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:22:18,804][19739] Avg episode reward: [(0, '1101.800'), (1, '998.650')] +[2023-10-08 19:22:19,076][21195] Updated weights for policy 0, policy_version 89660 (0.0008) +[2023-10-08 19:22:19,904][21194] Updated weights for policy 1, policy_version 88970 (0.0011) +[2023-10-08 19:22:20,259][21194] Updated weights for policy 1, policy_version 88980 (0.0009) +[2023-10-08 19:22:20,630][21194] Updated weights for policy 1, policy_version 88990 (0.0010) +[2023-10-08 19:22:22,990][21195] Updated weights for policy 0, policy_version 89670 (0.0007) +[2023-10-08 19:22:23,356][21195] Updated weights for policy 0, policy_version 89680 (0.0007) +[2023-10-08 19:22:23,722][21195] Updated weights for policy 0, policy_version 89690 (0.0010) +[2023-10-08 19:22:23,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 182943744. Throughput: 0: 1740.8, 1: 1716.5. Samples: 45748270. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:22:23,803][19739] Avg episode reward: [(0, '1100.060'), (1, '998.740')] +[2023-10-08 19:22:24,552][21194] Updated weights for policy 1, policy_version 89000 (0.0007) +[2023-10-08 19:22:24,925][21194] Updated weights for policy 1, policy_version 89010 (0.0010) +[2023-10-08 19:22:25,291][21194] Updated weights for policy 1, policy_version 89020 (0.0009) +[2023-10-08 19:22:27,600][21195] Updated weights for policy 0, policy_version 89700 (0.0008) +[2023-10-08 19:22:27,969][21195] Updated weights for policy 0, policy_version 89710 (0.0009) +[2023-10-08 19:22:28,346][21195] Updated weights for policy 0, policy_version 89720 (0.0007) +[2023-10-08 19:22:28,802][19739] Fps is (10 sec: 16384.4, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 183042048. Throughput: 0: 1732.4, 1: 1741.5. Samples: 45769424. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 19:22:28,803][19739] Avg episode reward: [(0, '1100.060'), (1, '998.740')] +[2023-10-08 19:22:29,108][21194] Updated weights for policy 1, policy_version 89030 (0.0008) +[2023-10-08 19:22:29,462][21194] Updated weights for policy 1, policy_version 89040 (0.0009) +[2023-10-08 19:22:29,834][21194] Updated weights for policy 1, policy_version 89050 (0.0009) +[2023-10-08 19:22:32,219][21195] Updated weights for policy 0, policy_version 89730 (0.0007) +[2023-10-08 19:22:32,590][21195] Updated weights for policy 0, policy_version 89740 (0.0010) +[2023-10-08 19:22:32,966][21195] Updated weights for policy 0, policy_version 89750 (0.0010) +[2023-10-08 19:22:33,340][21195] Updated weights for policy 0, policy_version 89760 (0.0009) +[2023-10-08 19:22:33,727][21194] Updated weights for policy 1, policy_version 89060 (0.0008) +[2023-10-08 19:22:33,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 183107584. Throughput: 0: 1712.3, 1: 1712.7. Samples: 45783786. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:22:33,803][19739] Avg episode reward: [(0, '1100.060'), (1, '997.650')] +[2023-10-08 19:22:34,101][21194] Updated weights for policy 1, policy_version 89070 (0.0008) +[2023-10-08 19:22:34,456][21194] Updated weights for policy 1, policy_version 89080 (0.0009) +[2023-10-08 19:22:37,199][21195] Updated weights for policy 0, policy_version 89770 (0.0007) +[2023-10-08 19:22:37,566][21195] Updated weights for policy 0, policy_version 89780 (0.0007) +[2023-10-08 19:22:37,930][21195] Updated weights for policy 0, policy_version 89790 (0.0009) +[2023-10-08 19:22:38,293][21194] Updated weights for policy 1, policy_version 89090 (0.0009) +[2023-10-08 19:22:38,663][21194] Updated weights for policy 1, policy_version 89100 (0.0009) +[2023-10-08 19:22:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 183173120. Throughput: 0: 1746.7, 1: 1740.1. Samples: 45800960. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:22:38,803][19739] Avg episode reward: [(0, '1100.060'), (1, '984.230')] +[2023-10-08 19:22:39,022][21194] Updated weights for policy 1, policy_version 89110 (0.0007) +[2023-10-08 19:22:39,387][21194] Updated weights for policy 1, policy_version 89120 (0.0007) +[2023-10-08 19:22:41,816][21195] Updated weights for policy 0, policy_version 89800 (0.0009) +[2023-10-08 19:22:42,182][21195] Updated weights for policy 0, policy_version 89810 (0.0009) +[2023-10-08 19:22:42,555][21195] Updated weights for policy 0, policy_version 89820 (0.0007) +[2023-10-08 19:22:43,414][21194] Updated weights for policy 1, policy_version 89130 (0.0009) +[2023-10-08 19:22:43,794][21194] Updated weights for policy 1, policy_version 89140 (0.0009) +[2023-10-08 19:22:43,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 183238656. Throughput: 0: 1717.4, 1: 1747.9. Samples: 45821204. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:22:43,804][19739] Avg episode reward: [(0, '1100.060'), (1, '984.230')] +[2023-10-08 19:22:44,168][21194] Updated weights for policy 1, policy_version 89150 (0.0007) +[2023-10-08 19:22:46,475][21195] Updated weights for policy 0, policy_version 89830 (0.0008) +[2023-10-08 19:22:46,842][21195] Updated weights for policy 0, policy_version 89840 (0.0008) +[2023-10-08 19:22:47,218][21195] Updated weights for policy 0, policy_version 89850 (0.0009) +[2023-10-08 19:22:48,180][21194] Updated weights for policy 1, policy_version 89160 (0.0008) +[2023-10-08 19:22:48,538][21194] Updated weights for policy 1, policy_version 89170 (0.0008) +[2023-10-08 19:22:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 183304192. Throughput: 0: 1725.5, 1: 1726.4. Samples: 45836660. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:22:48,803][19739] Avg episode reward: [(0, '1100.040'), (1, '969.600')] +[2023-10-08 19:22:48,905][21194] Updated weights for policy 1, policy_version 89180 (0.0009) +[2023-10-08 19:22:51,095][21195] Updated weights for policy 0, policy_version 89860 (0.0008) +[2023-10-08 19:22:51,455][21195] Updated weights for policy 0, policy_version 89870 (0.0007) +[2023-10-08 19:22:51,824][21195] Updated weights for policy 0, policy_version 89880 (0.0007) +[2023-10-08 19:22:52,692][21194] Updated weights for policy 1, policy_version 89190 (0.0007) +[2023-10-08 19:22:53,066][21194] Updated weights for policy 1, policy_version 89200 (0.0007) +[2023-10-08 19:22:53,427][21194] Updated weights for policy 1, policy_version 89210 (0.0007) +[2023-10-08 19:22:53,803][19739] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 183402496. Throughput: 0: 1734.0, 1: 1744.1. Samples: 45852400. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:22:53,803][19739] Avg episode reward: [(0, '1100.040'), (1, '969.600')] +[2023-10-08 19:22:55,764][21195] Updated weights for policy 0, policy_version 89890 (0.0008) +[2023-10-08 19:22:56,172][21195] Updated weights for policy 0, policy_version 89900 (0.0008) +[2023-10-08 19:22:56,544][21195] Updated weights for policy 0, policy_version 89910 (0.0007) +[2023-10-08 19:22:56,906][21195] Updated weights for policy 0, policy_version 89920 (0.0007) +[2023-10-08 19:22:57,561][21194] Updated weights for policy 1, policy_version 89220 (0.0007) +[2023-10-08 19:22:57,933][21194] Updated weights for policy 1, policy_version 89230 (0.0010) +[2023-10-08 19:22:58,304][21194] Updated weights for policy 1, policy_version 89240 (0.0008) +[2023-10-08 19:22:58,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 183468032. Throughput: 0: 1724.5, 1: 1725.1. Samples: 45872562. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:22:58,803][19739] Avg episode reward: [(0, '1115.360'), (1, '969.690')] +[2023-10-08 19:23:00,896][21195] Updated weights for policy 0, policy_version 89930 (0.0008) +[2023-10-08 19:23:01,265][21195] Updated weights for policy 0, policy_version 89940 (0.0007) +[2023-10-08 19:23:01,624][21195] Updated weights for policy 0, policy_version 89950 (0.0007) +[2023-10-08 19:23:01,995][21194] Updated weights for policy 1, policy_version 89250 (0.0009) +[2023-10-08 19:23:02,357][21194] Updated weights for policy 1, policy_version 89260 (0.0008) +[2023-10-08 19:23:02,737][21194] Updated weights for policy 1, policy_version 89270 (0.0010) +[2023-10-08 19:23:03,096][21194] Updated weights for policy 1, policy_version 89280 (0.0009) +[2023-10-08 19:23:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 183533568. Throughput: 0: 1740.5, 1: 1742.9. Samples: 45888812. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:23:03,803][19739] Avg episode reward: [(0, '1115.360'), (1, '969.690')] +[2023-10-08 19:23:05,421][21195] Updated weights for policy 0, policy_version 89960 (0.0010) +[2023-10-08 19:23:05,788][21195] Updated weights for policy 0, policy_version 89970 (0.0008) +[2023-10-08 19:23:06,163][21195] Updated weights for policy 0, policy_version 89980 (0.0009) +[2023-10-08 19:23:07,153][21194] Updated weights for policy 1, policy_version 89290 (0.0010) +[2023-10-08 19:23:07,523][21194] Updated weights for policy 1, policy_version 89300 (0.0010) +[2023-10-08 19:23:07,876][21194] Updated weights for policy 1, policy_version 89310 (0.0010) +[2023-10-08 19:23:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 183599104. Throughput: 0: 1721.6, 1: 1740.0. Samples: 45904046. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:23:08,803][19739] Avg episode reward: [(0, '1115.520'), (1, '969.690')] +[2023-10-08 19:23:09,943][21195] Updated weights for policy 0, policy_version 89990 (0.0007) +[2023-10-08 19:23:10,310][21195] Updated weights for policy 0, policy_version 90000 (0.0008) +[2023-10-08 19:23:10,678][21195] Updated weights for policy 0, policy_version 90010 (0.0008) +[2023-10-08 19:23:11,957][21194] Updated weights for policy 1, policy_version 89320 (0.0010) +[2023-10-08 19:23:12,319][21194] Updated weights for policy 1, policy_version 89330 (0.0007) +[2023-10-08 19:23:12,687][21194] Updated weights for policy 1, policy_version 89340 (0.0007) +[2023-10-08 19:23:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 183664640. Throughput: 0: 1734.5, 1: 1711.9. Samples: 45924514. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:23:13,803][19739] Avg episode reward: [(0, '1115.520'), (1, '969.690')] +[2023-10-08 19:23:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000089344_91488256.pth... +[2023-10-08 19:23:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000090016_92176384.pth... +[2023-10-08 19:23:13,854][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000088416_90537984.pth +[2023-10-08 19:23:13,855][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000087744_89849856.pth +[2023-10-08 19:23:14,553][21195] Updated weights for policy 0, policy_version 90020 (0.0007) +[2023-10-08 19:23:14,929][21195] Updated weights for policy 0, policy_version 90030 (0.0010) +[2023-10-08 19:23:15,302][21195] Updated weights for policy 0, policy_version 90040 (0.0010) +[2023-10-08 19:23:16,594][21194] Updated weights for policy 1, policy_version 89350 (0.0008) +[2023-10-08 19:23:16,950][21194] Updated weights for policy 1, policy_version 89360 (0.0009) +[2023-10-08 19:23:17,316][21194] Updated weights for policy 1, policy_version 89370 (0.0009) +[2023-10-08 19:23:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 183730176. Throughput: 0: 1762.9, 1: 1746.5. Samples: 45941708. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:23:18,803][19739] Avg episode reward: [(0, '1115.520'), (1, '969.690')] +[2023-10-08 19:23:19,016][21195] Updated weights for policy 0, policy_version 90050 (0.0008) +[2023-10-08 19:23:19,388][21195] Updated weights for policy 0, policy_version 90060 (0.0009) +[2023-10-08 19:23:19,768][21195] Updated weights for policy 0, policy_version 90070 (0.0008) +[2023-10-08 19:23:20,126][21195] Updated weights for policy 0, policy_version 90080 (0.0008) +[2023-10-08 19:23:21,352][21194] Updated weights for policy 1, policy_version 89380 (0.0009) +[2023-10-08 19:23:21,714][21194] Updated weights for policy 1, policy_version 89390 (0.0008) +[2023-10-08 19:23:22,091][21194] Updated weights for policy 1, policy_version 89400 (0.0008) +[2023-10-08 19:23:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 183795712. Throughput: 0: 1729.1, 1: 1718.5. Samples: 45956102. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:23:23,803][19739] Avg episode reward: [(0, '1115.810'), (1, '946.380')] +[2023-10-08 19:23:24,056][21195] Updated weights for policy 0, policy_version 90090 (0.0009) +[2023-10-08 19:23:24,419][21195] Updated weights for policy 0, policy_version 90100 (0.0007) +[2023-10-08 19:23:24,782][21195] Updated weights for policy 0, policy_version 90110 (0.0007) +[2023-10-08 19:23:26,049][21194] Updated weights for policy 1, policy_version 89410 (0.0008) +[2023-10-08 19:23:26,418][21194] Updated weights for policy 1, policy_version 89420 (0.0008) +[2023-10-08 19:23:26,787][21194] Updated weights for policy 1, policy_version 89430 (0.0008) +[2023-10-08 19:23:27,150][21194] Updated weights for policy 1, policy_version 89440 (0.0007) +[2023-10-08 19:23:28,638][21195] Updated weights for policy 0, policy_version 90120 (0.0008) +[2023-10-08 19:23:28,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 183861248. Throughput: 0: 1763.7, 1: 1706.2. Samples: 45977352. Policy #0 lag: (min: 31.0, avg: 31.3, max: 42.0) +[2023-10-08 19:23:28,803][19739] Avg episode reward: [(0, '1115.810'), (1, '931.760')] +[2023-10-08 19:23:29,009][21195] Updated weights for policy 0, policy_version 90130 (0.0009) +[2023-10-08 19:23:29,383][21195] Updated weights for policy 0, policy_version 90140 (0.0009) +[2023-10-08 19:23:31,018][21194] Updated weights for policy 1, policy_version 89450 (0.0011) +[2023-10-08 19:23:31,385][21194] Updated weights for policy 1, policy_version 89460 (0.0011) +[2023-10-08 19:23:31,745][21194] Updated weights for policy 1, policy_version 89470 (0.0010) +[2023-10-08 19:23:33,429][21195] Updated weights for policy 0, policy_version 90150 (0.0007) +[2023-10-08 19:23:33,794][21195] Updated weights for policy 0, policy_version 90160 (0.0008) +[2023-10-08 19:23:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 183926784. Throughput: 0: 1746.4, 1: 1729.4. Samples: 45993072. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:23:33,804][19739] Avg episode reward: [(0, '1115.810'), (1, '931.760')] +[2023-10-08 19:23:34,160][21195] Updated weights for policy 0, policy_version 90170 (0.0008) +[2023-10-08 19:23:35,774][21194] Updated weights for policy 1, policy_version 89480 (0.0010) +[2023-10-08 19:23:36,144][21194] Updated weights for policy 1, policy_version 89490 (0.0007) +[2023-10-08 19:23:36,508][21194] Updated weights for policy 1, policy_version 89500 (0.0009) +[2023-10-08 19:23:38,077][21195] Updated weights for policy 0, policy_version 90180 (0.0009) +[2023-10-08 19:23:38,441][21195] Updated weights for policy 0, policy_version 90190 (0.0008) +[2023-10-08 19:23:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 183992320. Throughput: 0: 1754.9, 1: 1702.4. Samples: 46007982. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:23:38,803][19739] Avg episode reward: [(0, '1105.750'), (1, '931.760')] +[2023-10-08 19:23:38,805][21195] Updated weights for policy 0, policy_version 90200 (0.0007) +[2023-10-08 19:23:40,416][21194] Updated weights for policy 1, policy_version 89510 (0.0007) +[2023-10-08 19:23:40,774][21194] Updated weights for policy 1, policy_version 89520 (0.0007) +[2023-10-08 19:23:41,149][21194] Updated weights for policy 1, policy_version 89530 (0.0007) +[2023-10-08 19:23:42,721][21195] Updated weights for policy 0, policy_version 90210 (0.0008) +[2023-10-08 19:23:43,115][21195] Updated weights for policy 0, policy_version 90220 (0.0007) +[2023-10-08 19:23:43,492][21195] Updated weights for policy 0, policy_version 90230 (0.0007) +[2023-10-08 19:23:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 184057856. Throughput: 0: 1765.1, 1: 1721.0. Samples: 46029436. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:23:43,803][19739] Avg episode reward: [(0, '1105.660'), (1, '931.760')] +[2023-10-08 19:23:43,855][21195] Updated weights for policy 0, policy_version 90240 (0.0008) +[2023-10-08 19:23:45,132][21194] Updated weights for policy 1, policy_version 89540 (0.0008) +[2023-10-08 19:23:45,494][21194] Updated weights for policy 1, policy_version 89550 (0.0008) +[2023-10-08 19:23:45,863][21194] Updated weights for policy 1, policy_version 89560 (0.0009) +[2023-10-08 19:23:47,563][21195] Updated weights for policy 0, policy_version 90250 (0.0010) +[2023-10-08 19:23:47,930][21195] Updated weights for policy 0, policy_version 90260 (0.0008) +[2023-10-08 19:23:48,297][21195] Updated weights for policy 0, policy_version 90270 (0.0009) +[2023-10-08 19:23:48,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 184156160. Throughput: 0: 1738.6, 1: 1709.3. Samples: 46043968. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:23:48,803][19739] Avg episode reward: [(0, '1105.660'), (1, '931.760')] +[2023-10-08 19:23:49,848][21194] Updated weights for policy 1, policy_version 89570 (0.0008) +[2023-10-08 19:23:50,206][21194] Updated weights for policy 1, policy_version 89580 (0.0010) +[2023-10-08 19:23:50,575][21194] Updated weights for policy 1, policy_version 89590 (0.0008) +[2023-10-08 19:23:50,941][21194] Updated weights for policy 1, policy_version 89600 (0.0008) +[2023-10-08 19:23:52,384][21195] Updated weights for policy 0, policy_version 90280 (0.0010) +[2023-10-08 19:23:52,756][21195] Updated weights for policy 0, policy_version 90290 (0.0008) +[2023-10-08 19:23:53,129][21195] Updated weights for policy 0, policy_version 90300 (0.0007) +[2023-10-08 19:23:53,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 184221696. Throughput: 0: 1766.1, 1: 1709.4. Samples: 46060442. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:23:53,803][19739] Avg episode reward: [(0, '1105.660'), (1, '931.760')] +[2023-10-08 19:23:54,919][21194] Updated weights for policy 1, policy_version 89610 (0.0009) +[2023-10-08 19:23:55,289][21194] Updated weights for policy 1, policy_version 89620 (0.0008) +[2023-10-08 19:23:55,656][21194] Updated weights for policy 1, policy_version 89630 (0.0008) +[2023-10-08 19:23:57,034][21195] Updated weights for policy 0, policy_version 90310 (0.0009) +[2023-10-08 19:23:57,390][21195] Updated weights for policy 0, policy_version 90320 (0.0008) +[2023-10-08 19:23:57,766][21195] Updated weights for policy 0, policy_version 90330 (0.0008) +[2023-10-08 19:23:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 184287232. Throughput: 0: 1738.5, 1: 1732.9. Samples: 46080726. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:23:58,803][19739] Avg episode reward: [(0, '1096.480'), (1, '931.760')] +[2023-10-08 19:23:59,673][21194] Updated weights for policy 1, policy_version 89640 (0.0008) +[2023-10-08 19:24:00,053][21194] Updated weights for policy 1, policy_version 89650 (0.0009) +[2023-10-08 19:24:00,414][21194] Updated weights for policy 1, policy_version 89660 (0.0008) +[2023-10-08 19:24:01,578][21195] Updated weights for policy 0, policy_version 90340 (0.0008) +[2023-10-08 19:24:01,947][21195] Updated weights for policy 0, policy_version 90350 (0.0008) +[2023-10-08 19:24:02,308][21195] Updated weights for policy 0, policy_version 90360 (0.0010) +[2023-10-08 19:24:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 184352768. Throughput: 0: 1727.6, 1: 1695.5. Samples: 46095750. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:24:03,803][19739] Avg episode reward: [(0, '1096.480'), (1, '931.760')] +[2023-10-08 19:24:04,320][21194] Updated weights for policy 1, policy_version 89670 (0.0007) +[2023-10-08 19:24:04,692][21194] Updated weights for policy 1, policy_version 89680 (0.0007) +[2023-10-08 19:24:05,060][21194] Updated weights for policy 1, policy_version 89690 (0.0009) +[2023-10-08 19:24:06,136][21195] Updated weights for policy 0, policy_version 90370 (0.0010) +[2023-10-08 19:24:06,514][21195] Updated weights for policy 0, policy_version 90380 (0.0008) +[2023-10-08 19:24:06,888][21195] Updated weights for policy 0, policy_version 90390 (0.0008) +[2023-10-08 19:24:07,246][21195] Updated weights for policy 0, policy_version 90400 (0.0007) +[2023-10-08 19:24:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 184418304. Throughput: 0: 1740.7, 1: 1718.0. Samples: 46111742. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:24:08,803][19739] Avg episode reward: [(0, '1096.740'), (1, '931.760')] +[2023-10-08 19:24:08,825][21194] Updated weights for policy 1, policy_version 89700 (0.0008) +[2023-10-08 19:24:09,185][21194] Updated weights for policy 1, policy_version 89710 (0.0011) +[2023-10-08 19:24:09,550][21194] Updated weights for policy 1, policy_version 89720 (0.0010) +[2023-10-08 19:24:11,227][21195] Updated weights for policy 0, policy_version 90410 (0.0008) +[2023-10-08 19:24:11,593][21195] Updated weights for policy 0, policy_version 90420 (0.0009) +[2023-10-08 19:24:11,952][21195] Updated weights for policy 0, policy_version 90430 (0.0010) +[2023-10-08 19:24:13,684][21194] Updated weights for policy 1, policy_version 89730 (0.0010) +[2023-10-08 19:24:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 184483840. Throughput: 0: 1722.8, 1: 1726.8. Samples: 46132584. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:24:13,804][19739] Avg episode reward: [(0, '1096.740'), (1, '931.760')] +[2023-10-08 19:24:14,051][21194] Updated weights for policy 1, policy_version 89740 (0.0007) +[2023-10-08 19:24:14,420][21194] Updated weights for policy 1, policy_version 89750 (0.0009) +[2023-10-08 19:24:14,782][21194] Updated weights for policy 1, policy_version 89760 (0.0009) +[2023-10-08 19:24:15,981][21195] Updated weights for policy 0, policy_version 90440 (0.0010) +[2023-10-08 19:24:16,360][21195] Updated weights for policy 0, policy_version 90450 (0.0007) +[2023-10-08 19:24:16,719][21195] Updated weights for policy 0, policy_version 90460 (0.0008) +[2023-10-08 19:24:18,580][21194] Updated weights for policy 1, policy_version 89770 (0.0007) +[2023-10-08 19:24:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 184549376. Throughput: 0: 1729.8, 1: 1705.7. Samples: 46147672. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:24:18,803][19739] Avg episode reward: [(0, '1082.450'), (1, '931.760')] +[2023-10-08 19:24:18,945][21194] Updated weights for policy 1, policy_version 89780 (0.0008) +[2023-10-08 19:24:19,314][21194] Updated weights for policy 1, policy_version 89790 (0.0012) +[2023-10-08 19:24:20,681][21195] Updated weights for policy 0, policy_version 90470 (0.0009) +[2023-10-08 19:24:21,045][21195] Updated weights for policy 0, policy_version 90480 (0.0010) +[2023-10-08 19:24:21,422][21195] Updated weights for policy 0, policy_version 90490 (0.0007) +[2023-10-08 19:24:23,246][21194] Updated weights for policy 1, policy_version 89800 (0.0008) +[2023-10-08 19:24:23,612][21194] Updated weights for policy 1, policy_version 89810 (0.0008) +[2023-10-08 19:24:23,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 184614912. Throughput: 0: 1714.6, 1: 1733.5. Samples: 46163146. Policy #0 lag: (min: 16.0, avg: 31.4, max: 48.0) +[2023-10-08 19:24:23,803][19739] Avg episode reward: [(0, '1082.450'), (1, '931.760')] +[2023-10-08 19:24:23,978][21194] Updated weights for policy 1, policy_version 89820 (0.0008) +[2023-10-08 19:24:25,417][21195] Updated weights for policy 0, policy_version 90500 (0.0009) +[2023-10-08 19:24:25,774][21195] Updated weights for policy 0, policy_version 90510 (0.0010) +[2023-10-08 19:24:26,153][21195] Updated weights for policy 0, policy_version 90520 (0.0009) +[2023-10-08 19:24:27,854][21194] Updated weights for policy 1, policy_version 89830 (0.0008) +[2023-10-08 19:24:28,227][21194] Updated weights for policy 1, policy_version 89840 (0.0009) +[2023-10-08 19:24:28,594][21194] Updated weights for policy 1, policy_version 89850 (0.0009) +[2023-10-08 19:24:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 184680448. Throughput: 0: 1718.0, 1: 1722.3. Samples: 46184246. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:28,804][19739] Avg episode reward: [(0, '1082.450'), (1, '931.160')] +[2023-10-08 19:24:29,972][21195] Updated weights for policy 0, policy_version 90530 (0.0007) +[2023-10-08 19:24:30,362][21195] Updated weights for policy 0, policy_version 90540 (0.0008) +[2023-10-08 19:24:30,718][21195] Updated weights for policy 0, policy_version 90550 (0.0008) +[2023-10-08 19:24:31,080][21195] Updated weights for policy 0, policy_version 90560 (0.0008) +[2023-10-08 19:24:32,581][21194] Updated weights for policy 1, policy_version 89860 (0.0009) +[2023-10-08 19:24:32,951][21194] Updated weights for policy 1, policy_version 89870 (0.0008) +[2023-10-08 19:24:33,319][21194] Updated weights for policy 1, policy_version 89880 (0.0008) +[2023-10-08 19:24:33,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 184778752. Throughput: 0: 1748.0, 1: 1723.6. Samples: 46200190. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:33,803][19739] Avg episode reward: [(0, '1082.450'), (1, '931.160')] +[2023-10-08 19:24:34,898][21195] Updated weights for policy 0, policy_version 90570 (0.0007) +[2023-10-08 19:24:35,262][21195] Updated weights for policy 0, policy_version 90580 (0.0007) +[2023-10-08 19:24:35,624][21195] Updated weights for policy 0, policy_version 90590 (0.0009) +[2023-10-08 19:24:37,274][21194] Updated weights for policy 1, policy_version 89890 (0.0007) +[2023-10-08 19:24:37,639][21194] Updated weights for policy 1, policy_version 89900 (0.0007) +[2023-10-08 19:24:38,010][21194] Updated weights for policy 1, policy_version 89910 (0.0011) +[2023-10-08 19:24:38,374][21194] Updated weights for policy 1, policy_version 89920 (0.0011) +[2023-10-08 19:24:38,803][19739] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 184844288. Throughput: 0: 1716.8, 1: 1728.0. Samples: 46215456. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:38,803][19739] Avg episode reward: [(0, '1082.730'), (1, '931.130')] +[2023-10-08 19:24:39,619][21195] Updated weights for policy 0, policy_version 90600 (0.0008) +[2023-10-08 19:24:39,988][21195] Updated weights for policy 0, policy_version 90610 (0.0008) +[2023-10-08 19:24:40,360][21195] Updated weights for policy 0, policy_version 90620 (0.0009) +[2023-10-08 19:24:42,421][21194] Updated weights for policy 1, policy_version 89930 (0.0008) +[2023-10-08 19:24:42,787][21194] Updated weights for policy 1, policy_version 89940 (0.0008) +[2023-10-08 19:24:43,153][21194] Updated weights for policy 1, policy_version 89950 (0.0007) +[2023-10-08 19:24:43,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 184909824. Throughput: 0: 1740.8, 1: 1706.6. Samples: 46235862. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:43,804][19739] Avg episode reward: [(0, '1082.460'), (1, '931.510')] +[2023-10-08 19:24:44,519][21195] Updated weights for policy 0, policy_version 90630 (0.0007) +[2023-10-08 19:24:44,898][21195] Updated weights for policy 0, policy_version 90640 (0.0007) +[2023-10-08 19:24:45,277][21195] Updated weights for policy 0, policy_version 90650 (0.0008) +[2023-10-08 19:24:47,284][21194] Updated weights for policy 1, policy_version 89960 (0.0009) +[2023-10-08 19:24:47,642][21194] Updated weights for policy 1, policy_version 89970 (0.0008) +[2023-10-08 19:24:48,002][21194] Updated weights for policy 1, policy_version 89980 (0.0007) +[2023-10-08 19:24:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 184975360. Throughput: 0: 1745.2, 1: 1734.4. Samples: 46252330. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:48,803][19739] Avg episode reward: [(0, '1076.940'), (1, '931.510')] +[2023-10-08 19:24:49,205][21195] Updated weights for policy 0, policy_version 90660 (0.0008) +[2023-10-08 19:24:49,582][21195] Updated weights for policy 0, policy_version 90670 (0.0008) +[2023-10-08 19:24:49,948][21195] Updated weights for policy 0, policy_version 90680 (0.0008) +[2023-10-08 19:24:51,911][21194] Updated weights for policy 1, policy_version 89990 (0.0008) +[2023-10-08 19:24:52,273][21194] Updated weights for policy 1, policy_version 90000 (0.0007) +[2023-10-08 19:24:52,640][21194] Updated weights for policy 1, policy_version 90010 (0.0009) +[2023-10-08 19:24:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 185040896. Throughput: 0: 1728.6, 1: 1724.7. Samples: 46267140. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:53,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.230')] +[2023-10-08 19:24:53,851][21195] Updated weights for policy 0, policy_version 90690 (0.0008) +[2023-10-08 19:24:54,223][21195] Updated weights for policy 0, policy_version 90700 (0.0010) +[2023-10-08 19:24:54,585][21195] Updated weights for policy 0, policy_version 90710 (0.0010) +[2023-10-08 19:24:54,951][21195] Updated weights for policy 0, policy_version 90720 (0.0008) +[2023-10-08 19:24:56,439][21194] Updated weights for policy 1, policy_version 90020 (0.0010) +[2023-10-08 19:24:56,802][21194] Updated weights for policy 1, policy_version 90030 (0.0010) +[2023-10-08 19:24:57,167][21194] Updated weights for policy 1, policy_version 90040 (0.0011) +[2023-10-08 19:24:58,752][21195] Updated weights for policy 0, policy_version 90730 (0.0009) +[2023-10-08 19:24:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 185106432. Throughput: 0: 1744.1, 1: 1709.7. Samples: 46288006. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:24:58,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.230')] +[2023-10-08 19:24:59,123][21195] Updated weights for policy 0, policy_version 90740 (0.0010) +[2023-10-08 19:24:59,488][21195] Updated weights for policy 0, policy_version 90750 (0.0007) +[2023-10-08 19:25:01,302][21194] Updated weights for policy 1, policy_version 90050 (0.0008) +[2023-10-08 19:25:01,664][21194] Updated weights for policy 1, policy_version 90060 (0.0007) +[2023-10-08 19:25:02,039][21194] Updated weights for policy 1, policy_version 90070 (0.0007) +[2023-10-08 19:25:02,406][21194] Updated weights for policy 1, policy_version 90080 (0.0007) +[2023-10-08 19:25:03,398][21195] Updated weights for policy 0, policy_version 90760 (0.0008) +[2023-10-08 19:25:03,775][21195] Updated weights for policy 0, policy_version 90770 (0.0008) +[2023-10-08 19:25:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 185171968. Throughput: 0: 1731.0, 1: 1741.6. Samples: 46303938. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:25:03,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.230')] +[2023-10-08 19:25:04,138][21195] Updated weights for policy 0, policy_version 90780 (0.0008) +[2023-10-08 19:25:06,438][21194] Updated weights for policy 1, policy_version 90090 (0.0007) +[2023-10-08 19:25:06,813][21194] Updated weights for policy 1, policy_version 90100 (0.0007) +[2023-10-08 19:25:07,182][21194] Updated weights for policy 1, policy_version 90110 (0.0007) +[2023-10-08 19:25:08,015][21195] Updated weights for policy 0, policy_version 90790 (0.0007) +[2023-10-08 19:25:08,388][21195] Updated weights for policy 0, policy_version 90800 (0.0007) +[2023-10-08 19:25:08,757][21195] Updated weights for policy 0, policy_version 90810 (0.0009) +[2023-10-08 19:25:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 185237504. Throughput: 0: 1750.2, 1: 1713.4. Samples: 46319008. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:25:08,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.230')] +[2023-10-08 19:25:10,877][21194] Updated weights for policy 1, policy_version 90120 (0.0010) +[2023-10-08 19:25:11,242][21194] Updated weights for policy 1, policy_version 90130 (0.0007) +[2023-10-08 19:25:11,616][21194] Updated weights for policy 1, policy_version 90140 (0.0008) +[2023-10-08 19:25:12,615][21195] Updated weights for policy 0, policy_version 90820 (0.0008) +[2023-10-08 19:25:12,982][21195] Updated weights for policy 0, policy_version 90830 (0.0008) +[2023-10-08 19:25:13,348][21195] Updated weights for policy 0, policy_version 90840 (0.0009) +[2023-10-08 19:25:13,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 185335808. Throughput: 0: 1740.0, 1: 1715.3. Samples: 46339734. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:25:13,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.230')] +[2023-10-08 19:25:13,814][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000090848_93028352.pth... +[2023-10-08 19:25:13,814][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000090144_92307456.pth... +[2023-10-08 19:25:13,850][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000088544_90669056.pth +[2023-10-08 19:25:13,852][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000089216_91357184.pth +[2023-10-08 19:25:15,659][21194] Updated weights for policy 1, policy_version 90150 (0.0009) +[2023-10-08 19:25:16,021][21194] Updated weights for policy 1, policy_version 90160 (0.0008) +[2023-10-08 19:25:16,389][21194] Updated weights for policy 1, policy_version 90170 (0.0008) +[2023-10-08 19:25:17,343][21195] Updated weights for policy 0, policy_version 90850 (0.0008) +[2023-10-08 19:25:17,741][21195] Updated weights for policy 0, policy_version 90860 (0.0007) +[2023-10-08 19:25:18,097][21195] Updated weights for policy 0, policy_version 90870 (0.0009) +[2023-10-08 19:25:18,467][21195] Updated weights for policy 0, policy_version 90880 (0.0008) +[2023-10-08 19:25:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 185401344. Throughput: 0: 1710.3, 1: 1726.0. Samples: 46354822. Policy #0 lag: (min: 15.0, avg: 17.2, max: 47.0) +[2023-10-08 19:25:18,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.110')] +[2023-10-08 19:25:20,083][21194] Updated weights for policy 1, policy_version 90180 (0.0009) +[2023-10-08 19:25:20,453][21194] Updated weights for policy 1, policy_version 90190 (0.0010) +[2023-10-08 19:25:20,819][21194] Updated weights for policy 1, policy_version 90200 (0.0010) +[2023-10-08 19:25:22,478][21195] Updated weights for policy 0, policy_version 90890 (0.0009) +[2023-10-08 19:25:22,841][21195] Updated weights for policy 0, policy_version 90900 (0.0007) +[2023-10-08 19:25:23,220][21195] Updated weights for policy 0, policy_version 90910 (0.0009) +[2023-10-08 19:25:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 185466880. Throughput: 0: 1738.8, 1: 1717.0. Samples: 46370966. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:23,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.040')] +[2023-10-08 19:25:24,896][21194] Updated weights for policy 1, policy_version 90210 (0.0008) +[2023-10-08 19:25:25,272][21194] Updated weights for policy 1, policy_version 90220 (0.0008) +[2023-10-08 19:25:25,631][21194] Updated weights for policy 1, policy_version 90230 (0.0010) +[2023-10-08 19:25:26,004][21194] Updated weights for policy 1, policy_version 90240 (0.0008) +[2023-10-08 19:25:27,087][21195] Updated weights for policy 0, policy_version 90920 (0.0009) +[2023-10-08 19:25:27,456][21195] Updated weights for policy 0, policy_version 90930 (0.0009) +[2023-10-08 19:25:27,829][21195] Updated weights for policy 0, policy_version 90940 (0.0009) +[2023-10-08 19:25:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 185532416. Throughput: 0: 1714.0, 1: 1742.2. Samples: 46391392. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:28,803][19739] Avg episode reward: [(0, '1076.940'), (1, '932.040')] +[2023-10-08 19:25:29,909][21194] Updated weights for policy 1, policy_version 90250 (0.0009) +[2023-10-08 19:25:30,268][21194] Updated weights for policy 1, policy_version 90260 (0.0008) +[2023-10-08 19:25:30,646][21194] Updated weights for policy 1, policy_version 90270 (0.0007) +[2023-10-08 19:25:31,784][21195] Updated weights for policy 0, policy_version 90950 (0.0010) +[2023-10-08 19:25:32,144][21195] Updated weights for policy 0, policy_version 90960 (0.0010) +[2023-10-08 19:25:32,514][21195] Updated weights for policy 0, policy_version 90970 (0.0010) +[2023-10-08 19:25:33,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 185597952. Throughput: 0: 1710.5, 1: 1716.0. Samples: 46406524. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:33,804][19739] Avg episode reward: [(0, '1076.940'), (1, '932.040')] +[2023-10-08 19:25:34,644][21194] Updated weights for policy 1, policy_version 90280 (0.0007) +[2023-10-08 19:25:35,004][21194] Updated weights for policy 1, policy_version 90290 (0.0009) +[2023-10-08 19:25:35,373][21194] Updated weights for policy 1, policy_version 90300 (0.0009) +[2023-10-08 19:25:36,444][21195] Updated weights for policy 0, policy_version 90980 (0.0010) +[2023-10-08 19:25:36,800][21195] Updated weights for policy 0, policy_version 90990 (0.0009) +[2023-10-08 19:25:37,172][21195] Updated weights for policy 0, policy_version 91000 (0.0009) +[2023-10-08 19:25:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 185663488. Throughput: 0: 1733.7, 1: 1724.0. Samples: 46422736. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:38,803][19739] Avg episode reward: [(0, '1076.940'), (1, '902.230')] +[2023-10-08 19:25:39,377][21194] Updated weights for policy 1, policy_version 90310 (0.0008) +[2023-10-08 19:25:39,745][21194] Updated weights for policy 1, policy_version 90320 (0.0007) +[2023-10-08 19:25:40,109][21194] Updated weights for policy 1, policy_version 90330 (0.0007) +[2023-10-08 19:25:41,121][21195] Updated weights for policy 0, policy_version 91010 (0.0009) +[2023-10-08 19:25:41,486][21195] Updated weights for policy 0, policy_version 91020 (0.0009) +[2023-10-08 19:25:41,861][21195] Updated weights for policy 0, policy_version 91030 (0.0008) +[2023-10-08 19:25:42,226][21195] Updated weights for policy 0, policy_version 91040 (0.0008) +[2023-10-08 19:25:43,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 185729024. Throughput: 0: 1712.4, 1: 1736.3. Samples: 46443198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:43,804][19739] Avg episode reward: [(0, '1076.940'), (1, '902.160')] +[2023-10-08 19:25:44,160][21194] Updated weights for policy 1, policy_version 90340 (0.0010) +[2023-10-08 19:25:44,520][21194] Updated weights for policy 1, policy_version 90350 (0.0011) +[2023-10-08 19:25:44,881][21194] Updated weights for policy 1, policy_version 90360 (0.0007) +[2023-10-08 19:25:46,085][21195] Updated weights for policy 0, policy_version 91050 (0.0007) +[2023-10-08 19:25:46,457][21195] Updated weights for policy 0, policy_version 91060 (0.0008) +[2023-10-08 19:25:46,826][21195] Updated weights for policy 0, policy_version 91070 (0.0009) +[2023-10-08 19:25:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 185794560. Throughput: 0: 1731.2, 1: 1702.1. Samples: 46458436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:48,803][19739] Avg episode reward: [(0, '1076.940'), (1, '902.160')] +[2023-10-08 19:25:48,807][21194] Updated weights for policy 1, policy_version 90370 (0.0008) +[2023-10-08 19:25:49,180][21194] Updated weights for policy 1, policy_version 90380 (0.0008) +[2023-10-08 19:25:49,556][21194] Updated weights for policy 1, policy_version 90390 (0.0007) +[2023-10-08 19:25:49,926][21194] Updated weights for policy 1, policy_version 90400 (0.0008) +[2023-10-08 19:25:50,941][21195] Updated weights for policy 0, policy_version 91080 (0.0009) +[2023-10-08 19:25:51,310][21195] Updated weights for policy 0, policy_version 91090 (0.0011) +[2023-10-08 19:25:51,670][21195] Updated weights for policy 0, policy_version 91100 (0.0008) +[2023-10-08 19:25:53,802][19739] Fps is (10 sec: 13107.7, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 185860096. Throughput: 0: 1711.1, 1: 1724.2. Samples: 46473596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:53,803][19739] Avg episode reward: [(0, '1076.940'), (1, '899.920')] +[2023-10-08 19:25:53,984][21194] Updated weights for policy 1, policy_version 90410 (0.0008) +[2023-10-08 19:25:54,348][21194] Updated weights for policy 1, policy_version 90420 (0.0009) +[2023-10-08 19:25:54,708][21194] Updated weights for policy 1, policy_version 90430 (0.0008) +[2023-10-08 19:25:55,577][21195] Updated weights for policy 0, policy_version 91110 (0.0009) +[2023-10-08 19:25:55,949][21195] Updated weights for policy 0, policy_version 91120 (0.0008) +[2023-10-08 19:25:56,314][21195] Updated weights for policy 0, policy_version 91130 (0.0007) +[2023-10-08 19:25:58,521][21194] Updated weights for policy 1, policy_version 90440 (0.0010) +[2023-10-08 19:25:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 185925632. Throughput: 0: 1718.7, 1: 1731.4. Samples: 46494986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:25:58,803][19739] Avg episode reward: [(0, '1077.030'), (1, '885.100')] +[2023-10-08 19:25:58,881][21194] Updated weights for policy 1, policy_version 90450 (0.0011) +[2023-10-08 19:25:59,247][21194] Updated weights for policy 1, policy_version 90460 (0.0010) +[2023-10-08 19:25:59,991][21195] Updated weights for policy 0, policy_version 91140 (0.0010) +[2023-10-08 19:26:00,360][21195] Updated weights for policy 0, policy_version 91150 (0.0009) +[2023-10-08 19:26:00,730][21195] Updated weights for policy 0, policy_version 91160 (0.0012) +[2023-10-08 19:26:03,104][21194] Updated weights for policy 1, policy_version 90470 (0.0010) +[2023-10-08 19:26:03,463][21194] Updated weights for policy 1, policy_version 90480 (0.0007) +[2023-10-08 19:26:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 185991168. Throughput: 0: 1748.1, 1: 1713.7. Samples: 46510604. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:26:03,803][19739] Avg episode reward: [(0, '1077.030'), (1, '900.310')] +[2023-10-08 19:26:03,828][21194] Updated weights for policy 1, policy_version 90490 (0.0009) +[2023-10-08 19:26:04,670][21195] Updated weights for policy 0, policy_version 91170 (0.0009) +[2023-10-08 19:26:05,069][21195] Updated weights for policy 0, policy_version 91180 (0.0010) +[2023-10-08 19:26:05,445][21195] Updated weights for policy 0, policy_version 91190 (0.0010) +[2023-10-08 19:26:05,811][21195] Updated weights for policy 0, policy_version 91200 (0.0008) +[2023-10-08 19:26:07,914][21194] Updated weights for policy 1, policy_version 90500 (0.0010) +[2023-10-08 19:26:08,273][21194] Updated weights for policy 1, policy_version 90510 (0.0007) +[2023-10-08 19:26:08,637][21194] Updated weights for policy 1, policy_version 90520 (0.0009) +[2023-10-08 19:26:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 186056704. Throughput: 0: 1722.6, 1: 1723.1. Samples: 46526022. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:26:08,803][19739] Avg episode reward: [(0, '1077.370'), (1, '900.310')] +[2023-10-08 19:26:09,601][21195] Updated weights for policy 0, policy_version 91210 (0.0009) +[2023-10-08 19:26:09,978][21195] Updated weights for policy 0, policy_version 91220 (0.0007) +[2023-10-08 19:26:10,340][21195] Updated weights for policy 0, policy_version 91230 (0.0009) +[2023-10-08 19:26:12,784][21194] Updated weights for policy 1, policy_version 90530 (0.0008) +[2023-10-08 19:26:13,140][21194] Updated weights for policy 1, policy_version 90540 (0.0009) +[2023-10-08 19:26:13,507][21194] Updated weights for policy 1, policy_version 90550 (0.0007) +[2023-10-08 19:26:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.1, 300 sec: 13773.7). Total num frames: 186122240. Throughput: 0: 1749.4, 1: 1714.2. Samples: 46547254. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:26:13,804][19739] Avg episode reward: [(0, '1071.710'), (1, '900.310')] +[2023-10-08 19:26:13,864][21194] Updated weights for policy 1, policy_version 90560 (0.0008) +[2023-10-08 19:26:14,087][21195] Updated weights for policy 0, policy_version 91240 (0.0010) +[2023-10-08 19:26:14,460][21195] Updated weights for policy 0, policy_version 91250 (0.0010) +[2023-10-08 19:26:14,836][21195] Updated weights for policy 0, policy_version 91260 (0.0010) +[2023-10-08 19:26:17,737][21194] Updated weights for policy 1, policy_version 90570 (0.0009) +[2023-10-08 19:26:18,098][21194] Updated weights for policy 1, policy_version 90580 (0.0010) +[2023-10-08 19:26:18,468][21194] Updated weights for policy 1, policy_version 90590 (0.0010) +[2023-10-08 19:26:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 186220544. Throughput: 0: 1747.9, 1: 1726.9. Samples: 46562890. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:26:18,803][19739] Avg episode reward: [(0, '1071.710'), (1, '892.780')] +[2023-10-08 19:26:18,808][21195] Updated weights for policy 0, policy_version 91270 (0.0008) +[2023-10-08 19:26:19,178][21195] Updated weights for policy 0, policy_version 91280 (0.0007) +[2023-10-08 19:26:19,547][21195] Updated weights for policy 0, policy_version 91290 (0.0009) +[2023-10-08 19:26:22,541][21194] Updated weights for policy 1, policy_version 90600 (0.0008) +[2023-10-08 19:26:22,902][21194] Updated weights for policy 1, policy_version 90610 (0.0007) +[2023-10-08 19:26:23,262][21194] Updated weights for policy 1, policy_version 90620 (0.0007) +[2023-10-08 19:26:23,473][21195] Updated weights for policy 0, policy_version 91300 (0.0007) +[2023-10-08 19:26:23,803][19739] Fps is (10 sec: 16384.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 186286080. Throughput: 0: 1732.1, 1: 1727.1. Samples: 46578398. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:23,803][19739] Avg episode reward: [(0, '1071.770'), (1, '892.780')] +[2023-10-08 19:26:23,841][21195] Updated weights for policy 0, policy_version 91310 (0.0008) +[2023-10-08 19:26:24,217][21195] Updated weights for policy 0, policy_version 91320 (0.0011) +[2023-10-08 19:26:27,151][21194] Updated weights for policy 1, policy_version 90630 (0.0008) +[2023-10-08 19:26:27,512][21194] Updated weights for policy 1, policy_version 90640 (0.0008) +[2023-10-08 19:26:27,893][21194] Updated weights for policy 1, policy_version 90650 (0.0008) +[2023-10-08 19:26:28,225][21195] Updated weights for policy 0, policy_version 91330 (0.0010) +[2023-10-08 19:26:28,601][21195] Updated weights for policy 0, policy_version 91340 (0.0008) +[2023-10-08 19:26:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 186351616. Throughput: 0: 1745.5, 1: 1698.1. Samples: 46598160. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:28,803][19739] Avg episode reward: [(0, '1071.770'), (1, '876.890')] +[2023-10-08 19:26:28,961][21195] Updated weights for policy 0, policy_version 91350 (0.0009) +[2023-10-08 19:26:29,338][21195] Updated weights for policy 0, policy_version 91360 (0.0009) +[2023-10-08 19:26:31,879][21194] Updated weights for policy 1, policy_version 90660 (0.0008) +[2023-10-08 19:26:32,241][21194] Updated weights for policy 1, policy_version 90670 (0.0010) +[2023-10-08 19:26:32,609][21194] Updated weights for policy 1, policy_version 90680 (0.0007) +[2023-10-08 19:26:33,430][21195] Updated weights for policy 0, policy_version 91370 (0.0011) +[2023-10-08 19:26:33,795][21195] Updated weights for policy 0, policy_version 91380 (0.0010) +[2023-10-08 19:26:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 186417152. Throughput: 0: 1725.2, 1: 1725.9. Samples: 46613738. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:33,803][19739] Avg episode reward: [(0, '1071.770'), (1, '875.920')] +[2023-10-08 19:26:34,162][21195] Updated weights for policy 0, policy_version 91390 (0.0007) +[2023-10-08 19:26:36,542][21194] Updated weights for policy 1, policy_version 90690 (0.0007) +[2023-10-08 19:26:36,896][21194] Updated weights for policy 1, policy_version 90700 (0.0007) +[2023-10-08 19:26:37,267][21194] Updated weights for policy 1, policy_version 90710 (0.0007) +[2023-10-08 19:26:37,630][21194] Updated weights for policy 1, policy_version 90720 (0.0009) +[2023-10-08 19:26:38,070][21195] Updated weights for policy 0, policy_version 91400 (0.0008) +[2023-10-08 19:26:38,430][21195] Updated weights for policy 0, policy_version 91410 (0.0008) +[2023-10-08 19:26:38,803][21195] Updated weights for policy 0, policy_version 91420 (0.0007) +[2023-10-08 19:26:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 186482688. Throughput: 0: 1745.6, 1: 1713.2. Samples: 46629242. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:38,803][19739] Avg episode reward: [(0, '1071.770'), (1, '877.030')] +[2023-10-08 19:26:41,516][21194] Updated weights for policy 1, policy_version 90730 (0.0007) +[2023-10-08 19:26:41,878][21194] Updated weights for policy 1, policy_version 90740 (0.0009) +[2023-10-08 19:26:42,247][21194] Updated weights for policy 1, policy_version 90750 (0.0009) +[2023-10-08 19:26:42,703][21195] Updated weights for policy 0, policy_version 91430 (0.0008) +[2023-10-08 19:26:43,073][21195] Updated weights for policy 0, policy_version 91440 (0.0009) +[2023-10-08 19:26:43,452][21195] Updated weights for policy 0, policy_version 91450 (0.0009) +[2023-10-08 19:26:43,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.6, 300 sec: 13884.7). Total num frames: 186580992. Throughput: 0: 1737.5, 1: 1703.8. Samples: 46649844. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:43,803][19739] Avg episode reward: [(0, '1071.770'), (1, '877.030')] +[2023-10-08 19:26:46,086][21194] Updated weights for policy 1, policy_version 90760 (0.0008) +[2023-10-08 19:26:46,442][21194] Updated weights for policy 1, policy_version 90770 (0.0010) +[2023-10-08 19:26:46,805][21194] Updated weights for policy 1, policy_version 90780 (0.0007) +[2023-10-08 19:26:47,389][21195] Updated weights for policy 0, policy_version 91460 (0.0009) +[2023-10-08 19:26:47,764][21195] Updated weights for policy 0, policy_version 91470 (0.0009) +[2023-10-08 19:26:48,126][21195] Updated weights for policy 0, policy_version 91480 (0.0010) +[2023-10-08 19:26:48,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 186646528. Throughput: 0: 1709.6, 1: 1725.5. Samples: 46665182. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:48,803][19739] Avg episode reward: [(0, '1071.770'), (1, '891.010')] +[2023-10-08 19:26:50,700][21194] Updated weights for policy 1, policy_version 90790 (0.0007) +[2023-10-08 19:26:51,068][21194] Updated weights for policy 1, policy_version 90800 (0.0008) +[2023-10-08 19:26:51,442][21194] Updated weights for policy 1, policy_version 90810 (0.0010) +[2023-10-08 19:26:52,157][21195] Updated weights for policy 0, policy_version 91490 (0.0007) +[2023-10-08 19:26:52,567][21195] Updated weights for policy 0, policy_version 91500 (0.0009) +[2023-10-08 19:26:52,943][21195] Updated weights for policy 0, policy_version 91510 (0.0010) +[2023-10-08 19:26:53,314][21195] Updated weights for policy 0, policy_version 91520 (0.0010) +[2023-10-08 19:26:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 186712064. Throughput: 0: 1740.7, 1: 1702.4. Samples: 46680962. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:53,803][19739] Avg episode reward: [(0, '1071.770'), (1, '891.010')] +[2023-10-08 19:26:55,548][21194] Updated weights for policy 1, policy_version 90820 (0.0010) +[2023-10-08 19:26:55,918][21194] Updated weights for policy 1, policy_version 90830 (0.0009) +[2023-10-08 19:26:56,293][21194] Updated weights for policy 1, policy_version 90840 (0.0009) +[2023-10-08 19:26:57,057][21195] Updated weights for policy 0, policy_version 91530 (0.0010) +[2023-10-08 19:26:57,425][21195] Updated weights for policy 0, policy_version 91540 (0.0008) +[2023-10-08 19:26:57,804][21195] Updated weights for policy 0, policy_version 91550 (0.0008) +[2023-10-08 19:26:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 186777600. Throughput: 0: 1709.9, 1: 1715.9. Samples: 46701416. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:26:58,803][19739] Avg episode reward: [(0, '1071.960'), (1, '891.010')] +[2023-10-08 19:27:00,255][21194] Updated weights for policy 1, policy_version 90850 (0.0009) +[2023-10-08 19:27:00,625][21194] Updated weights for policy 1, policy_version 90860 (0.0008) +[2023-10-08 19:27:00,993][21194] Updated weights for policy 1, policy_version 90870 (0.0007) +[2023-10-08 19:27:01,352][21194] Updated weights for policy 1, policy_version 90880 (0.0007) +[2023-10-08 19:27:01,739][21195] Updated weights for policy 0, policy_version 91560 (0.0009) +[2023-10-08 19:27:02,118][21195] Updated weights for policy 0, policy_version 91570 (0.0008) +[2023-10-08 19:27:02,477][21195] Updated weights for policy 0, policy_version 91580 (0.0008) +[2023-10-08 19:27:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 186843136. Throughput: 0: 1714.7, 1: 1713.0. Samples: 46717136. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:27:03,803][19739] Avg episode reward: [(0, '1086.230'), (1, '905.060')] +[2023-10-08 19:27:05,358][21194] Updated weights for policy 1, policy_version 90890 (0.0011) +[2023-10-08 19:27:05,727][21194] Updated weights for policy 1, policy_version 90900 (0.0009) +[2023-10-08 19:27:06,085][21194] Updated weights for policy 1, policy_version 90910 (0.0009) +[2023-10-08 19:27:06,452][21195] Updated weights for policy 0, policy_version 91590 (0.0008) +[2023-10-08 19:27:06,827][21195] Updated weights for policy 0, policy_version 91600 (0.0010) +[2023-10-08 19:27:07,189][21195] Updated weights for policy 0, policy_version 91610 (0.0008) +[2023-10-08 19:27:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 186908672. Throughput: 0: 1728.6, 1: 1700.3. Samples: 46732698. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:27:08,803][19739] Avg episode reward: [(0, '1086.230'), (1, '920.390')] +[2023-10-08 19:27:10,211][21194] Updated weights for policy 1, policy_version 90920 (0.0008) +[2023-10-08 19:27:10,591][21194] Updated weights for policy 1, policy_version 90930 (0.0010) +[2023-10-08 19:27:10,951][21194] Updated weights for policy 1, policy_version 90940 (0.0008) +[2023-10-08 19:27:10,974][21195] Updated weights for policy 0, policy_version 91620 (0.0008) +[2023-10-08 19:27:11,340][21195] Updated weights for policy 0, policy_version 91630 (0.0007) +[2023-10-08 19:27:11,712][21195] Updated weights for policy 0, policy_version 91640 (0.0007) +[2023-10-08 19:27:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 186974208. Throughput: 0: 1723.4, 1: 1729.1. Samples: 46753526. Policy #0 lag: (min: 11.0, avg: 13.8, max: 43.0) +[2023-10-08 19:27:13,804][19739] Avg episode reward: [(0, '1101.720'), (1, '920.390')] +[2023-10-08 19:27:13,816][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000091648_93847552.pth... +[2023-10-08 19:27:13,816][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000090944_93126656.pth... +[2023-10-08 19:27:13,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000089344_91488256.pth +[2023-10-08 19:27:13,860][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000090016_92176384.pth +[2023-10-08 19:27:14,814][21194] Updated weights for policy 1, policy_version 90950 (0.0007) +[2023-10-08 19:27:15,174][21194] Updated weights for policy 1, policy_version 90960 (0.0007) +[2023-10-08 19:27:15,539][21194] Updated weights for policy 1, policy_version 90970 (0.0007) +[2023-10-08 19:27:15,557][21195] Updated weights for policy 0, policy_version 91650 (0.0011) +[2023-10-08 19:27:15,924][21195] Updated weights for policy 0, policy_version 91660 (0.0008) +[2023-10-08 19:27:16,295][21195] Updated weights for policy 0, policy_version 91670 (0.0007) +[2023-10-08 19:27:16,668][21195] Updated weights for policy 0, policy_version 91680 (0.0011) +[2023-10-08 19:27:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 187039744. Throughput: 0: 1746.3, 1: 1704.4. Samples: 46769022. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:18,803][19739] Avg episode reward: [(0, '1079.870'), (1, '906.490')] +[2023-10-08 19:27:19,542][21194] Updated weights for policy 1, policy_version 90980 (0.0007) +[2023-10-08 19:27:19,903][21194] Updated weights for policy 1, policy_version 90990 (0.0008) +[2023-10-08 19:27:20,269][21194] Updated weights for policy 1, policy_version 91000 (0.0007) +[2023-10-08 19:27:20,416][21195] Updated weights for policy 0, policy_version 91690 (0.0008) +[2023-10-08 19:27:20,787][21195] Updated weights for policy 0, policy_version 91700 (0.0008) +[2023-10-08 19:27:21,148][21195] Updated weights for policy 0, policy_version 91710 (0.0008) +[2023-10-08 19:27:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 187105280. Throughput: 0: 1728.3, 1: 1726.2. Samples: 46784692. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:23,803][19739] Avg episode reward: [(0, '1079.870'), (1, '906.490')] +[2023-10-08 19:27:24,029][21194] Updated weights for policy 1, policy_version 91010 (0.0008) +[2023-10-08 19:27:24,396][21194] Updated weights for policy 1, policy_version 91020 (0.0011) +[2023-10-08 19:27:24,768][21194] Updated weights for policy 1, policy_version 91030 (0.0009) +[2023-10-08 19:27:25,056][21195] Updated weights for policy 0, policy_version 91720 (0.0008) +[2023-10-08 19:27:25,128][21194] Updated weights for policy 1, policy_version 91040 (0.0009) +[2023-10-08 19:27:25,412][21195] Updated weights for policy 0, policy_version 91730 (0.0007) +[2023-10-08 19:27:25,775][21195] Updated weights for policy 0, policy_version 91740 (0.0011) +[2023-10-08 19:27:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 187170816. Throughput: 0: 1739.6, 1: 1738.6. Samples: 46806364. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:28,803][19739] Avg episode reward: [(0, '1050.260'), (1, '906.490')] +[2023-10-08 19:27:28,964][21194] Updated weights for policy 1, policy_version 91050 (0.0010) +[2023-10-08 19:27:29,338][21194] Updated weights for policy 1, policy_version 91060 (0.0007) +[2023-10-08 19:27:29,708][21194] Updated weights for policy 1, policy_version 91070 (0.0007) +[2023-10-08 19:27:29,802][21195] Updated weights for policy 0, policy_version 91750 (0.0009) +[2023-10-08 19:27:30,173][21195] Updated weights for policy 0, policy_version 91760 (0.0010) +[2023-10-08 19:27:30,538][21195] Updated weights for policy 0, policy_version 91770 (0.0008) +[2023-10-08 19:27:33,768][21194] Updated weights for policy 1, policy_version 91080 (0.0009) +[2023-10-08 19:27:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 187236352. Throughput: 0: 1762.2, 1: 1714.8. Samples: 46821646. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:33,803][19739] Avg episode reward: [(0, '1050.360'), (1, '906.490')] +[2023-10-08 19:27:34,145][21194] Updated weights for policy 1, policy_version 91090 (0.0008) +[2023-10-08 19:27:34,416][21195] Updated weights for policy 0, policy_version 91780 (0.0008) +[2023-10-08 19:27:34,508][21194] Updated weights for policy 1, policy_version 91100 (0.0009) +[2023-10-08 19:27:34,777][21195] Updated weights for policy 0, policy_version 91790 (0.0008) +[2023-10-08 19:27:35,150][21195] Updated weights for policy 0, policy_version 91800 (0.0008) +[2023-10-08 19:27:38,442][21194] Updated weights for policy 1, policy_version 91110 (0.0009) +[2023-10-08 19:27:38,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 187301888. Throughput: 0: 1730.3, 1: 1734.4. Samples: 46836874. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:38,804][19739] Avg episode reward: [(0, '1050.360'), (1, '906.490')] +[2023-10-08 19:27:38,812][21194] Updated weights for policy 1, policy_version 91120 (0.0008) +[2023-10-08 19:27:39,062][21195] Updated weights for policy 0, policy_version 91810 (0.0010) +[2023-10-08 19:27:39,175][21194] Updated weights for policy 1, policy_version 91130 (0.0008) +[2023-10-08 19:27:39,464][21195] Updated weights for policy 0, policy_version 91820 (0.0010) +[2023-10-08 19:27:39,834][21195] Updated weights for policy 0, policy_version 91830 (0.0011) +[2023-10-08 19:27:40,194][21195] Updated weights for policy 0, policy_version 91840 (0.0011) +[2023-10-08 19:27:43,261][21194] Updated weights for policy 1, policy_version 91140 (0.0007) +[2023-10-08 19:27:43,633][21194] Updated weights for policy 1, policy_version 91150 (0.0007) +[2023-10-08 19:27:43,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 187367424. Throughput: 0: 1752.5, 1: 1727.9. Samples: 46858036. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:43,803][19739] Avg episode reward: [(0, '1050.360'), (1, '921.290')] +[2023-10-08 19:27:43,995][21194] Updated weights for policy 1, policy_version 91160 (0.0007) +[2023-10-08 19:27:44,099][21195] Updated weights for policy 0, policy_version 91850 (0.0010) +[2023-10-08 19:27:44,480][21195] Updated weights for policy 0, policy_version 91860 (0.0008) +[2023-10-08 19:27:44,848][21195] Updated weights for policy 0, policy_version 91870 (0.0010) +[2023-10-08 19:27:48,113][21194] Updated weights for policy 1, policy_version 91170 (0.0008) +[2023-10-08 19:27:48,478][21194] Updated weights for policy 1, policy_version 91180 (0.0008) +[2023-10-08 19:27:48,761][21195] Updated weights for policy 0, policy_version 91880 (0.0008) +[2023-10-08 19:27:48,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 187432960. Throughput: 0: 1747.2, 1: 1722.5. Samples: 46873272. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:48,803][19739] Avg episode reward: [(0, '1050.360'), (1, '921.290')] +[2023-10-08 19:27:48,841][21194] Updated weights for policy 1, policy_version 91190 (0.0008) +[2023-10-08 19:27:49,132][21195] Updated weights for policy 0, policy_version 91890 (0.0008) +[2023-10-08 19:27:49,216][21194] Updated weights for policy 1, policy_version 91200 (0.0008) +[2023-10-08 19:27:49,505][21195] Updated weights for policy 0, policy_version 91900 (0.0010) +[2023-10-08 19:27:53,276][21194] Updated weights for policy 1, policy_version 91210 (0.0007) +[2023-10-08 19:27:53,546][21195] Updated weights for policy 0, policy_version 91910 (0.0007) +[2023-10-08 19:27:53,641][21194] Updated weights for policy 1, policy_version 91220 (0.0008) +[2023-10-08 19:27:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 187498496. Throughput: 0: 1733.9, 1: 1732.3. Samples: 46888674. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:53,804][19739] Avg episode reward: [(0, '1050.350'), (1, '921.290')] +[2023-10-08 19:27:53,914][21195] Updated weights for policy 0, policy_version 91920 (0.0008) +[2023-10-08 19:27:54,011][21194] Updated weights for policy 1, policy_version 91230 (0.0008) +[2023-10-08 19:27:54,291][21195] Updated weights for policy 0, policy_version 91930 (0.0008) +[2023-10-08 19:27:57,803][21194] Updated weights for policy 1, policy_version 91240 (0.0009) +[2023-10-08 19:27:58,146][21195] Updated weights for policy 0, policy_version 91940 (0.0009) +[2023-10-08 19:27:58,162][21194] Updated weights for policy 1, policy_version 91250 (0.0009) +[2023-10-08 19:27:58,521][21195] Updated weights for policy 0, policy_version 91950 (0.0008) +[2023-10-08 19:27:58,531][21194] Updated weights for policy 1, policy_version 91260 (0.0008) +[2023-10-08 19:27:58,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 187596800. Throughput: 0: 1741.7, 1: 1725.9. Samples: 46909568. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:27:58,803][19739] Avg episode reward: [(0, '1079.780'), (1, '921.290')] +[2023-10-08 19:27:58,888][21195] Updated weights for policy 0, policy_version 91960 (0.0008) +[2023-10-08 19:28:02,565][21194] Updated weights for policy 1, policy_version 91270 (0.0007) +[2023-10-08 19:28:02,834][21195] Updated weights for policy 0, policy_version 91970 (0.0008) +[2023-10-08 19:28:02,929][21194] Updated weights for policy 1, policy_version 91280 (0.0008) +[2023-10-08 19:28:03,206][21195] Updated weights for policy 0, policy_version 91980 (0.0008) +[2023-10-08 19:28:03,286][21194] Updated weights for policy 1, policy_version 91290 (0.0007) +[2023-10-08 19:28:03,577][21195] Updated weights for policy 0, policy_version 91990 (0.0009) +[2023-10-08 19:28:03,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 187662336. Throughput: 0: 1712.0, 1: 1735.6. Samples: 46924162. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:28:03,803][19739] Avg episode reward: [(0, '1064.630'), (1, '921.290')] +[2023-10-08 19:28:03,951][21195] Updated weights for policy 0, policy_version 92000 (0.0009) +[2023-10-08 19:28:07,122][21194] Updated weights for policy 1, policy_version 91300 (0.0007) +[2023-10-08 19:28:07,490][21194] Updated weights for policy 1, policy_version 91310 (0.0007) +[2023-10-08 19:28:07,796][21195] Updated weights for policy 0, policy_version 92010 (0.0007) +[2023-10-08 19:28:07,862][21194] Updated weights for policy 1, policy_version 91320 (0.0008) +[2023-10-08 19:28:08,149][21195] Updated weights for policy 0, policy_version 92020 (0.0010) +[2023-10-08 19:28:08,516][21195] Updated weights for policy 0, policy_version 92030 (0.0010) +[2023-10-08 19:28:08,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 187760640. Throughput: 0: 1735.7, 1: 1732.4. Samples: 46940756. Policy #0 lag: (min: 13.0, avg: 13.0, max: 13.0) +[2023-10-08 19:28:08,803][19739] Avg episode reward: [(0, '1079.870'), (1, '921.290')] +[2023-10-08 19:28:11,706][21194] Updated weights for policy 1, policy_version 91330 (0.0009) +[2023-10-08 19:28:12,078][21194] Updated weights for policy 1, policy_version 91340 (0.0010) +[2023-10-08 19:28:12,432][21194] Updated weights for policy 1, policy_version 91350 (0.0008) +[2023-10-08 19:28:12,500][21195] Updated weights for policy 0, policy_version 92040 (0.0010) +[2023-10-08 19:28:12,797][21194] Updated weights for policy 1, policy_version 91360 (0.0009) +[2023-10-08 19:28:12,869][21195] Updated weights for policy 0, policy_version 92050 (0.0009) +[2023-10-08 19:28:13,226][21195] Updated weights for policy 0, policy_version 92060 (0.0009) +[2023-10-08 19:28:13,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 187826176. Throughput: 0: 1718.2, 1: 1700.3. Samples: 46960196. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:13,803][19739] Avg episode reward: [(0, '1079.870'), (1, '921.290')] +[2023-10-08 19:28:16,696][21194] Updated weights for policy 1, policy_version 91370 (0.0007) +[2023-10-08 19:28:17,062][21194] Updated weights for policy 1, policy_version 91380 (0.0007) +[2023-10-08 19:28:17,188][21195] Updated weights for policy 0, policy_version 92070 (0.0007) +[2023-10-08 19:28:17,419][21194] Updated weights for policy 1, policy_version 91390 (0.0007) +[2023-10-08 19:28:17,547][21195] Updated weights for policy 0, policy_version 92080 (0.0007) +[2023-10-08 19:28:17,928][21195] Updated weights for policy 0, policy_version 92090 (0.0010) +[2023-10-08 19:28:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 187891712. Throughput: 0: 1703.4, 1: 1730.3. Samples: 46976164. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:18,803][19739] Avg episode reward: [(0, '1064.130'), (1, '921.290')] +[2023-10-08 19:28:21,509][21194] Updated weights for policy 1, policy_version 91400 (0.0009) +[2023-10-08 19:28:21,722][21195] Updated weights for policy 0, policy_version 92100 (0.0007) +[2023-10-08 19:28:21,867][21194] Updated weights for policy 1, policy_version 91410 (0.0009) +[2023-10-08 19:28:22,084][21195] Updated weights for policy 0, policy_version 92110 (0.0010) +[2023-10-08 19:28:22,236][21194] Updated weights for policy 1, policy_version 91420 (0.0008) +[2023-10-08 19:28:22,453][21195] Updated weights for policy 0, policy_version 92120 (0.0009) +[2023-10-08 19:28:23,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 187957248. Throughput: 0: 1729.7, 1: 1715.3. Samples: 46991900. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:23,803][19739] Avg episode reward: [(0, '1064.130'), (1, '921.290')] +[2023-10-08 19:28:26,259][21194] Updated weights for policy 1, policy_version 91430 (0.0008) +[2023-10-08 19:28:26,515][21195] Updated weights for policy 0, policy_version 92130 (0.0008) +[2023-10-08 19:28:26,623][21194] Updated weights for policy 1, policy_version 91440 (0.0008) +[2023-10-08 19:28:26,903][21195] Updated weights for policy 0, policy_version 92140 (0.0007) +[2023-10-08 19:28:26,995][21194] Updated weights for policy 1, policy_version 91450 (0.0008) +[2023-10-08 19:28:27,271][21195] Updated weights for policy 0, policy_version 92150 (0.0008) +[2023-10-08 19:28:27,648][21195] Updated weights for policy 0, policy_version 92160 (0.0008) +[2023-10-08 19:28:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 188022784. Throughput: 0: 1709.3, 1: 1701.1. Samples: 47011504. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:28,803][19739] Avg episode reward: [(0, '1064.130'), (1, '913.320')] +[2023-10-08 19:28:31,024][21194] Updated weights for policy 1, policy_version 91460 (0.0009) +[2023-10-08 19:28:31,389][21194] Updated weights for policy 1, policy_version 91470 (0.0007) +[2023-10-08 19:28:31,470][21195] Updated weights for policy 0, policy_version 92170 (0.0007) +[2023-10-08 19:28:31,750][21194] Updated weights for policy 1, policy_version 91480 (0.0007) +[2023-10-08 19:28:31,838][21195] Updated weights for policy 0, policy_version 92180 (0.0008) +[2023-10-08 19:28:32,204][21195] Updated weights for policy 0, policy_version 92190 (0.0008) +[2023-10-08 19:28:33,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 188088320. Throughput: 0: 1721.2, 1: 1720.1. Samples: 47028132. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:33,803][19739] Avg episode reward: [(0, '1064.130'), (1, '898.180')] +[2023-10-08 19:28:35,693][21194] Updated weights for policy 1, policy_version 91490 (0.0009) +[2023-10-08 19:28:36,057][21194] Updated weights for policy 1, policy_version 91500 (0.0008) +[2023-10-08 19:28:36,334][21195] Updated weights for policy 0, policy_version 92200 (0.0008) +[2023-10-08 19:28:36,428][21194] Updated weights for policy 1, policy_version 91510 (0.0007) +[2023-10-08 19:28:36,697][21195] Updated weights for policy 0, policy_version 92210 (0.0007) +[2023-10-08 19:28:36,793][21194] Updated weights for policy 1, policy_version 91520 (0.0008) +[2023-10-08 19:28:37,074][21195] Updated weights for policy 0, policy_version 92220 (0.0009) +[2023-10-08 19:28:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 188153856. Throughput: 0: 1729.3, 1: 1700.1. Samples: 47042998. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:38,803][19739] Avg episode reward: [(0, '1064.130'), (1, '867.810')] +[2023-10-08 19:28:40,766][21194] Updated weights for policy 1, policy_version 91530 (0.0009) +[2023-10-08 19:28:41,003][21195] Updated weights for policy 0, policy_version 92230 (0.0008) +[2023-10-08 19:28:41,123][21194] Updated weights for policy 1, policy_version 91540 (0.0009) +[2023-10-08 19:28:41,369][21195] Updated weights for policy 0, policy_version 92240 (0.0007) +[2023-10-08 19:28:41,490][21194] Updated weights for policy 1, policy_version 91550 (0.0007) +[2023-10-08 19:28:41,734][21195] Updated weights for policy 0, policy_version 92250 (0.0009) +[2023-10-08 19:28:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 188219392. Throughput: 0: 1717.5, 1: 1711.2. Samples: 47063860. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:43,803][19739] Avg episode reward: [(0, '1064.130'), (1, '866.410')] +[2023-10-08 19:28:45,480][21194] Updated weights for policy 1, policy_version 91560 (0.0007) +[2023-10-08 19:28:45,663][21195] Updated weights for policy 0, policy_version 92260 (0.0009) +[2023-10-08 19:28:45,857][21194] Updated weights for policy 1, policy_version 91570 (0.0008) +[2023-10-08 19:28:46,023][21195] Updated weights for policy 0, policy_version 92270 (0.0007) +[2023-10-08 19:28:46,216][21194] Updated weights for policy 1, policy_version 91580 (0.0007) +[2023-10-08 19:28:46,396][21195] Updated weights for policy 0, policy_version 92280 (0.0009) +[2023-10-08 19:28:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 188284928. Throughput: 0: 1743.9, 1: 1711.8. Samples: 47079668. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:48,803][19739] Avg episode reward: [(0, '1064.180'), (1, '850.940')] +[2023-10-08 19:28:50,127][21194] Updated weights for policy 1, policy_version 91590 (0.0007) +[2023-10-08 19:28:50,267][21195] Updated weights for policy 0, policy_version 92290 (0.0007) +[2023-10-08 19:28:50,497][21194] Updated weights for policy 1, policy_version 91600 (0.0011) +[2023-10-08 19:28:50,639][21195] Updated weights for policy 0, policy_version 92300 (0.0007) +[2023-10-08 19:28:50,855][21194] Updated weights for policy 1, policy_version 91610 (0.0008) +[2023-10-08 19:28:51,001][21195] Updated weights for policy 0, policy_version 92310 (0.0009) +[2023-10-08 19:28:51,362][21195] Updated weights for policy 0, policy_version 92320 (0.0009) +[2023-10-08 19:28:53,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 188350464. Throughput: 0: 1719.0, 1: 1696.0. Samples: 47094432. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:53,804][19739] Avg episode reward: [(0, '1064.180'), (1, '850.940')] +[2023-10-08 19:28:54,876][21194] Updated weights for policy 1, policy_version 91620 (0.0008) +[2023-10-08 19:28:55,241][21194] Updated weights for policy 1, policy_version 91630 (0.0007) +[2023-10-08 19:28:55,327][21195] Updated weights for policy 0, policy_version 92330 (0.0008) +[2023-10-08 19:28:55,597][21194] Updated weights for policy 1, policy_version 91640 (0.0008) +[2023-10-08 19:28:55,692][21195] Updated weights for policy 0, policy_version 92340 (0.0008) +[2023-10-08 19:28:56,059][21195] Updated weights for policy 0, policy_version 92350 (0.0008) +[2023-10-08 19:28:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 188416000. Throughput: 0: 1734.6, 1: 1725.2. Samples: 47115884. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:28:58,804][19739] Avg episode reward: [(0, '1055.000'), (1, '850.940')] +[2023-10-08 19:28:59,426][21194] Updated weights for policy 1, policy_version 91650 (0.0010) +[2023-10-08 19:28:59,783][21194] Updated weights for policy 1, policy_version 91660 (0.0009) +[2023-10-08 19:28:59,912][21195] Updated weights for policy 0, policy_version 92360 (0.0009) +[2023-10-08 19:29:00,156][21194] Updated weights for policy 1, policy_version 91670 (0.0010) +[2023-10-08 19:29:00,281][21195] Updated weights for policy 0, policy_version 92370 (0.0008) +[2023-10-08 19:29:00,515][21194] Updated weights for policy 1, policy_version 91680 (0.0008) +[2023-10-08 19:29:00,654][21195] Updated weights for policy 0, policy_version 92380 (0.0007) +[2023-10-08 19:29:03,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 188481536. Throughput: 0: 1753.5, 1: 1694.8. Samples: 47131338. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:29:03,803][19739] Avg episode reward: [(0, '1055.170'), (1, '866.040')] +[2023-10-08 19:29:04,474][21194] Updated weights for policy 1, policy_version 91690 (0.0008) +[2023-10-08 19:29:04,498][21195] Updated weights for policy 0, policy_version 92390 (0.0007) +[2023-10-08 19:29:04,830][21194] Updated weights for policy 1, policy_version 91700 (0.0008) +[2023-10-08 19:29:04,861][21195] Updated weights for policy 0, policy_version 92400 (0.0007) +[2023-10-08 19:29:05,198][21194] Updated weights for policy 1, policy_version 91710 (0.0009) +[2023-10-08 19:29:05,233][21195] Updated weights for policy 0, policy_version 92410 (0.0008) +[2023-10-08 19:29:08,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 188547072. Throughput: 0: 1725.3, 1: 1716.4. Samples: 47146778. Policy #0 lag: (min: 23.0, avg: 26.2, max: 55.0) +[2023-10-08 19:29:08,803][19739] Avg episode reward: [(0, '1055.170'), (1, '866.040')] +[2023-10-08 19:29:09,098][21195] Updated weights for policy 0, policy_version 92420 (0.0009) +[2023-10-08 19:29:09,291][21194] Updated weights for policy 1, policy_version 91720 (0.0007) +[2023-10-08 19:29:09,468][21195] Updated weights for policy 0, policy_version 92430 (0.0008) +[2023-10-08 19:29:09,653][21194] Updated weights for policy 1, policy_version 91730 (0.0009) +[2023-10-08 19:29:09,844][21195] Updated weights for policy 0, policy_version 92440 (0.0009) +[2023-10-08 19:29:10,016][21194] Updated weights for policy 1, policy_version 91740 (0.0008) +[2023-10-08 19:29:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 188612608. Throughput: 0: 1747.6, 1: 1726.5. Samples: 47167840. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:13,803][19739] Avg episode reward: [(0, '1055.170'), (1, '866.040')] +[2023-10-08 19:29:14,000][21195] Updated weights for policy 0, policy_version 92450 (0.0009) +[2023-10-08 19:29:14,053][21194] Updated weights for policy 1, policy_version 91750 (0.0008) +[2023-10-08 19:29:14,397][21195] Updated weights for policy 0, policy_version 92460 (0.0007) +[2023-10-08 19:29:14,413][21194] Updated weights for policy 1, policy_version 91760 (0.0009) +[2023-10-08 19:29:14,762][21195] Updated weights for policy 0, policy_version 92470 (0.0008) +[2023-10-08 19:29:14,785][21194] Updated weights for policy 1, policy_version 91770 (0.0009) +[2023-10-08 19:29:14,999][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000091776_93978624.pth... +[2023-10-08 19:29:15,033][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000090144_92307456.pth +[2023-10-08 19:29:15,136][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000092480_94699520.pth... +[2023-10-08 19:29:15,140][21195] Updated weights for policy 0, policy_version 92480 (0.0009) +[2023-10-08 19:29:15,172][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000090848_93028352.pth +[2023-10-08 19:29:18,553][21194] Updated weights for policy 1, policy_version 91780 (0.0008) +[2023-10-08 19:29:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 188678144. Throughput: 0: 1732.0, 1: 1705.3. Samples: 47182814. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:18,803][19739] Avg episode reward: [(0, '1055.170'), (1, '866.040')] +[2023-10-08 19:29:18,919][21194] Updated weights for policy 1, policy_version 91790 (0.0010) +[2023-10-08 19:29:19,103][21195] Updated weights for policy 0, policy_version 92490 (0.0008) +[2023-10-08 19:29:19,289][21194] Updated weights for policy 1, policy_version 91800 (0.0008) +[2023-10-08 19:29:19,479][21195] Updated weights for policy 0, policy_version 92500 (0.0008) +[2023-10-08 19:29:19,841][21195] Updated weights for policy 0, policy_version 92510 (0.0010) +[2023-10-08 19:29:23,130][21194] Updated weights for policy 1, policy_version 91810 (0.0008) +[2023-10-08 19:29:23,492][21194] Updated weights for policy 1, policy_version 91820 (0.0009) +[2023-10-08 19:29:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 188743680. Throughput: 0: 1721.0, 1: 1733.9. Samples: 47198468. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:23,803][19739] Avg episode reward: [(0, '1055.170'), (1, '866.040')] +[2023-10-08 19:29:23,840][21195] Updated weights for policy 0, policy_version 92520 (0.0008) +[2023-10-08 19:29:23,857][21194] Updated weights for policy 1, policy_version 91830 (0.0010) +[2023-10-08 19:29:24,213][21194] Updated weights for policy 1, policy_version 91840 (0.0009) +[2023-10-08 19:29:24,214][21195] Updated weights for policy 0, policy_version 92530 (0.0008) +[2023-10-08 19:29:24,584][21195] Updated weights for policy 0, policy_version 92540 (0.0007) +[2023-10-08 19:29:28,179][21194] Updated weights for policy 1, policy_version 91850 (0.0008) +[2023-10-08 19:29:28,376][21195] Updated weights for policy 0, policy_version 92550 (0.0008) +[2023-10-08 19:29:28,551][21194] Updated weights for policy 1, policy_version 91860 (0.0008) +[2023-10-08 19:29:28,750][21195] Updated weights for policy 0, policy_version 92560 (0.0008) +[2023-10-08 19:29:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 188809216. Throughput: 0: 1733.8, 1: 1726.0. Samples: 47219550. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:28,803][19739] Avg episode reward: [(0, '1055.170'), (1, '882.510')] +[2023-10-08 19:29:28,921][21194] Updated weights for policy 1, policy_version 91870 (0.0008) +[2023-10-08 19:29:29,112][21195] Updated weights for policy 0, policy_version 92570 (0.0009) +[2023-10-08 19:29:32,993][21195] Updated weights for policy 0, policy_version 92580 (0.0008) +[2023-10-08 19:29:33,192][21194] Updated weights for policy 1, policy_version 91880 (0.0007) +[2023-10-08 19:29:33,368][21195] Updated weights for policy 0, policy_version 92590 (0.0008) +[2023-10-08 19:29:33,570][21194] Updated weights for policy 1, policy_version 91890 (0.0008) +[2023-10-08 19:29:33,738][21195] Updated weights for policy 0, policy_version 92600 (0.0007) +[2023-10-08 19:29:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 188874752. Throughput: 0: 1712.4, 1: 1719.3. Samples: 47234098. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:33,803][19739] Avg episode reward: [(0, '1055.170'), (1, '882.510')] +[2023-10-08 19:29:33,925][21194] Updated weights for policy 1, policy_version 91900 (0.0010) +[2023-10-08 19:29:37,562][21195] Updated weights for policy 0, policy_version 92610 (0.0007) +[2023-10-08 19:29:37,927][21195] Updated weights for policy 0, policy_version 92620 (0.0010) +[2023-10-08 19:29:37,985][21194] Updated weights for policy 1, policy_version 91910 (0.0008) +[2023-10-08 19:29:38,296][21195] Updated weights for policy 0, policy_version 92630 (0.0008) +[2023-10-08 19:29:38,347][21194] Updated weights for policy 1, policy_version 91920 (0.0008) +[2023-10-08 19:29:38,661][21195] Updated weights for policy 0, policy_version 92640 (0.0008) +[2023-10-08 19:29:38,717][21194] Updated weights for policy 1, policy_version 91930 (0.0008) +[2023-10-08 19:29:38,803][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 188973056. Throughput: 0: 1739.4, 1: 1728.9. Samples: 47250506. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:38,803][19739] Avg episode reward: [(0, '1055.170'), (1, '882.510')] +[2023-10-08 19:29:42,441][21194] Updated weights for policy 1, policy_version 91940 (0.0010) +[2023-10-08 19:29:42,782][21195] Updated weights for policy 0, policy_version 92650 (0.0007) +[2023-10-08 19:29:42,796][21194] Updated weights for policy 1, policy_version 91950 (0.0010) +[2023-10-08 19:29:43,149][21195] Updated weights for policy 0, policy_version 92660 (0.0008) +[2023-10-08 19:29:43,168][21194] Updated weights for policy 1, policy_version 91960 (0.0007) +[2023-10-08 19:29:43,521][21195] Updated weights for policy 0, policy_version 92670 (0.0008) +[2023-10-08 19:29:43,802][19739] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 189071360. Throughput: 0: 1724.1, 1: 1715.9. Samples: 47270684. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:43,803][19739] Avg episode reward: [(0, '1055.170'), (1, '882.510')] +[2023-10-08 19:29:47,121][21194] Updated weights for policy 1, policy_version 91970 (0.0007) +[2023-10-08 19:29:47,489][21194] Updated weights for policy 1, policy_version 91980 (0.0010) +[2023-10-08 19:29:47,528][21195] Updated weights for policy 0, policy_version 92680 (0.0007) +[2023-10-08 19:29:47,853][21194] Updated weights for policy 1, policy_version 91990 (0.0008) +[2023-10-08 19:29:47,907][21195] Updated weights for policy 0, policy_version 92690 (0.0008) +[2023-10-08 19:29:48,220][21194] Updated weights for policy 1, policy_version 92000 (0.0008) +[2023-10-08 19:29:48,266][21195] Updated weights for policy 0, policy_version 92700 (0.0008) +[2023-10-08 19:29:48,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 189136896. Throughput: 0: 1699.9, 1: 1732.4. Samples: 47285790. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:48,804][19739] Avg episode reward: [(0, '1055.170'), (1, '882.510')] +[2023-10-08 19:29:52,135][21194] Updated weights for policy 1, policy_version 92010 (0.0007) +[2023-10-08 19:29:52,210][21195] Updated weights for policy 0, policy_version 92710 (0.0009) +[2023-10-08 19:29:52,490][21194] Updated weights for policy 1, policy_version 92020 (0.0008) +[2023-10-08 19:29:52,570][21195] Updated weights for policy 0, policy_version 92720 (0.0008) +[2023-10-08 19:29:52,853][21194] Updated weights for policy 1, policy_version 92030 (0.0007) +[2023-10-08 19:29:52,947][21195] Updated weights for policy 0, policy_version 92730 (0.0008) +[2023-10-08 19:29:53,803][19739] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 189202432. Throughput: 0: 1731.6, 1: 1719.5. Samples: 47302080. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:53,804][19739] Avg episode reward: [(0, '1055.170'), (1, '882.640')] +[2023-10-08 19:29:56,920][21195] Updated weights for policy 0, policy_version 92740 (0.0009) +[2023-10-08 19:29:56,963][21194] Updated weights for policy 1, policy_version 92040 (0.0007) +[2023-10-08 19:29:57,281][21195] Updated weights for policy 0, policy_version 92750 (0.0009) +[2023-10-08 19:29:57,333][21194] Updated weights for policy 1, policy_version 92050 (0.0007) +[2023-10-08 19:29:57,650][21195] Updated weights for policy 0, policy_version 92760 (0.0007) +[2023-10-08 19:29:57,693][21194] Updated weights for policy 1, policy_version 92060 (0.0009) +[2023-10-08 19:29:58,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 189267968. Throughput: 0: 1713.3, 1: 1698.4. Samples: 47321368. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:29:58,803][19739] Avg episode reward: [(0, '1055.170'), (1, '882.640')] +[2023-10-08 19:30:01,627][21194] Updated weights for policy 1, policy_version 92070 (0.0007) +[2023-10-08 19:30:01,715][21195] Updated weights for policy 0, policy_version 92770 (0.0009) +[2023-10-08 19:30:01,991][21194] Updated weights for policy 1, policy_version 92080 (0.0007) +[2023-10-08 19:30:02,113][21195] Updated weights for policy 0, policy_version 92780 (0.0008) +[2023-10-08 19:30:02,348][21194] Updated weights for policy 1, policy_version 92090 (0.0007) +[2023-10-08 19:30:02,488][21195] Updated weights for policy 0, policy_version 92790 (0.0008) +[2023-10-08 19:30:02,854][21195] Updated weights for policy 0, policy_version 92800 (0.0010) +[2023-10-08 19:30:03,803][19739] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 189333504. Throughput: 0: 1712.6, 1: 1724.8. Samples: 47337494. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 19:30:03,803][19739] Avg episode reward: [(0, '1069.020'), (1, '882.640')] +[2023-10-08 19:30:06,398][21194] Updated weights for policy 1, policy_version 92100 (0.0010) +[2023-10-08 19:30:06,693][21195] Updated weights for policy 0, policy_version 92810 (0.0008) +[2023-10-08 19:30:06,768][21194] Updated weights for policy 1, policy_version 92110 (0.0007) +[2023-10-08 19:30:07,068][21195] Updated weights for policy 0, policy_version 92820 (0.0008) +[2023-10-08 19:30:07,132][21194] Updated weights for policy 1, policy_version 92120 (0.0009) +[2023-10-08 19:30:07,437][21195] Updated weights for policy 0, policy_version 92830 (0.0008) +[2023-10-08 19:30:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 189399040. Throughput: 0: 1729.1, 1: 1704.0. Samples: 47352956. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:08,803][19739] Avg episode reward: [(0, '1069.270'), (1, '863.660')] +[2023-10-08 19:30:11,232][21194] Updated weights for policy 1, policy_version 92130 (0.0009) +[2023-10-08 19:30:11,239][21195] Updated weights for policy 0, policy_version 92840 (0.0008) +[2023-10-08 19:30:11,598][21194] Updated weights for policy 1, policy_version 92140 (0.0007) +[2023-10-08 19:30:11,611][21195] Updated weights for policy 0, policy_version 92850 (0.0008) +[2023-10-08 19:30:11,973][21195] Updated weights for policy 0, policy_version 92860 (0.0009) +[2023-10-08 19:30:11,973][21194] Updated weights for policy 1, policy_version 92150 (0.0009) +[2023-10-08 19:30:12,335][21194] Updated weights for policy 1, policy_version 92160 (0.0009) +[2023-10-08 19:30:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 189464576. Throughput: 0: 1713.9, 1: 1696.7. Samples: 47373024. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:13,803][19739] Avg episode reward: [(0, '1069.270'), (1, '863.660')] +[2023-10-08 19:30:15,878][21195] Updated weights for policy 0, policy_version 92870 (0.0010) +[2023-10-08 19:30:16,247][21195] Updated weights for policy 0, policy_version 92880 (0.0010) +[2023-10-08 19:30:16,324][21194] Updated weights for policy 1, policy_version 92170 (0.0007) +[2023-10-08 19:30:16,610][21195] Updated weights for policy 0, policy_version 92890 (0.0007) +[2023-10-08 19:30:16,690][21194] Updated weights for policy 1, policy_version 92180 (0.0007) +[2023-10-08 19:30:17,053][21194] Updated weights for policy 1, policy_version 92190 (0.0007) +[2023-10-08 19:30:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 189530112. Throughput: 0: 1745.5, 1: 1723.6. Samples: 47390204. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:18,803][19739] Avg episode reward: [(0, '1069.340'), (1, '863.040')] +[2023-10-08 19:30:20,468][21195] Updated weights for policy 0, policy_version 92900 (0.0009) +[2023-10-08 19:30:20,831][21194] Updated weights for policy 1, policy_version 92200 (0.0009) +[2023-10-08 19:30:20,835][21195] Updated weights for policy 0, policy_version 92910 (0.0008) +[2023-10-08 19:30:21,201][21195] Updated weights for policy 0, policy_version 92920 (0.0007) +[2023-10-08 19:30:21,204][21194] Updated weights for policy 1, policy_version 92210 (0.0009) +[2023-10-08 19:30:21,573][21194] Updated weights for policy 1, policy_version 92220 (0.0007) +[2023-10-08 19:30:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 189595648. Throughput: 0: 1720.2, 1: 1702.6. Samples: 47404534. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:23,803][19739] Avg episode reward: [(0, '1069.550'), (1, '862.730')] +[2023-10-08 19:30:25,092][21195] Updated weights for policy 0, policy_version 92930 (0.0008) +[2023-10-08 19:30:25,457][21195] Updated weights for policy 0, policy_version 92940 (0.0009) +[2023-10-08 19:30:25,586][21194] Updated weights for policy 1, policy_version 92230 (0.0009) +[2023-10-08 19:30:25,823][21195] Updated weights for policy 0, policy_version 92950 (0.0008) +[2023-10-08 19:30:25,953][21194] Updated weights for policy 1, policy_version 92240 (0.0008) +[2023-10-08 19:30:26,196][21195] Updated weights for policy 0, policy_version 92960 (0.0009) +[2023-10-08 19:30:26,313][21194] Updated weights for policy 1, policy_version 92250 (0.0009) +[2023-10-08 19:30:28,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 189661184. Throughput: 0: 1738.4, 1: 1716.8. Samples: 47426170. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:28,803][19739] Avg episode reward: [(0, '1069.550'), (1, '862.550')] +[2023-10-08 19:30:30,072][21195] Updated weights for policy 0, policy_version 92970 (0.0010) +[2023-10-08 19:30:30,278][21194] Updated weights for policy 1, policy_version 92260 (0.0007) +[2023-10-08 19:30:30,448][21195] Updated weights for policy 0, policy_version 92980 (0.0009) +[2023-10-08 19:30:30,643][21194] Updated weights for policy 1, policy_version 92270 (0.0010) +[2023-10-08 19:30:30,818][21195] Updated weights for policy 0, policy_version 92990 (0.0008) +[2023-10-08 19:30:31,006][21194] Updated weights for policy 1, policy_version 92280 (0.0010) +[2023-10-08 19:30:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 189726720. Throughput: 0: 1759.0, 1: 1710.0. Samples: 47441894. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:33,803][19739] Avg episode reward: [(0, '1071.160'), (1, '847.820')] +[2023-10-08 19:30:34,624][21195] Updated weights for policy 0, policy_version 93000 (0.0008) +[2023-10-08 19:30:34,811][21194] Updated weights for policy 1, policy_version 92290 (0.0009) +[2023-10-08 19:30:34,982][21195] Updated weights for policy 0, policy_version 93010 (0.0007) +[2023-10-08 19:30:35,167][21194] Updated weights for policy 1, policy_version 92300 (0.0009) +[2023-10-08 19:30:35,344][21195] Updated weights for policy 0, policy_version 93020 (0.0010) +[2023-10-08 19:30:35,541][21194] Updated weights for policy 1, policy_version 92310 (0.0008) +[2023-10-08 19:30:35,905][21194] Updated weights for policy 1, policy_version 92320 (0.0009) +[2023-10-08 19:30:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 189792256. Throughput: 0: 1728.6, 1: 1711.7. Samples: 47456894. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:38,803][19739] Avg episode reward: [(0, '1071.160'), (1, '833.280')] +[2023-10-08 19:30:39,077][21195] Updated weights for policy 0, policy_version 93030 (0.0007) +[2023-10-08 19:30:39,444][21195] Updated weights for policy 0, policy_version 93040 (0.0009) +[2023-10-08 19:30:39,812][21195] Updated weights for policy 0, policy_version 93050 (0.0008) +[2023-10-08 19:30:39,948][21194] Updated weights for policy 1, policy_version 92330 (0.0008) +[2023-10-08 19:30:40,314][21194] Updated weights for policy 1, policy_version 92340 (0.0008) +[2023-10-08 19:30:40,675][21194] Updated weights for policy 1, policy_version 92350 (0.0007) +[2023-10-08 19:30:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 189857792. Throughput: 0: 1753.0, 1: 1734.8. Samples: 47478320. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:43,803][19739] Avg episode reward: [(0, '1071.160'), (1, '817.770')] +[2023-10-08 19:30:43,816][21195] Updated weights for policy 0, policy_version 93060 (0.0010) +[2023-10-08 19:30:44,183][21195] Updated weights for policy 0, policy_version 93070 (0.0011) +[2023-10-08 19:30:44,556][21195] Updated weights for policy 0, policy_version 93080 (0.0008) +[2023-10-08 19:30:44,574][21194] Updated weights for policy 1, policy_version 92360 (0.0009) +[2023-10-08 19:30:44,939][21194] Updated weights for policy 1, policy_version 92370 (0.0008) +[2023-10-08 19:30:45,303][21194] Updated weights for policy 1, policy_version 92380 (0.0011) +[2023-10-08 19:30:48,486][21195] Updated weights for policy 0, policy_version 93090 (0.0008) +[2023-10-08 19:30:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 189923328. Throughput: 0: 1754.4, 1: 1707.7. Samples: 47493290. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:48,803][19739] Avg episode reward: [(0, '1071.160'), (1, '818.400')] +[2023-10-08 19:30:48,868][21195] Updated weights for policy 0, policy_version 93100 (0.0007) +[2023-10-08 19:30:49,230][21195] Updated weights for policy 0, policy_version 93110 (0.0009) +[2023-10-08 19:30:49,331][21194] Updated weights for policy 1, policy_version 92390 (0.0010) +[2023-10-08 19:30:49,599][21195] Updated weights for policy 0, policy_version 93120 (0.0007) +[2023-10-08 19:30:49,699][21194] Updated weights for policy 1, policy_version 92400 (0.0008) +[2023-10-08 19:30:50,069][21194] Updated weights for policy 1, policy_version 92410 (0.0010) +[2023-10-08 19:30:53,612][21195] Updated weights for policy 0, policy_version 93130 (0.0007) +[2023-10-08 19:30:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.3, 300 sec: 13773.7). Total num frames: 189988864. Throughput: 0: 1744.9, 1: 1716.3. Samples: 47508712. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:53,803][19739] Avg episode reward: [(0, '1071.160'), (1, '816.770')] +[2023-10-08 19:30:53,984][21195] Updated weights for policy 0, policy_version 93140 (0.0007) +[2023-10-08 19:30:54,137][21194] Updated weights for policy 1, policy_version 92420 (0.0009) +[2023-10-08 19:30:54,357][21195] Updated weights for policy 0, policy_version 93150 (0.0010) +[2023-10-08 19:30:54,501][21194] Updated weights for policy 1, policy_version 92430 (0.0008) +[2023-10-08 19:30:54,859][21194] Updated weights for policy 1, policy_version 92440 (0.0009) +[2023-10-08 19:30:58,296][21195] Updated weights for policy 0, policy_version 93160 (0.0011) +[2023-10-08 19:30:58,668][21195] Updated weights for policy 0, policy_version 93170 (0.0011) +[2023-10-08 19:30:58,668][21194] Updated weights for policy 1, policy_version 92450 (0.0007) +[2023-10-08 19:30:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 190054400. Throughput: 0: 1761.2, 1: 1730.5. Samples: 47530154. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:30:58,803][19739] Avg episode reward: [(0, '1071.160'), (1, '824.760')] +[2023-10-08 19:30:59,033][21195] Updated weights for policy 0, policy_version 93180 (0.0009) +[2023-10-08 19:30:59,033][21194] Updated weights for policy 1, policy_version 92460 (0.0009) +[2023-10-08 19:30:59,397][21194] Updated weights for policy 1, policy_version 92470 (0.0008) +[2023-10-08 19:30:59,755][21194] Updated weights for policy 1, policy_version 92480 (0.0010) +[2023-10-08 19:31:02,900][21195] Updated weights for policy 0, policy_version 93190 (0.0009) +[2023-10-08 19:31:03,265][21195] Updated weights for policy 0, policy_version 93200 (0.0008) +[2023-10-08 19:31:03,641][21195] Updated weights for policy 0, policy_version 93210 (0.0007) +[2023-10-08 19:31:03,788][21194] Updated weights for policy 1, policy_version 92490 (0.0008) +[2023-10-08 19:31:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 190119936. Throughput: 0: 1725.1, 1: 1699.2. Samples: 47544294. Policy #0 lag: (min: 21.0, avg: 22.5, max: 47.0) +[2023-10-08 19:31:03,803][19739] Avg episode reward: [(0, '1071.210'), (1, '824.930')] +[2023-10-08 19:31:04,151][21194] Updated weights for policy 1, policy_version 92500 (0.0011) +[2023-10-08 19:31:04,526][21194] Updated weights for policy 1, policy_version 92510 (0.0008) +[2023-10-08 19:31:07,396][21195] Updated weights for policy 0, policy_version 93220 (0.0009) +[2023-10-08 19:31:07,764][21195] Updated weights for policy 0, policy_version 93230 (0.0009) +[2023-10-08 19:31:08,139][21195] Updated weights for policy 0, policy_version 93240 (0.0008) +[2023-10-08 19:31:08,658][21194] Updated weights for policy 1, policy_version 92520 (0.0009) +[2023-10-08 19:31:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 190218240. Throughput: 0: 1758.8, 1: 1721.9. Samples: 47561162. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:08,803][19739] Avg episode reward: [(0, '1085.180'), (1, '824.930')] +[2023-10-08 19:31:09,020][21194] Updated weights for policy 1, policy_version 92530 (0.0010) +[2023-10-08 19:31:09,387][21194] Updated weights for policy 1, policy_version 92540 (0.0010) +[2023-10-08 19:31:12,213][21195] Updated weights for policy 0, policy_version 93250 (0.0007) +[2023-10-08 19:31:12,575][21195] Updated weights for policy 0, policy_version 93260 (0.0008) +[2023-10-08 19:31:12,943][21195] Updated weights for policy 0, policy_version 93270 (0.0007) +[2023-10-08 19:31:13,310][21195] Updated weights for policy 0, policy_version 93280 (0.0009) +[2023-10-08 19:31:13,378][21194] Updated weights for policy 1, policy_version 92550 (0.0009) +[2023-10-08 19:31:13,745][21194] Updated weights for policy 1, policy_version 92560 (0.0009) +[2023-10-08 19:31:13,803][19739] Fps is (10 sec: 16383.1, 60 sec: 13653.2, 300 sec: 13773.6). Total num frames: 190283776. Throughput: 0: 1737.8, 1: 1717.7. Samples: 47581668. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:13,804][19739] Avg episode reward: [(0, '1085.180'), (1, '838.970')] +[2023-10-08 19:31:13,813][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000093280_95518720.pth... +[2023-10-08 19:31:13,849][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000091648_93847552.pth +[2023-10-08 19:31:14,119][21194] Updated weights for policy 1, policy_version 92570 (0.0008) +[2023-10-08 19:31:14,333][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000092576_94797824.pth... +[2023-10-08 19:31:14,374][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000090944_93126656.pth +[2023-10-08 19:31:17,100][21195] Updated weights for policy 0, policy_version 93290 (0.0011) +[2023-10-08 19:31:17,471][21195] Updated weights for policy 0, policy_version 93300 (0.0009) +[2023-10-08 19:31:17,834][21195] Updated weights for policy 0, policy_version 93310 (0.0010) +[2023-10-08 19:31:17,991][21194] Updated weights for policy 1, policy_version 92580 (0.0008) +[2023-10-08 19:31:18,362][21194] Updated weights for policy 1, policy_version 92590 (0.0008) +[2023-10-08 19:31:18,716][21194] Updated weights for policy 1, policy_version 92600 (0.0011) +[2023-10-08 19:31:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 190349312. Throughput: 0: 1726.7, 1: 1707.6. Samples: 47596436. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:18,803][19739] Avg episode reward: [(0, '1085.180'), (1, '840.630')] +[2023-10-08 19:31:21,617][21195] Updated weights for policy 0, policy_version 93320 (0.0007) +[2023-10-08 19:31:21,988][21195] Updated weights for policy 0, policy_version 93330 (0.0009) +[2023-10-08 19:31:22,366][21195] Updated weights for policy 0, policy_version 93340 (0.0009) +[2023-10-08 19:31:22,831][21194] Updated weights for policy 1, policy_version 92610 (0.0008) +[2023-10-08 19:31:23,198][21194] Updated weights for policy 1, policy_version 92620 (0.0009) +[2023-10-08 19:31:23,568][21194] Updated weights for policy 1, policy_version 92630 (0.0011) +[2023-10-08 19:31:23,802][19739] Fps is (10 sec: 13108.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 190414848. Throughput: 0: 1745.3, 1: 1714.6. Samples: 47612592. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:23,803][19739] Avg episode reward: [(0, '1100.690'), (1, '815.730')] +[2023-10-08 19:31:23,933][21194] Updated weights for policy 1, policy_version 92640 (0.0011) +[2023-10-08 19:31:26,311][21195] Updated weights for policy 0, policy_version 93350 (0.0011) +[2023-10-08 19:31:26,671][21195] Updated weights for policy 0, policy_version 93360 (0.0008) +[2023-10-08 19:31:27,043][21195] Updated weights for policy 0, policy_version 93370 (0.0007) +[2023-10-08 19:31:27,845][21194] Updated weights for policy 1, policy_version 92650 (0.0009) +[2023-10-08 19:31:28,214][21194] Updated weights for policy 1, policy_version 92660 (0.0009) +[2023-10-08 19:31:28,568][21194] Updated weights for policy 1, policy_version 92670 (0.0008) +[2023-10-08 19:31:28,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 190513152. Throughput: 0: 1726.0, 1: 1707.8. Samples: 47632842. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:28,803][19739] Avg episode reward: [(0, '1100.690'), (1, '815.730')] +[2023-10-08 19:31:31,056][21195] Updated weights for policy 0, policy_version 93380 (0.0008) +[2023-10-08 19:31:31,422][21195] Updated weights for policy 0, policy_version 93390 (0.0010) +[2023-10-08 19:31:31,792][21195] Updated weights for policy 0, policy_version 93400 (0.0009) +[2023-10-08 19:31:32,635][21194] Updated weights for policy 1, policy_version 92680 (0.0008) +[2023-10-08 19:31:32,991][21194] Updated weights for policy 1, policy_version 92690 (0.0008) +[2023-10-08 19:31:33,360][21194] Updated weights for policy 1, policy_version 92700 (0.0007) +[2023-10-08 19:31:33,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 190578688. Throughput: 0: 1734.7, 1: 1721.6. Samples: 47648822. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:33,803][19739] Avg episode reward: [(0, '1100.690'), (1, '815.730')] +[2023-10-08 19:31:35,758][21195] Updated weights for policy 0, policy_version 93410 (0.0008) +[2023-10-08 19:31:36,178][21195] Updated weights for policy 0, policy_version 93420 (0.0009) +[2023-10-08 19:31:36,553][21195] Updated weights for policy 0, policy_version 93430 (0.0010) +[2023-10-08 19:31:36,922][21195] Updated weights for policy 0, policy_version 93440 (0.0009) +[2023-10-08 19:31:37,221][21194] Updated weights for policy 1, policy_version 92710 (0.0007) +[2023-10-08 19:31:37,591][21194] Updated weights for policy 1, policy_version 92720 (0.0007) +[2023-10-08 19:31:37,959][21194] Updated weights for policy 1, policy_version 92730 (0.0008) +[2023-10-08 19:31:38,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 190644224. Throughput: 0: 1726.8, 1: 1731.2. Samples: 47664322. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:38,803][19739] Avg episode reward: [(0, '1100.690'), (1, '815.730')] +[2023-10-08 19:31:40,925][21195] Updated weights for policy 0, policy_version 93450 (0.0008) +[2023-10-08 19:31:41,293][21195] Updated weights for policy 0, policy_version 93460 (0.0009) +[2023-10-08 19:31:41,668][21195] Updated weights for policy 0, policy_version 93470 (0.0009) +[2023-10-08 19:31:42,039][21194] Updated weights for policy 1, policy_version 92740 (0.0007) +[2023-10-08 19:31:42,410][21194] Updated weights for policy 1, policy_version 92750 (0.0007) +[2023-10-08 19:31:42,782][21194] Updated weights for policy 1, policy_version 92760 (0.0008) +[2023-10-08 19:31:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 190709760. Throughput: 0: 1721.9, 1: 1704.3. Samples: 47684330. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:43,803][19739] Avg episode reward: [(0, '1116.200'), (1, '788.120')] +[2023-10-08 19:31:45,542][21195] Updated weights for policy 0, policy_version 93480 (0.0008) +[2023-10-08 19:31:45,923][21195] Updated weights for policy 0, policy_version 93490 (0.0009) +[2023-10-08 19:31:46,287][21195] Updated weights for policy 0, policy_version 93500 (0.0010) +[2023-10-08 19:31:46,614][21194] Updated weights for policy 1, policy_version 92770 (0.0009) +[2023-10-08 19:31:46,976][21194] Updated weights for policy 1, policy_version 92780 (0.0010) +[2023-10-08 19:31:47,342][21194] Updated weights for policy 1, policy_version 92790 (0.0009) +[2023-10-08 19:31:47,710][21194] Updated weights for policy 1, policy_version 92800 (0.0010) +[2023-10-08 19:31:48,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 190775296. Throughput: 0: 1746.7, 1: 1730.9. Samples: 47700784. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:48,803][19739] Avg episode reward: [(0, '1116.200'), (1, '788.120')] +[2023-10-08 19:31:50,146][21195] Updated weights for policy 0, policy_version 93510 (0.0009) +[2023-10-08 19:31:50,522][21195] Updated weights for policy 0, policy_version 93520 (0.0009) +[2023-10-08 19:31:50,883][21195] Updated weights for policy 0, policy_version 93530 (0.0010) +[2023-10-08 19:31:51,621][21194] Updated weights for policy 1, policy_version 92810 (0.0009) +[2023-10-08 19:31:51,985][21194] Updated weights for policy 1, policy_version 92820 (0.0009) +[2023-10-08 19:31:52,348][21194] Updated weights for policy 1, policy_version 92830 (0.0008) +[2023-10-08 19:31:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 190840832. Throughput: 0: 1712.0, 1: 1717.2. Samples: 47715476. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:53,803][19739] Avg episode reward: [(0, '1116.200'), (1, '788.120')] +[2023-10-08 19:31:54,851][21195] Updated weights for policy 0, policy_version 93540 (0.0010) +[2023-10-08 19:31:55,223][21195] Updated weights for policy 0, policy_version 93550 (0.0010) +[2023-10-08 19:31:55,589][21195] Updated weights for policy 0, policy_version 93560 (0.0009) +[2023-10-08 19:31:56,224][21194] Updated weights for policy 1, policy_version 92840 (0.0009) +[2023-10-08 19:31:56,603][21194] Updated weights for policy 1, policy_version 92850 (0.0011) +[2023-10-08 19:31:56,961][21194] Updated weights for policy 1, policy_version 92860 (0.0010) +[2023-10-08 19:31:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 190906368. Throughput: 0: 1731.2, 1: 1703.8. Samples: 47736242. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:31:58,803][19739] Avg episode reward: [(0, '1116.200'), (1, '798.260')] +[2023-10-08 19:31:59,477][21195] Updated weights for policy 0, policy_version 93570 (0.0007) +[2023-10-08 19:31:59,853][21195] Updated weights for policy 0, policy_version 93580 (0.0007) +[2023-10-08 19:32:00,224][21195] Updated weights for policy 0, policy_version 93590 (0.0007) +[2023-10-08 19:32:00,586][21195] Updated weights for policy 0, policy_version 93600 (0.0010) +[2023-10-08 19:32:00,786][21194] Updated weights for policy 1, policy_version 92870 (0.0008) +[2023-10-08 19:32:01,165][21194] Updated weights for policy 1, policy_version 92880 (0.0007) +[2023-10-08 19:32:01,528][21194] Updated weights for policy 1, policy_version 92890 (0.0010) +[2023-10-08 19:32:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 190971904. Throughput: 0: 1737.7, 1: 1729.0. Samples: 47752438. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:32:03,803][19739] Avg episode reward: [(0, '1116.200'), (1, '798.260')] +[2023-10-08 19:32:04,570][21195] Updated weights for policy 0, policy_version 93610 (0.0007) +[2023-10-08 19:32:04,934][21195] Updated weights for policy 0, policy_version 93620 (0.0008) +[2023-10-08 19:32:05,298][21195] Updated weights for policy 0, policy_version 93630 (0.0008) +[2023-10-08 19:32:05,506][21194] Updated weights for policy 1, policy_version 92900 (0.0010) +[2023-10-08 19:32:05,877][21194] Updated weights for policy 1, policy_version 92910 (0.0011) +[2023-10-08 19:32:06,244][21194] Updated weights for policy 1, policy_version 92920 (0.0009) +[2023-10-08 19:32:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 191037440. Throughput: 0: 1720.1, 1: 1717.6. Samples: 47767286. Policy #0 lag: (min: 31.0, avg: 38.8, max: 63.0) +[2023-10-08 19:32:08,803][19739] Avg episode reward: [(0, '1100.630'), (1, '783.410')] +[2023-10-08 19:32:09,219][21195] Updated weights for policy 0, policy_version 93640 (0.0007) +[2023-10-08 19:32:09,580][21195] Updated weights for policy 0, policy_version 93650 (0.0007) +[2023-10-08 19:32:09,956][21195] Updated weights for policy 0, policy_version 93660 (0.0010) +[2023-10-08 19:32:10,244][21194] Updated weights for policy 1, policy_version 92930 (0.0012) +[2023-10-08 19:32:10,597][21194] Updated weights for policy 1, policy_version 92940 (0.0010) +[2023-10-08 19:32:10,962][21194] Updated weights for policy 1, policy_version 92950 (0.0007) +[2023-10-08 19:32:11,331][21194] Updated weights for policy 1, policy_version 92960 (0.0008) +[2023-10-08 19:32:13,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 191102976. Throughput: 0: 1735.2, 1: 1730.7. Samples: 47788808. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:13,803][19739] Avg episode reward: [(0, '1100.800'), (1, '783.410')] +[2023-10-08 19:32:13,963][21195] Updated weights for policy 0, policy_version 93670 (0.0007) +[2023-10-08 19:32:14,331][21195] Updated weights for policy 0, policy_version 93680 (0.0008) +[2023-10-08 19:32:14,710][21195] Updated weights for policy 0, policy_version 93690 (0.0007) +[2023-10-08 19:32:15,174][21194] Updated weights for policy 1, policy_version 92970 (0.0009) +[2023-10-08 19:32:15,538][21194] Updated weights for policy 1, policy_version 92980 (0.0010) +[2023-10-08 19:32:15,910][21194] Updated weights for policy 1, policy_version 92990 (0.0008) +[2023-10-08 19:32:18,499][21195] Updated weights for policy 0, policy_version 93700 (0.0008) +[2023-10-08 19:32:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 191168512. Throughput: 0: 1726.5, 1: 1719.6. Samples: 47803900. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:18,804][19739] Avg episode reward: [(0, '1100.800'), (1, '783.410')] +[2023-10-08 19:32:18,875][21195] Updated weights for policy 0, policy_version 93710 (0.0009) +[2023-10-08 19:32:19,237][21195] Updated weights for policy 0, policy_version 93720 (0.0008) +[2023-10-08 19:32:19,920][21194] Updated weights for policy 1, policy_version 93000 (0.0007) +[2023-10-08 19:32:20,287][21194] Updated weights for policy 1, policy_version 93010 (0.0007) +[2023-10-08 19:32:20,638][21194] Updated weights for policy 1, policy_version 93020 (0.0008) +[2023-10-08 19:32:23,109][21195] Updated weights for policy 0, policy_version 93730 (0.0007) +[2023-10-08 19:32:23,482][21195] Updated weights for policy 0, policy_version 93740 (0.0008) +[2023-10-08 19:32:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 191234048. Throughput: 0: 1738.7, 1: 1714.5. Samples: 47819716. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:23,803][19739] Avg episode reward: [(0, '1101.590'), (1, '783.410')] +[2023-10-08 19:32:23,857][21195] Updated weights for policy 0, policy_version 93750 (0.0010) +[2023-10-08 19:32:24,224][21195] Updated weights for policy 0, policy_version 93760 (0.0010) +[2023-10-08 19:32:24,514][21194] Updated weights for policy 1, policy_version 93030 (0.0010) +[2023-10-08 19:32:24,863][21194] Updated weights for policy 1, policy_version 93040 (0.0008) +[2023-10-08 19:32:25,239][21194] Updated weights for policy 1, policy_version 93050 (0.0008) +[2023-10-08 19:32:28,359][21195] Updated weights for policy 0, policy_version 93770 (0.0010) +[2023-10-08 19:32:28,732][21195] Updated weights for policy 0, policy_version 93780 (0.0007) +[2023-10-08 19:32:28,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 191299584. Throughput: 0: 1735.2, 1: 1742.9. Samples: 47840842. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:28,803][19739] Avg episode reward: [(0, '1101.590'), (1, '783.410')] +[2023-10-08 19:32:29,090][21195] Updated weights for policy 0, policy_version 93790 (0.0009) +[2023-10-08 19:32:29,137][21194] Updated weights for policy 1, policy_version 93060 (0.0007) +[2023-10-08 19:32:29,500][21194] Updated weights for policy 1, policy_version 93070 (0.0009) +[2023-10-08 19:32:29,865][21194] Updated weights for policy 1, policy_version 93080 (0.0008) +[2023-10-08 19:32:33,014][21195] Updated weights for policy 0, policy_version 93800 (0.0007) +[2023-10-08 19:32:33,388][21195] Updated weights for policy 0, policy_version 93810 (0.0007) +[2023-10-08 19:32:33,756][21195] Updated weights for policy 0, policy_version 93820 (0.0008) +[2023-10-08 19:32:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 191365120. Throughput: 0: 1714.0, 1: 1715.2. Samples: 47855098. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:33,803][19739] Avg episode reward: [(0, '1101.590'), (1, '778.040')] +[2023-10-08 19:32:33,830][21194] Updated weights for policy 1, policy_version 93090 (0.0007) +[2023-10-08 19:32:34,196][21194] Updated weights for policy 1, policy_version 93100 (0.0009) +[2023-10-08 19:32:34,564][21194] Updated weights for policy 1, policy_version 93110 (0.0009) +[2023-10-08 19:32:34,929][21194] Updated weights for policy 1, policy_version 93120 (0.0007) +[2023-10-08 19:32:37,736][21195] Updated weights for policy 0, policy_version 93830 (0.0009) +[2023-10-08 19:32:38,103][21195] Updated weights for policy 0, policy_version 93840 (0.0010) +[2023-10-08 19:32:38,479][21195] Updated weights for policy 0, policy_version 93850 (0.0008) +[2023-10-08 19:32:38,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 191463424. Throughput: 0: 1744.6, 1: 1729.9. Samples: 47871830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:38,803][19739] Avg episode reward: [(0, '1101.590'), (1, '778.040')] +[2023-10-08 19:32:38,882][21194] Updated weights for policy 1, policy_version 93130 (0.0007) +[2023-10-08 19:32:39,243][21194] Updated weights for policy 1, policy_version 93140 (0.0008) +[2023-10-08 19:32:39,612][21194] Updated weights for policy 1, policy_version 93150 (0.0008) +[2023-10-08 19:32:42,354][21195] Updated weights for policy 0, policy_version 93860 (0.0008) +[2023-10-08 19:32:42,728][21195] Updated weights for policy 0, policy_version 93870 (0.0007) +[2023-10-08 19:32:43,092][21195] Updated weights for policy 0, policy_version 93880 (0.0007) +[2023-10-08 19:32:43,672][21194] Updated weights for policy 1, policy_version 93160 (0.0008) +[2023-10-08 19:32:43,803][19739] Fps is (10 sec: 16383.6, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 191528960. Throughput: 0: 1726.0, 1: 1745.5. Samples: 47892456. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:43,804][19739] Avg episode reward: [(0, '1101.590'), (1, '778.040')] +[2023-10-08 19:32:44,057][21194] Updated weights for policy 1, policy_version 93170 (0.0008) +[2023-10-08 19:32:44,420][21194] Updated weights for policy 1, policy_version 93180 (0.0008) +[2023-10-08 19:32:47,051][21195] Updated weights for policy 0, policy_version 93890 (0.0008) +[2023-10-08 19:32:47,423][21195] Updated weights for policy 0, policy_version 93900 (0.0007) +[2023-10-08 19:32:47,784][21195] Updated weights for policy 0, policy_version 93910 (0.0009) +[2023-10-08 19:32:48,148][21195] Updated weights for policy 0, policy_version 93920 (0.0009) +[2023-10-08 19:32:48,592][21194] Updated weights for policy 1, policy_version 93190 (0.0008) +[2023-10-08 19:32:48,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.8). Total num frames: 191594496. Throughput: 0: 1715.9, 1: 1715.0. Samples: 47906828. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:48,803][19739] Avg episode reward: [(0, '1101.590'), (1, '777.560')] +[2023-10-08 19:32:48,958][21194] Updated weights for policy 1, policy_version 93200 (0.0009) +[2023-10-08 19:32:49,319][21194] Updated weights for policy 1, policy_version 93210 (0.0010) +[2023-10-08 19:32:51,959][21195] Updated weights for policy 0, policy_version 93930 (0.0007) +[2023-10-08 19:32:52,325][21195] Updated weights for policy 0, policy_version 93940 (0.0007) +[2023-10-08 19:32:52,695][21195] Updated weights for policy 0, policy_version 93950 (0.0007) +[2023-10-08 19:32:53,361][21194] Updated weights for policy 1, policy_version 93220 (0.0008) +[2023-10-08 19:32:53,723][21194] Updated weights for policy 1, policy_version 93230 (0.0007) +[2023-10-08 19:32:53,803][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 191660032. Throughput: 0: 1742.9, 1: 1720.2. Samples: 47923124. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:53,803][19739] Avg episode reward: [(0, '1101.590'), (1, '747.010')] +[2023-10-08 19:32:54,091][21194] Updated weights for policy 1, policy_version 93240 (0.0009) +[2023-10-08 19:32:56,416][21195] Updated weights for policy 0, policy_version 93960 (0.0008) +[2023-10-08 19:32:56,792][21195] Updated weights for policy 0, policy_version 93970 (0.0008) +[2023-10-08 19:32:57,160][21195] Updated weights for policy 0, policy_version 93980 (0.0007) +[2023-10-08 19:32:58,203][21194] Updated weights for policy 1, policy_version 93250 (0.0010) +[2023-10-08 19:32:58,568][21194] Updated weights for policy 1, policy_version 93260 (0.0010) +[2023-10-08 19:32:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 191725568. Throughput: 0: 1725.2, 1: 1718.5. Samples: 47943772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:32:58,803][19739] Avg episode reward: [(0, '1117.080'), (1, '752.650')] +[2023-10-08 19:32:58,933][21194] Updated weights for policy 1, policy_version 93270 (0.0009) +[2023-10-08 19:32:59,304][21194] Updated weights for policy 1, policy_version 93280 (0.0010) +[2023-10-08 19:33:01,056][21195] Updated weights for policy 0, policy_version 93990 (0.0008) +[2023-10-08 19:33:01,421][21195] Updated weights for policy 0, policy_version 94000 (0.0008) +[2023-10-08 19:33:01,779][21195] Updated weights for policy 0, policy_version 94010 (0.0008) +[2023-10-08 19:33:03,204][21194] Updated weights for policy 1, policy_version 93290 (0.0009) +[2023-10-08 19:33:03,565][21194] Updated weights for policy 1, policy_version 93300 (0.0008) +[2023-10-08 19:33:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 191791104. Throughput: 0: 1733.4, 1: 1714.8. Samples: 47959072. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:03,803][19739] Avg episode reward: [(0, '1117.080'), (1, '752.650')] +[2023-10-08 19:33:03,942][21194] Updated weights for policy 1, policy_version 93310 (0.0008) +[2023-10-08 19:33:05,694][21195] Updated weights for policy 0, policy_version 94020 (0.0010) +[2023-10-08 19:33:06,060][21195] Updated weights for policy 0, policy_version 94030 (0.0008) +[2023-10-08 19:33:06,425][21195] Updated weights for policy 0, policy_version 94040 (0.0007) +[2023-10-08 19:33:07,978][21194] Updated weights for policy 1, policy_version 93320 (0.0011) +[2023-10-08 19:33:08,343][21194] Updated weights for policy 1, policy_version 93330 (0.0010) +[2023-10-08 19:33:08,712][21194] Updated weights for policy 1, policy_version 93340 (0.0008) +[2023-10-08 19:33:08,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 191856640. Throughput: 0: 1721.7, 1: 1716.1. Samples: 47974418. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:08,803][19739] Avg episode reward: [(0, '1117.080'), (1, '743.650')] +[2023-10-08 19:33:10,365][21195] Updated weights for policy 0, policy_version 94050 (0.0007) +[2023-10-08 19:33:10,781][21195] Updated weights for policy 0, policy_version 94060 (0.0008) +[2023-10-08 19:33:11,147][21195] Updated weights for policy 0, policy_version 94070 (0.0007) +[2023-10-08 19:33:11,521][21195] Updated weights for policy 0, policy_version 94080 (0.0007) +[2023-10-08 19:33:12,588][21194] Updated weights for policy 1, policy_version 93350 (0.0008) +[2023-10-08 19:33:12,941][21194] Updated weights for policy 1, policy_version 93360 (0.0007) +[2023-10-08 19:33:13,317][21194] Updated weights for policy 1, policy_version 93370 (0.0007) +[2023-10-08 19:33:13,803][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 191954944. Throughput: 0: 1730.6, 1: 1699.1. Samples: 47995178. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:13,803][19739] Avg episode reward: [(0, '1120.820'), (1, '743.650')] +[2023-10-08 19:33:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000094080_96337920.pth... +[2023-10-08 19:33:13,812][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000093376_95617024.pth... +[2023-10-08 19:33:13,845][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000091776_93978624.pth +[2023-10-08 19:33:13,851][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000092480_94699520.pth +[2023-10-08 19:33:15,433][21195] Updated weights for policy 0, policy_version 94090 (0.0009) +[2023-10-08 19:33:15,803][21195] Updated weights for policy 0, policy_version 94100 (0.0008) +[2023-10-08 19:33:16,175][21195] Updated weights for policy 0, policy_version 94110 (0.0007) +[2023-10-08 19:33:17,263][21194] Updated weights for policy 1, policy_version 93380 (0.0009) +[2023-10-08 19:33:17,622][21194] Updated weights for policy 1, policy_version 93390 (0.0009) +[2023-10-08 19:33:17,991][21194] Updated weights for policy 1, policy_version 93400 (0.0008) +[2023-10-08 19:33:18,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 192020480. Throughput: 0: 1753.9, 1: 1717.5. Samples: 48011308. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:18,803][19739] Avg episode reward: [(0, '1136.120'), (1, '734.690')] +[2023-10-08 19:33:20,114][21195] Updated weights for policy 0, policy_version 94120 (0.0009) +[2023-10-08 19:33:20,474][21195] Updated weights for policy 0, policy_version 94130 (0.0008) +[2023-10-08 19:33:20,851][21195] Updated weights for policy 0, policy_version 94140 (0.0008) +[2023-10-08 19:33:21,903][21194] Updated weights for policy 1, policy_version 93410 (0.0010) +[2023-10-08 19:33:22,263][21194] Updated weights for policy 1, policy_version 93420 (0.0008) +[2023-10-08 19:33:22,626][21194] Updated weights for policy 1, policy_version 93430 (0.0007) +[2023-10-08 19:33:22,993][21194] Updated weights for policy 1, policy_version 93440 (0.0007) +[2023-10-08 19:33:23,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 192086016. Throughput: 0: 1723.5, 1: 1712.0. Samples: 48026430. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:23,803][19739] Avg episode reward: [(0, '1136.120'), (1, '734.690')] +[2023-10-08 19:33:24,527][21195] Updated weights for policy 0, policy_version 94150 (0.0007) +[2023-10-08 19:33:24,894][21195] Updated weights for policy 0, policy_version 94160 (0.0007) +[2023-10-08 19:33:25,255][21195] Updated weights for policy 0, policy_version 94170 (0.0008) +[2023-10-08 19:33:26,920][21194] Updated weights for policy 1, policy_version 93450 (0.0010) +[2023-10-08 19:33:27,294][21194] Updated weights for policy 1, policy_version 93460 (0.0012) +[2023-10-08 19:33:27,663][21194] Updated weights for policy 1, policy_version 93470 (0.0007) +[2023-10-08 19:33:28,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 192151552. Throughput: 0: 1742.7, 1: 1692.4. Samples: 48047036. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:28,804][19739] Avg episode reward: [(0, '1136.120'), (1, '734.690')] +[2023-10-08 19:33:29,239][21195] Updated weights for policy 0, policy_version 94180 (0.0008) +[2023-10-08 19:33:29,601][21195] Updated weights for policy 0, policy_version 94190 (0.0009) +[2023-10-08 19:33:29,965][21195] Updated weights for policy 0, policy_version 94200 (0.0010) +[2023-10-08 19:33:31,770][21194] Updated weights for policy 1, policy_version 93480 (0.0010) +[2023-10-08 19:33:32,137][21194] Updated weights for policy 1, policy_version 93490 (0.0010) +[2023-10-08 19:33:32,501][21194] Updated weights for policy 1, policy_version 93500 (0.0009) +[2023-10-08 19:33:33,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 192217088. Throughput: 0: 1756.8, 1: 1729.6. Samples: 48063716. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:33,803][19739] Avg episode reward: [(0, '1136.120'), (1, '743.640')] +[2023-10-08 19:33:33,992][21195] Updated weights for policy 0, policy_version 94210 (0.0011) +[2023-10-08 19:33:34,360][21195] Updated weights for policy 0, policy_version 94220 (0.0007) +[2023-10-08 19:33:34,731][21195] Updated weights for policy 0, policy_version 94230 (0.0007) +[2023-10-08 19:33:35,107][21195] Updated weights for policy 0, policy_version 94240 (0.0007) +[2023-10-08 19:33:36,524][21194] Updated weights for policy 1, policy_version 93510 (0.0008) +[2023-10-08 19:33:36,891][21194] Updated weights for policy 1, policy_version 93520 (0.0007) +[2023-10-08 19:33:37,258][21194] Updated weights for policy 1, policy_version 93530 (0.0007) +[2023-10-08 19:33:38,802][19739] Fps is (10 sec: 13107.5, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 192282624. Throughput: 0: 1730.1, 1: 1715.2. Samples: 48078164. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:38,803][19739] Avg episode reward: [(0, '1136.120'), (1, '730.770')] +[2023-10-08 19:33:39,047][21195] Updated weights for policy 0, policy_version 94250 (0.0007) +[2023-10-08 19:33:39,419][21195] Updated weights for policy 0, policy_version 94260 (0.0009) +[2023-10-08 19:33:39,786][21195] Updated weights for policy 0, policy_version 94270 (0.0010) +[2023-10-08 19:33:41,166][21194] Updated weights for policy 1, policy_version 93540 (0.0007) +[2023-10-08 19:33:41,543][21194] Updated weights for policy 1, policy_version 93550 (0.0009) +[2023-10-08 19:33:41,912][21194] Updated weights for policy 1, policy_version 93560 (0.0008) +[2023-10-08 19:33:43,716][21195] Updated weights for policy 0, policy_version 94280 (0.0008) +[2023-10-08 19:33:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 192348160. Throughput: 0: 1749.1, 1: 1702.0. Samples: 48099070. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:43,803][19739] Avg episode reward: [(0, '1136.120'), (1, '725.690')] +[2023-10-08 19:33:44,081][21195] Updated weights for policy 0, policy_version 94290 (0.0009) +[2023-10-08 19:33:44,447][21195] Updated weights for policy 0, policy_version 94300 (0.0011) +[2023-10-08 19:33:45,799][21194] Updated weights for policy 1, policy_version 93570 (0.0009) +[2023-10-08 19:33:46,163][21194] Updated weights for policy 1, policy_version 93580 (0.0009) +[2023-10-08 19:33:46,529][21194] Updated weights for policy 1, policy_version 93590 (0.0009) +[2023-10-08 19:33:46,907][21194] Updated weights for policy 1, policy_version 93600 (0.0008) +[2023-10-08 19:33:48,291][21195] Updated weights for policy 0, policy_version 94310 (0.0010) +[2023-10-08 19:33:48,661][21195] Updated weights for policy 0, policy_version 94320 (0.0010) +[2023-10-08 19:33:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 192413696. Throughput: 0: 1731.8, 1: 1726.5. Samples: 48114694. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:48,803][19739] Avg episode reward: [(0, '1136.120'), (1, '715.030')] +[2023-10-08 19:33:49,026][21195] Updated weights for policy 0, policy_version 94330 (0.0009) +[2023-10-08 19:33:50,977][21194] Updated weights for policy 1, policy_version 93610 (0.0009) +[2023-10-08 19:33:51,347][21194] Updated weights for policy 1, policy_version 93620 (0.0007) +[2023-10-08 19:33:51,714][21194] Updated weights for policy 1, policy_version 93630 (0.0007) +[2023-10-08 19:33:52,893][21195] Updated weights for policy 0, policy_version 94340 (0.0009) +[2023-10-08 19:33:53,263][21195] Updated weights for policy 0, policy_version 94350 (0.0008) +[2023-10-08 19:33:53,623][21195] Updated weights for policy 0, policy_version 94360 (0.0008) +[2023-10-08 19:33:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 192479232. Throughput: 0: 1749.6, 1: 1705.7. Samples: 48129910. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:53,803][19739] Avg episode reward: [(0, '1136.120'), (1, '715.030')] +[2023-10-08 19:33:55,687][21194] Updated weights for policy 1, policy_version 93640 (0.0010) +[2023-10-08 19:33:56,065][21194] Updated weights for policy 1, policy_version 93650 (0.0010) +[2023-10-08 19:33:56,427][21194] Updated weights for policy 1, policy_version 93660 (0.0008) +[2023-10-08 19:33:57,689][21195] Updated weights for policy 0, policy_version 94370 (0.0009) +[2023-10-08 19:33:58,082][21195] Updated weights for policy 0, policy_version 94380 (0.0010) +[2023-10-08 19:33:58,455][21195] Updated weights for policy 0, policy_version 94390 (0.0007) +[2023-10-08 19:33:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 192544768. Throughput: 0: 1745.6, 1: 1726.6. Samples: 48151426. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:33:58,803][19739] Avg episode reward: [(0, '1136.120'), (1, '701.040')] +[2023-10-08 19:33:58,824][21195] Updated weights for policy 0, policy_version 94400 (0.0008) +[2023-10-08 19:34:00,191][21194] Updated weights for policy 1, policy_version 93670 (0.0008) +[2023-10-08 19:34:00,556][21194] Updated weights for policy 1, policy_version 93680 (0.0009) +[2023-10-08 19:34:00,920][21194] Updated weights for policy 1, policy_version 93690 (0.0009) +[2023-10-08 19:34:02,681][21195] Updated weights for policy 0, policy_version 94410 (0.0007) +[2023-10-08 19:34:03,046][21195] Updated weights for policy 0, policy_version 94420 (0.0008) +[2023-10-08 19:34:03,424][21195] Updated weights for policy 0, policy_version 94430 (0.0007) +[2023-10-08 19:34:03,802][19739] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 192643072. Throughput: 0: 1720.9, 1: 1714.8. Samples: 48165916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:03,803][19739] Avg episode reward: [(0, '1136.120'), (1, '701.040')] +[2023-10-08 19:34:04,885][21194] Updated weights for policy 1, policy_version 93700 (0.0008) +[2023-10-08 19:34:05,259][21194] Updated weights for policy 1, policy_version 93710 (0.0010) +[2023-10-08 19:34:05,618][21194] Updated weights for policy 1, policy_version 93720 (0.0008) +[2023-10-08 19:34:07,281][21195] Updated weights for policy 0, policy_version 94440 (0.0008) +[2023-10-08 19:34:07,653][21195] Updated weights for policy 0, policy_version 94450 (0.0008) +[2023-10-08 19:34:08,023][21195] Updated weights for policy 0, policy_version 94460 (0.0008) +[2023-10-08 19:34:08,803][19739] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 192708608. Throughput: 0: 1752.6, 1: 1718.5. Samples: 48182630. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:08,804][19739] Avg episode reward: [(0, '1136.120'), (1, '701.040')] +[2023-10-08 19:34:09,297][21194] Updated weights for policy 1, policy_version 93730 (0.0008) +[2023-10-08 19:34:09,668][21194] Updated weights for policy 1, policy_version 93740 (0.0008) +[2023-10-08 19:34:10,043][21194] Updated weights for policy 1, policy_version 93750 (0.0009) +[2023-10-08 19:34:10,418][21194] Updated weights for policy 1, policy_version 93760 (0.0009) +[2023-10-08 19:34:11,898][21195] Updated weights for policy 0, policy_version 94470 (0.0009) +[2023-10-08 19:34:12,264][21195] Updated weights for policy 0, policy_version 94480 (0.0009) +[2023-10-08 19:34:12,632][21195] Updated weights for policy 0, policy_version 94490 (0.0007) +[2023-10-08 19:34:13,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 192774144. Throughput: 0: 1723.2, 1: 1745.1. Samples: 48203108. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:13,804][19739] Avg episode reward: [(0, '1136.120'), (1, '701.040')] +[2023-10-08 19:34:14,448][21194] Updated weights for policy 1, policy_version 93770 (0.0007) +[2023-10-08 19:34:14,812][21194] Updated weights for policy 1, policy_version 93780 (0.0007) +[2023-10-08 19:34:15,176][21194] Updated weights for policy 1, policy_version 93790 (0.0008) +[2023-10-08 19:34:16,501][21195] Updated weights for policy 0, policy_version 94500 (0.0009) +[2023-10-08 19:34:16,867][21195] Updated weights for policy 0, policy_version 94510 (0.0010) +[2023-10-08 19:34:17,234][21195] Updated weights for policy 0, policy_version 94520 (0.0010) +[2023-10-08 19:34:18,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 192839680. Throughput: 0: 1717.5, 1: 1714.4. Samples: 48218154. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:18,804][19739] Avg episode reward: [(0, '1151.620'), (1, '701.040')] +[2023-10-08 19:34:18,892][21194] Updated weights for policy 1, policy_version 93800 (0.0008) +[2023-10-08 19:34:19,261][21194] Updated weights for policy 1, policy_version 93810 (0.0008) +[2023-10-08 19:34:19,631][21194] Updated weights for policy 1, policy_version 93820 (0.0007) +[2023-10-08 19:34:21,332][21195] Updated weights for policy 0, policy_version 94530 (0.0010) +[2023-10-08 19:34:21,697][21195] Updated weights for policy 0, policy_version 94540 (0.0007) +[2023-10-08 19:34:22,071][21195] Updated weights for policy 0, policy_version 94550 (0.0010) +[2023-10-08 19:34:22,436][21195] Updated weights for policy 0, policy_version 94560 (0.0010) +[2023-10-08 19:34:23,547][21194] Updated weights for policy 1, policy_version 93830 (0.0010) +[2023-10-08 19:34:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 192905216. Throughput: 0: 1734.4, 1: 1738.5. Samples: 48234448. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:23,804][19739] Avg episode reward: [(0, '1167.260'), (1, '701.040')] +[2023-10-08 19:34:23,909][21194] Updated weights for policy 1, policy_version 93840 (0.0009) +[2023-10-08 19:34:24,278][21194] Updated weights for policy 1, policy_version 93850 (0.0010) +[2023-10-08 19:34:26,359][21195] Updated weights for policy 0, policy_version 94570 (0.0008) +[2023-10-08 19:34:26,730][21195] Updated weights for policy 0, policy_version 94580 (0.0008) +[2023-10-08 19:34:27,107][21195] Updated weights for policy 0, policy_version 94590 (0.0008) +[2023-10-08 19:34:28,216][21194] Updated weights for policy 1, policy_version 93860 (0.0009) +[2023-10-08 19:34:28,578][21194] Updated weights for policy 1, policy_version 93870 (0.0009) +[2023-10-08 19:34:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13884.7). Total num frames: 192970752. Throughput: 0: 1720.4, 1: 1754.0. Samples: 48255414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:28,803][19739] Avg episode reward: [(0, '1167.260'), (1, '701.040')] +[2023-10-08 19:34:28,940][21194] Updated weights for policy 1, policy_version 93880 (0.0009) +[2023-10-08 19:34:30,793][21195] Updated weights for policy 0, policy_version 94600 (0.0008) +[2023-10-08 19:34:31,163][21195] Updated weights for policy 0, policy_version 94610 (0.0008) +[2023-10-08 19:34:31,539][21195] Updated weights for policy 0, policy_version 94620 (0.0008) +[2023-10-08 19:34:32,894][21194] Updated weights for policy 1, policy_version 93890 (0.0007) +[2023-10-08 19:34:33,260][21194] Updated weights for policy 1, policy_version 93900 (0.0008) +[2023-10-08 19:34:33,617][21194] Updated weights for policy 1, policy_version 93910 (0.0007) +[2023-10-08 19:34:33,802][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 193036288. Throughput: 0: 1738.3, 1: 1730.0. Samples: 48270768. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:33,803][19739] Avg episode reward: [(0, '1182.810'), (1, '699.800')] +[2023-10-08 19:34:33,804][20740] Saving new best policy, reward=1182.810! +[2023-10-08 19:34:33,985][21194] Updated weights for policy 1, policy_version 93920 (0.0007) +[2023-10-08 19:34:35,488][21195] Updated weights for policy 0, policy_version 94630 (0.0008) +[2023-10-08 19:34:35,857][21195] Updated weights for policy 0, policy_version 94640 (0.0010) +[2023-10-08 19:34:36,225][21195] Updated weights for policy 0, policy_version 94650 (0.0007) +[2023-10-08 19:34:37,880][21194] Updated weights for policy 1, policy_version 93930 (0.0008) +[2023-10-08 19:34:38,242][21194] Updated weights for policy 1, policy_version 93940 (0.0007) +[2023-10-08 19:34:38,613][21194] Updated weights for policy 1, policy_version 93950 (0.0007) +[2023-10-08 19:34:38,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 193134592. Throughput: 0: 1718.2, 1: 1753.4. Samples: 48286132. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:38,803][19739] Avg episode reward: [(0, '1182.810'), (1, '669.840')] +[2023-10-08 19:34:40,175][21195] Updated weights for policy 0, policy_version 94660 (0.0008) +[2023-10-08 19:34:40,551][21195] Updated weights for policy 0, policy_version 94670 (0.0008) +[2023-10-08 19:34:40,919][21195] Updated weights for policy 0, policy_version 94680 (0.0010) +[2023-10-08 19:34:42,601][21194] Updated weights for policy 1, policy_version 93960 (0.0008) +[2023-10-08 19:34:42,969][21194] Updated weights for policy 1, policy_version 93970 (0.0009) +[2023-10-08 19:34:43,334][21194] Updated weights for policy 1, policy_version 93980 (0.0008) +[2023-10-08 19:34:43,802][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 193200128. Throughput: 0: 1731.2, 1: 1729.1. Samples: 48307140. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:43,803][19739] Avg episode reward: [(0, '1182.820'), (1, '669.140')] +[2023-10-08 19:34:43,811][20740] Saving new best policy, reward=1182.820! +[2023-10-08 19:34:44,644][21195] Updated weights for policy 0, policy_version 94690 (0.0010) +[2023-10-08 19:34:45,059][21195] Updated weights for policy 0, policy_version 94700 (0.0008) +[2023-10-08 19:34:45,427][21195] Updated weights for policy 0, policy_version 94710 (0.0008) +[2023-10-08 19:34:45,797][21195] Updated weights for policy 0, policy_version 94720 (0.0008) +[2023-10-08 19:34:47,260][21194] Updated weights for policy 1, policy_version 93990 (0.0008) +[2023-10-08 19:34:47,616][21194] Updated weights for policy 1, policy_version 94000 (0.0008) +[2023-10-08 19:34:47,975][21194] Updated weights for policy 1, policy_version 94010 (0.0009) +[2023-10-08 19:34:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 193265664. Throughput: 0: 1757.1, 1: 1743.0. Samples: 48323420. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:48,803][19739] Avg episode reward: [(0, '1182.820'), (1, '669.140')] +[2023-10-08 19:34:49,732][21195] Updated weights for policy 0, policy_version 94730 (0.0010) +[2023-10-08 19:34:50,098][21195] Updated weights for policy 0, policy_version 94740 (0.0010) +[2023-10-08 19:34:50,477][21195] Updated weights for policy 0, policy_version 94750 (0.0010) +[2023-10-08 19:34:51,881][21194] Updated weights for policy 1, policy_version 94020 (0.0008) +[2023-10-08 19:34:52,257][21194] Updated weights for policy 1, policy_version 94030 (0.0009) +[2023-10-08 19:34:52,625][21194] Updated weights for policy 1, policy_version 94040 (0.0008) +[2023-10-08 19:34:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 193331200. Throughput: 0: 1722.2, 1: 1741.2. Samples: 48338480. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:53,803][19739] Avg episode reward: [(0, '1182.820'), (1, '683.680')] +[2023-10-08 19:34:54,332][21195] Updated weights for policy 0, policy_version 94760 (0.0008) +[2023-10-08 19:34:54,704][21195] Updated weights for policy 0, policy_version 94770 (0.0007) +[2023-10-08 19:34:55,080][21195] Updated weights for policy 0, policy_version 94780 (0.0007) +[2023-10-08 19:34:56,587][21194] Updated weights for policy 1, policy_version 94050 (0.0008) +[2023-10-08 19:34:56,961][21194] Updated weights for policy 1, policy_version 94060 (0.0008) +[2023-10-08 19:34:57,323][21194] Updated weights for policy 1, policy_version 94070 (0.0008) +[2023-10-08 19:34:57,677][21194] Updated weights for policy 1, policy_version 94080 (0.0009) +[2023-10-08 19:34:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 193396736. Throughput: 0: 1752.9, 1: 1707.7. Samples: 48358830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:34:58,803][19739] Avg episode reward: [(0, '1182.820'), (1, '683.680')] +[2023-10-08 19:34:59,097][21195] Updated weights for policy 0, policy_version 94790 (0.0008) +[2023-10-08 19:34:59,456][21195] Updated weights for policy 0, policy_version 94800 (0.0007) +[2023-10-08 19:34:59,823][21195] Updated weights for policy 0, policy_version 94810 (0.0010) +[2023-10-08 19:35:01,663][21194] Updated weights for policy 1, policy_version 94090 (0.0008) +[2023-10-08 19:35:02,031][21194] Updated weights for policy 1, policy_version 94100 (0.0010) +[2023-10-08 19:35:02,401][21194] Updated weights for policy 1, policy_version 94110 (0.0007) +[2023-10-08 19:35:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 193462272. Throughput: 0: 1754.9, 1: 1738.1. Samples: 48375340. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:35:03,803][19739] Avg episode reward: [(0, '1182.820'), (1, '679.840')] +[2023-10-08 19:35:03,804][21195] Updated weights for policy 0, policy_version 94820 (0.0011) +[2023-10-08 19:35:04,169][21195] Updated weights for policy 0, policy_version 94830 (0.0007) +[2023-10-08 19:35:04,540][21195] Updated weights for policy 0, policy_version 94840 (0.0007) +[2023-10-08 19:35:06,200][21194] Updated weights for policy 1, policy_version 94120 (0.0009) +[2023-10-08 19:35:06,563][21194] Updated weights for policy 1, policy_version 94130 (0.0009) +[2023-10-08 19:35:06,928][21194] Updated weights for policy 1, policy_version 94140 (0.0010) +[2023-10-08 19:35:08,272][21195] Updated weights for policy 0, policy_version 94850 (0.0008) +[2023-10-08 19:35:08,646][21195] Updated weights for policy 0, policy_version 94860 (0.0011) +[2023-10-08 19:35:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 193527808. Throughput: 0: 1741.3, 1: 1714.5. Samples: 48389962. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:35:08,803][19739] Avg episode reward: [(0, '1183.050'), (1, '679.840')] +[2023-10-08 19:35:09,011][21195] Updated weights for policy 0, policy_version 94870 (0.0010) +[2023-10-08 19:35:09,378][20740] Saving new best policy, reward=1183.050! +[2023-10-08 19:35:09,381][21195] Updated weights for policy 0, policy_version 94880 (0.0011) +[2023-10-08 19:35:10,917][21194] Updated weights for policy 1, policy_version 94150 (0.0010) +[2023-10-08 19:35:11,293][21194] Updated weights for policy 1, policy_version 94160 (0.0011) +[2023-10-08 19:35:11,664][21194] Updated weights for policy 1, policy_version 94170 (0.0008) +[2023-10-08 19:35:13,062][21195] Updated weights for policy 0, policy_version 94890 (0.0009) +[2023-10-08 19:35:13,436][21195] Updated weights for policy 0, policy_version 94900 (0.0008) +[2023-10-08 19:35:13,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 193593344. Throughput: 0: 1757.9, 1: 1703.3. Samples: 48411166. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:35:13,804][19739] Avg episode reward: [(0, '1183.050'), (1, '687.360')] +[2023-10-08 19:35:13,813][21195] Updated weights for policy 0, policy_version 94910 (0.0008) +[2023-10-08 19:35:13,816][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000094176_96436224.pth... +[2023-10-08 19:35:13,853][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000092576_94797824.pth +[2023-10-08 19:35:13,882][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000094912_97189888.pth... +[2023-10-08 19:35:13,911][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000093280_95518720.pth +[2023-10-08 19:35:15,674][21194] Updated weights for policy 1, policy_version 94180 (0.0009) +[2023-10-08 19:35:16,040][21194] Updated weights for policy 1, policy_version 94190 (0.0009) +[2023-10-08 19:35:16,404][21194] Updated weights for policy 1, policy_version 94200 (0.0008) +[2023-10-08 19:35:17,812][21195] Updated weights for policy 0, policy_version 94920 (0.0009) +[2023-10-08 19:35:18,188][21195] Updated weights for policy 0, policy_version 94930 (0.0008) +[2023-10-08 19:35:18,561][21195] Updated weights for policy 0, policy_version 94940 (0.0010) +[2023-10-08 19:35:18,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 193691648. Throughput: 0: 1730.5, 1: 1720.4. Samples: 48426060. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:18,803][19739] Avg episode reward: [(0, '1184.670'), (1, '687.360')] +[2023-10-08 19:35:18,804][20740] Saving new best policy, reward=1184.670! +[2023-10-08 19:35:20,415][21194] Updated weights for policy 1, policy_version 94210 (0.0008) +[2023-10-08 19:35:20,782][21194] Updated weights for policy 1, policy_version 94220 (0.0010) +[2023-10-08 19:35:21,154][21194] Updated weights for policy 1, policy_version 94230 (0.0010) +[2023-10-08 19:35:21,524][21194] Updated weights for policy 1, policy_version 94240 (0.0008) +[2023-10-08 19:35:22,446][21195] Updated weights for policy 0, policy_version 94950 (0.0008) +[2023-10-08 19:35:22,819][21195] Updated weights for policy 0, policy_version 94960 (0.0011) +[2023-10-08 19:35:23,198][21195] Updated weights for policy 0, policy_version 94970 (0.0011) +[2023-10-08 19:35:23,803][19739] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 193757184. Throughput: 0: 1764.1, 1: 1702.3. Samples: 48442120. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:23,803][19739] Avg episode reward: [(0, '1184.670'), (1, '687.360')] +[2023-10-08 19:35:25,373][21194] Updated weights for policy 1, policy_version 94250 (0.0009) +[2023-10-08 19:35:25,743][21194] Updated weights for policy 1, policy_version 94260 (0.0009) +[2023-10-08 19:35:26,107][21194] Updated weights for policy 1, policy_version 94270 (0.0009) +[2023-10-08 19:35:27,064][21195] Updated weights for policy 0, policy_version 94980 (0.0008) +[2023-10-08 19:35:27,426][21195] Updated weights for policy 0, policy_version 94990 (0.0008) +[2023-10-08 19:35:27,787][21195] Updated weights for policy 0, policy_version 95000 (0.0008) +[2023-10-08 19:35:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 193822720. Throughput: 0: 1736.5, 1: 1724.7. Samples: 48462894. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:28,803][19739] Avg episode reward: [(0, '1184.660'), (1, '702.580')] +[2023-10-08 19:35:30,138][21194] Updated weights for policy 1, policy_version 94280 (0.0008) +[2023-10-08 19:35:30,502][21194] Updated weights for policy 1, policy_version 94290 (0.0009) +[2023-10-08 19:35:30,868][21194] Updated weights for policy 1, policy_version 94300 (0.0008) +[2023-10-08 19:35:31,700][21195] Updated weights for policy 0, policy_version 95010 (0.0008) +[2023-10-08 19:35:32,099][21195] Updated weights for policy 0, policy_version 95020 (0.0009) +[2023-10-08 19:35:32,469][21195] Updated weights for policy 0, policy_version 95030 (0.0010) +[2023-10-08 19:35:32,842][21195] Updated weights for policy 0, policy_version 95040 (0.0009) +[2023-10-08 19:35:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 193888256. Throughput: 0: 1729.5, 1: 1704.7. Samples: 48477956. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:33,803][19739] Avg episode reward: [(0, '1184.660'), (1, '717.360')] +[2023-10-08 19:35:34,842][21194] Updated weights for policy 1, policy_version 94310 (0.0007) +[2023-10-08 19:35:35,210][21194] Updated weights for policy 1, policy_version 94320 (0.0011) +[2023-10-08 19:35:35,570][21194] Updated weights for policy 1, policy_version 94330 (0.0008) +[2023-10-08 19:35:36,614][21195] Updated weights for policy 0, policy_version 95050 (0.0009) +[2023-10-08 19:35:36,981][21195] Updated weights for policy 0, policy_version 95060 (0.0009) +[2023-10-08 19:35:37,364][21195] Updated weights for policy 0, policy_version 95070 (0.0009) +[2023-10-08 19:35:38,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 193953792. Throughput: 0: 1750.8, 1: 1706.2. Samples: 48494046. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:38,803][19739] Avg episode reward: [(0, '1184.660'), (1, '717.360')] +[2023-10-08 19:35:39,660][21194] Updated weights for policy 1, policy_version 94340 (0.0009) +[2023-10-08 19:35:40,040][21194] Updated weights for policy 1, policy_version 94350 (0.0009) +[2023-10-08 19:35:40,397][21194] Updated weights for policy 1, policy_version 94360 (0.0011) +[2023-10-08 19:35:41,252][21195] Updated weights for policy 0, policy_version 95080 (0.0009) +[2023-10-08 19:35:41,623][21195] Updated weights for policy 0, policy_version 95090 (0.0008) +[2023-10-08 19:35:41,994][21195] Updated weights for policy 0, policy_version 95100 (0.0009) +[2023-10-08 19:35:43,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 194019328. Throughput: 0: 1730.6, 1: 1737.6. Samples: 48514902. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:43,803][19739] Avg episode reward: [(0, '1184.660'), (1, '717.360')] +[2023-10-08 19:35:44,321][21194] Updated weights for policy 1, policy_version 94370 (0.0009) +[2023-10-08 19:35:44,691][21194] Updated weights for policy 1, policy_version 94380 (0.0007) +[2023-10-08 19:35:45,050][21194] Updated weights for policy 1, policy_version 94390 (0.0009) +[2023-10-08 19:35:45,413][21194] Updated weights for policy 1, policy_version 94400 (0.0011) +[2023-10-08 19:35:46,002][21195] Updated weights for policy 0, policy_version 95110 (0.0010) +[2023-10-08 19:35:46,374][21195] Updated weights for policy 0, policy_version 95120 (0.0008) +[2023-10-08 19:35:46,740][21195] Updated weights for policy 0, policy_version 95130 (0.0010) +[2023-10-08 19:35:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 194084864. Throughput: 0: 1734.3, 1: 1709.2. Samples: 48530296. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:48,803][19739] Avg episode reward: [(0, '1184.660'), (1, '717.360')] +[2023-10-08 19:35:49,433][21194] Updated weights for policy 1, policy_version 94410 (0.0007) +[2023-10-08 19:35:49,792][21194] Updated weights for policy 1, policy_version 94420 (0.0009) +[2023-10-08 19:35:50,171][21194] Updated weights for policy 1, policy_version 94430 (0.0010) +[2023-10-08 19:35:50,718][21195] Updated weights for policy 0, policy_version 95140 (0.0009) +[2023-10-08 19:35:51,086][21195] Updated weights for policy 0, policy_version 95150 (0.0008) +[2023-10-08 19:35:51,449][21195] Updated weights for policy 0, policy_version 95160 (0.0007) +[2023-10-08 19:35:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 194150400. Throughput: 0: 1731.4, 1: 1733.1. Samples: 48545862. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:53,803][19739] Avg episode reward: [(0, '1184.740'), (1, '717.360')] +[2023-10-08 19:35:53,804][20740] Saving new best policy, reward=1184.740! +[2023-10-08 19:35:54,042][21194] Updated weights for policy 1, policy_version 94440 (0.0007) +[2023-10-08 19:35:54,418][21194] Updated weights for policy 1, policy_version 94450 (0.0007) +[2023-10-08 19:35:54,776][21194] Updated weights for policy 1, policy_version 94460 (0.0008) +[2023-10-08 19:35:55,261][21195] Updated weights for policy 0, policy_version 95170 (0.0010) +[2023-10-08 19:35:55,630][21195] Updated weights for policy 0, policy_version 95180 (0.0008) +[2023-10-08 19:35:55,998][21195] Updated weights for policy 0, policy_version 95190 (0.0009) +[2023-10-08 19:35:56,369][21195] Updated weights for policy 0, policy_version 95200 (0.0009) +[2023-10-08 19:35:58,621][21194] Updated weights for policy 1, policy_version 94470 (0.0010) +[2023-10-08 19:35:58,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 194215936. Throughput: 0: 1732.4, 1: 1742.2. Samples: 48567524. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:35:58,803][19739] Avg episode reward: [(0, '1184.740'), (1, '717.360')] +[2023-10-08 19:35:58,984][21194] Updated weights for policy 1, policy_version 94480 (0.0008) +[2023-10-08 19:35:59,353][21194] Updated weights for policy 1, policy_version 94490 (0.0007) +[2023-10-08 19:36:00,134][21195] Updated weights for policy 0, policy_version 95210 (0.0009) +[2023-10-08 19:36:00,518][21195] Updated weights for policy 0, policy_version 95220 (0.0009) +[2023-10-08 19:36:00,881][21195] Updated weights for policy 0, policy_version 95230 (0.0007) +[2023-10-08 19:36:03,331][21194] Updated weights for policy 1, policy_version 94500 (0.0009) +[2023-10-08 19:36:03,696][21194] Updated weights for policy 1, policy_version 94510 (0.0009) +[2023-10-08 19:36:03,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 194281472. Throughput: 0: 1765.1, 1: 1725.1. Samples: 48583122. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:36:03,804][19739] Avg episode reward: [(0, '1184.740'), (1, '717.360')] +[2023-10-08 19:36:04,064][21194] Updated weights for policy 1, policy_version 94520 (0.0008) +[2023-10-08 19:36:04,686][21195] Updated weights for policy 0, policy_version 95240 (0.0007) +[2023-10-08 19:36:05,060][21195] Updated weights for policy 0, policy_version 95250 (0.0010) +[2023-10-08 19:36:05,424][21195] Updated weights for policy 0, policy_version 95260 (0.0009) +[2023-10-08 19:36:08,028][21194] Updated weights for policy 1, policy_version 94530 (0.0008) +[2023-10-08 19:36:08,402][21194] Updated weights for policy 1, policy_version 94540 (0.0008) +[2023-10-08 19:36:08,758][21194] Updated weights for policy 1, policy_version 94550 (0.0011) +[2023-10-08 19:36:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 194347008. Throughput: 0: 1734.0, 1: 1740.8. Samples: 48598490. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:36:08,803][19739] Avg episode reward: [(0, '1184.740'), (1, '717.360')] +[2023-10-08 19:36:09,123][21194] Updated weights for policy 1, policy_version 94560 (0.0007) +[2023-10-08 19:36:09,435][21195] Updated weights for policy 0, policy_version 95270 (0.0008) +[2023-10-08 19:36:09,802][21195] Updated weights for policy 0, policy_version 95280 (0.0011) +[2023-10-08 19:36:10,174][21195] Updated weights for policy 0, policy_version 95290 (0.0007) +[2023-10-08 19:36:13,304][21194] Updated weights for policy 1, policy_version 94570 (0.0009) +[2023-10-08 19:36:13,670][21194] Updated weights for policy 1, policy_version 94580 (0.0011) +[2023-10-08 19:36:13,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 194412544. Throughput: 0: 1748.5, 1: 1732.5. Samples: 48619542. Policy #0 lag: (min: 13.0, avg: 13.1, max: 21.0) +[2023-10-08 19:36:13,803][19739] Avg episode reward: [(0, '1196.860'), (1, '717.620')] +[2023-10-08 19:36:13,811][20740] Saving new best policy, reward=1196.860! +[2023-10-08 19:36:14,040][21194] Updated weights for policy 1, policy_version 94590 (0.0009) +[2023-10-08 19:36:14,162][21195] Updated weights for policy 0, policy_version 95300 (0.0010) +[2023-10-08 19:36:14,531][21195] Updated weights for policy 0, policy_version 95310 (0.0011) +[2023-10-08 19:36:14,900][21195] Updated weights for policy 0, policy_version 95320 (0.0010) +[2023-10-08 19:36:17,945][21194] Updated weights for policy 1, policy_version 94600 (0.0008) +[2023-10-08 19:36:18,307][21194] Updated weights for policy 1, policy_version 94610 (0.0007) +[2023-10-08 19:36:18,680][21194] Updated weights for policy 1, policy_version 94620 (0.0009) +[2023-10-08 19:36:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 194478080. Throughput: 0: 1753.1, 1: 1736.3. Samples: 48634984. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:18,804][19739] Avg episode reward: [(0, '1197.010'), (1, '717.620')] +[2023-10-08 19:36:18,869][21195] Updated weights for policy 0, policy_version 95330 (0.0008) +[2023-10-08 19:36:19,234][21195] Updated weights for policy 0, policy_version 95340 (0.0008) +[2023-10-08 19:36:19,595][21195] Updated weights for policy 0, policy_version 95350 (0.0008) +[2023-10-08 19:36:19,963][20740] Saving new best policy, reward=1197.010! +[2023-10-08 19:36:19,968][21195] Updated weights for policy 0, policy_version 95360 (0.0009) +[2023-10-08 19:36:22,569][21194] Updated weights for policy 1, policy_version 94630 (0.0008) +[2023-10-08 19:36:22,929][21194] Updated weights for policy 1, policy_version 94640 (0.0011) +[2023-10-08 19:36:23,300][21194] Updated weights for policy 1, policy_version 94650 (0.0010) +[2023-10-08 19:36:23,790][21195] Updated weights for policy 0, policy_version 95370 (0.0009) +[2023-10-08 19:36:23,803][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 194576384. Throughput: 0: 1735.6, 1: 1739.4. Samples: 48650424. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:23,803][19739] Avg episode reward: [(0, '1197.130'), (1, '717.620')] +[2023-10-08 19:36:24,157][21195] Updated weights for policy 0, policy_version 95380 (0.0010) +[2023-10-08 19:36:24,525][21195] Updated weights for policy 0, policy_version 95390 (0.0007) +[2023-10-08 19:36:24,596][20740] Saving new best policy, reward=1197.130! +[2023-10-08 19:36:27,282][21194] Updated weights for policy 1, policy_version 94660 (0.0009) +[2023-10-08 19:36:27,648][21194] Updated weights for policy 1, policy_version 94670 (0.0009) +[2023-10-08 19:36:28,017][21194] Updated weights for policy 1, policy_version 94680 (0.0009) +[2023-10-08 19:36:28,472][21195] Updated weights for policy 0, policy_version 95400 (0.0008) +[2023-10-08 19:36:28,803][19739] Fps is (10 sec: 16384.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 194641920. Throughput: 0: 1754.4, 1: 1711.4. Samples: 48670862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:28,803][19739] Avg episode reward: [(0, '1197.470'), (1, '717.620')] +[2023-10-08 19:36:28,852][21195] Updated weights for policy 0, policy_version 95410 (0.0008) +[2023-10-08 19:36:29,213][21195] Updated weights for policy 0, policy_version 95420 (0.0010) +[2023-10-08 19:36:29,354][20740] Saving new best policy, reward=1197.470! +[2023-10-08 19:36:32,002][21194] Updated weights for policy 1, policy_version 94690 (0.0008) +[2023-10-08 19:36:32,365][21194] Updated weights for policy 1, policy_version 94700 (0.0007) +[2023-10-08 19:36:32,731][21194] Updated weights for policy 1, policy_version 94710 (0.0008) +[2023-10-08 19:36:33,088][21194] Updated weights for policy 1, policy_version 94720 (0.0008) +[2023-10-08 19:36:33,089][21195] Updated weights for policy 0, policy_version 95430 (0.0008) +[2023-10-08 19:36:33,461][21195] Updated weights for policy 0, policy_version 95440 (0.0009) +[2023-10-08 19:36:33,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 194707456. Throughput: 0: 1733.1, 1: 1733.6. Samples: 48686298. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:33,803][19739] Avg episode reward: [(0, '1197.470'), (1, '717.620')] +[2023-10-08 19:36:33,830][21195] Updated weights for policy 0, policy_version 95450 (0.0007) +[2023-10-08 19:36:36,961][21194] Updated weights for policy 1, policy_version 94730 (0.0009) +[2023-10-08 19:36:37,325][21194] Updated weights for policy 1, policy_version 94740 (0.0011) +[2023-10-08 19:36:37,691][21194] Updated weights for policy 1, policy_version 94750 (0.0009) +[2023-10-08 19:36:37,765][21195] Updated weights for policy 0, policy_version 95460 (0.0009) +[2023-10-08 19:36:38,130][21195] Updated weights for policy 0, policy_version 95470 (0.0008) +[2023-10-08 19:36:38,493][21195] Updated weights for policy 0, policy_version 95480 (0.0009) +[2023-10-08 19:36:38,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 194805760. Throughput: 0: 1752.5, 1: 1723.5. Samples: 48702282. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:38,804][19739] Avg episode reward: [(0, '1197.470'), (1, '717.620')] +[2023-10-08 19:36:41,738][21194] Updated weights for policy 1, policy_version 94760 (0.0009) +[2023-10-08 19:36:42,121][21194] Updated weights for policy 1, policy_version 94770 (0.0007) +[2023-10-08 19:36:42,314][21195] Updated weights for policy 0, policy_version 95490 (0.0007) +[2023-10-08 19:36:42,487][21194] Updated weights for policy 1, policy_version 94780 (0.0009) +[2023-10-08 19:36:42,684][21195] Updated weights for policy 0, policy_version 95500 (0.0007) +[2023-10-08 19:36:43,058][21195] Updated weights for policy 0, policy_version 95510 (0.0007) +[2023-10-08 19:36:43,424][21195] Updated weights for policy 0, policy_version 95520 (0.0007) +[2023-10-08 19:36:43,803][19739] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 194871296. Throughput: 0: 1738.0, 1: 1697.5. Samples: 48722120. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:43,803][19739] Avg episode reward: [(0, '1197.470'), (1, '717.620')] +[2023-10-08 19:36:46,503][21194] Updated weights for policy 1, policy_version 94790 (0.0007) +[2023-10-08 19:36:46,864][21194] Updated weights for policy 1, policy_version 94800 (0.0007) +[2023-10-08 19:36:47,238][21194] Updated weights for policy 1, policy_version 94810 (0.0008) +[2023-10-08 19:36:47,265][21195] Updated weights for policy 0, policy_version 95530 (0.0008) +[2023-10-08 19:36:47,624][21195] Updated weights for policy 0, policy_version 95540 (0.0009) +[2023-10-08 19:36:47,993][21195] Updated weights for policy 0, policy_version 95550 (0.0008) +[2023-10-08 19:36:48,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 194936832. Throughput: 0: 1715.8, 1: 1726.6. Samples: 48738030. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:48,803][19739] Avg episode reward: [(0, '1183.440'), (1, '717.620')] +[2023-10-08 19:36:51,223][21194] Updated weights for policy 1, policy_version 94820 (0.0008) +[2023-10-08 19:36:51,586][21194] Updated weights for policy 1, policy_version 94830 (0.0011) +[2023-10-08 19:36:51,949][21194] Updated weights for policy 1, policy_version 94840 (0.0010) +[2023-10-08 19:36:51,995][21195] Updated weights for policy 0, policy_version 95560 (0.0007) +[2023-10-08 19:36:52,355][21195] Updated weights for policy 0, policy_version 95570 (0.0007) +[2023-10-08 19:36:52,724][21195] Updated weights for policy 0, policy_version 95580 (0.0007) +[2023-10-08 19:36:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 195002368. Throughput: 0: 1746.4, 1: 1700.9. Samples: 48753620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:53,803][19739] Avg episode reward: [(0, '1183.440'), (1, '717.620')] +[2023-10-08 19:36:56,008][21194] Updated weights for policy 1, policy_version 94850 (0.0009) +[2023-10-08 19:36:56,378][21194] Updated weights for policy 1, policy_version 94860 (0.0009) +[2023-10-08 19:36:56,635][21195] Updated weights for policy 0, policy_version 95590 (0.0007) +[2023-10-08 19:36:56,734][21194] Updated weights for policy 1, policy_version 94870 (0.0009) +[2023-10-08 19:36:56,994][21195] Updated weights for policy 0, policy_version 95600 (0.0008) +[2023-10-08 19:36:57,094][21194] Updated weights for policy 1, policy_version 94880 (0.0008) +[2023-10-08 19:36:57,368][21195] Updated weights for policy 0, policy_version 95610 (0.0008) +[2023-10-08 19:36:58,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 195067904. Throughput: 0: 1727.7, 1: 1699.9. Samples: 48773786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:36:58,803][19739] Avg episode reward: [(0, '1183.440'), (1, '717.620')] +[2023-10-08 19:37:00,946][21194] Updated weights for policy 1, policy_version 94890 (0.0011) +[2023-10-08 19:37:01,297][21194] Updated weights for policy 1, policy_version 94900 (0.0010) +[2023-10-08 19:37:01,406][21195] Updated weights for policy 0, policy_version 95620 (0.0008) +[2023-10-08 19:37:01,668][21194] Updated weights for policy 1, policy_version 94910 (0.0008) +[2023-10-08 19:37:01,774][21195] Updated weights for policy 0, policy_version 95630 (0.0009) +[2023-10-08 19:37:02,140][21195] Updated weights for policy 0, policy_version 95640 (0.0009) +[2023-10-08 19:37:03,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 195133440. Throughput: 0: 1724.1, 1: 1716.0. Samples: 48789786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:03,803][19739] Avg episode reward: [(0, '1183.440'), (1, '715.200')] +[2023-10-08 19:37:05,553][21194] Updated weights for policy 1, policy_version 94920 (0.0009) +[2023-10-08 19:37:05,925][21194] Updated weights for policy 1, policy_version 94930 (0.0007) +[2023-10-08 19:37:06,043][21195] Updated weights for policy 0, policy_version 95650 (0.0008) +[2023-10-08 19:37:06,278][21194] Updated weights for policy 1, policy_version 94940 (0.0007) +[2023-10-08 19:37:06,429][21195] Updated weights for policy 0, policy_version 95660 (0.0009) +[2023-10-08 19:37:06,793][21195] Updated weights for policy 0, policy_version 95670 (0.0007) +[2023-10-08 19:37:07,161][21195] Updated weights for policy 0, policy_version 95680 (0.0008) +[2023-10-08 19:37:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 195198976. Throughput: 0: 1732.5, 1: 1702.4. Samples: 48804994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:08,803][19739] Avg episode reward: [(0, '1183.360'), (1, '699.960')] +[2023-10-08 19:37:10,301][21194] Updated weights for policy 1, policy_version 94950 (0.0010) +[2023-10-08 19:37:10,663][21194] Updated weights for policy 1, policy_version 94960 (0.0010) +[2023-10-08 19:37:10,917][21195] Updated weights for policy 0, policy_version 95690 (0.0009) +[2023-10-08 19:37:11,032][21194] Updated weights for policy 1, policy_version 94970 (0.0008) +[2023-10-08 19:37:11,284][21195] Updated weights for policy 0, policy_version 95700 (0.0007) +[2023-10-08 19:37:11,654][21195] Updated weights for policy 0, policy_version 95710 (0.0009) +[2023-10-08 19:37:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 195264512. Throughput: 0: 1725.2, 1: 1723.0. Samples: 48826030. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:13,803][19739] Avg episode reward: [(0, '1183.360'), (1, '699.960')] +[2023-10-08 19:37:13,809][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000094976_97255424.pth... +[2023-10-08 19:37:13,809][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000095712_98009088.pth... +[2023-10-08 19:37:13,844][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000094080_96337920.pth +[2023-10-08 19:37:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000093376_95617024.pth +[2023-10-08 19:37:15,115][21194] Updated weights for policy 1, policy_version 94980 (0.0007) +[2023-10-08 19:37:15,475][21194] Updated weights for policy 1, policy_version 94990 (0.0007) +[2023-10-08 19:37:15,563][21195] Updated weights for policy 0, policy_version 95720 (0.0008) +[2023-10-08 19:37:15,840][21194] Updated weights for policy 1, policy_version 95000 (0.0009) +[2023-10-08 19:37:15,929][21195] Updated weights for policy 0, policy_version 95730 (0.0008) +[2023-10-08 19:37:16,306][21195] Updated weights for policy 0, policy_version 95740 (0.0010) +[2023-10-08 19:37:18,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 195330048. Throughput: 0: 1747.2, 1: 1703.3. Samples: 48841572. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:18,803][19739] Avg episode reward: [(0, '1183.360'), (1, '699.960')] +[2023-10-08 19:37:19,820][21194] Updated weights for policy 1, policy_version 95010 (0.0009) +[2023-10-08 19:37:20,195][21194] Updated weights for policy 1, policy_version 95020 (0.0008) +[2023-10-08 19:37:20,303][21195] Updated weights for policy 0, policy_version 95750 (0.0009) +[2023-10-08 19:37:20,547][21194] Updated weights for policy 1, policy_version 95030 (0.0009) +[2023-10-08 19:37:20,664][21195] Updated weights for policy 0, policy_version 95760 (0.0008) +[2023-10-08 19:37:20,919][21194] Updated weights for policy 1, policy_version 95040 (0.0008) +[2023-10-08 19:37:21,043][21195] Updated weights for policy 0, policy_version 95770 (0.0009) +[2023-10-08 19:37:23,803][19739] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 195395584. Throughput: 0: 1724.2, 1: 1708.0. Samples: 48856730. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:23,804][19739] Avg episode reward: [(0, '1183.360'), (1, '699.960')] +[2023-10-08 19:37:24,744][21194] Updated weights for policy 1, policy_version 95050 (0.0007) +[2023-10-08 19:37:24,937][21195] Updated weights for policy 0, policy_version 95780 (0.0008) +[2023-10-08 19:37:25,107][21194] Updated weights for policy 1, policy_version 95060 (0.0007) +[2023-10-08 19:37:25,297][21195] Updated weights for policy 0, policy_version 95790 (0.0009) +[2023-10-08 19:37:25,477][21194] Updated weights for policy 1, policy_version 95070 (0.0008) +[2023-10-08 19:37:25,658][21195] Updated weights for policy 0, policy_version 95800 (0.0009) +[2023-10-08 19:37:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 195461120. Throughput: 0: 1738.8, 1: 1730.4. Samples: 48878236. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:28,803][19739] Avg episode reward: [(0, '1183.360'), (1, '700.160')] +[2023-10-08 19:37:29,471][21194] Updated weights for policy 1, policy_version 95080 (0.0010) +[2023-10-08 19:37:29,612][21195] Updated weights for policy 0, policy_version 95810 (0.0008) +[2023-10-08 19:37:29,846][21194] Updated weights for policy 1, policy_version 95090 (0.0010) +[2023-10-08 19:37:29,977][21195] Updated weights for policy 0, policy_version 95820 (0.0007) +[2023-10-08 19:37:30,195][21194] Updated weights for policy 1, policy_version 95100 (0.0007) +[2023-10-08 19:37:30,337][21195] Updated weights for policy 0, policy_version 95830 (0.0009) +[2023-10-08 19:37:30,709][21195] Updated weights for policy 0, policy_version 95840 (0.0009) +[2023-10-08 19:37:33,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 195526656. Throughput: 0: 1753.2, 1: 1697.7. Samples: 48893322. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:33,804][19739] Avg episode reward: [(0, '1183.240'), (1, '700.160')] +[2023-10-08 19:37:34,010][21194] Updated weights for policy 1, policy_version 95110 (0.0008) +[2023-10-08 19:37:34,378][21194] Updated weights for policy 1, policy_version 95120 (0.0009) +[2023-10-08 19:37:34,683][21195] Updated weights for policy 0, policy_version 95850 (0.0008) +[2023-10-08 19:37:34,750][21194] Updated weights for policy 1, policy_version 95130 (0.0007) +[2023-10-08 19:37:35,057][21195] Updated weights for policy 0, policy_version 95860 (0.0009) +[2023-10-08 19:37:35,417][21195] Updated weights for policy 0, policy_version 95870 (0.0009) +[2023-10-08 19:37:38,651][21194] Updated weights for policy 1, policy_version 95140 (0.0007) +[2023-10-08 19:37:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 195592192. Throughput: 0: 1719.6, 1: 1725.6. Samples: 48908656. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:38,803][19739] Avg episode reward: [(0, '1183.240'), (1, '714.530')] +[2023-10-08 19:37:39,014][21194] Updated weights for policy 1, policy_version 95150 (0.0007) +[2023-10-08 19:37:39,302][21195] Updated weights for policy 0, policy_version 95880 (0.0009) +[2023-10-08 19:37:39,371][21194] Updated weights for policy 1, policy_version 95160 (0.0008) +[2023-10-08 19:37:39,664][21195] Updated weights for policy 0, policy_version 95890 (0.0009) +[2023-10-08 19:37:40,036][21195] Updated weights for policy 0, policy_version 95900 (0.0007) +[2023-10-08 19:37:43,447][21194] Updated weights for policy 1, policy_version 95170 (0.0010) +[2023-10-08 19:37:43,803][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 195657728. Throughput: 0: 1750.1, 1: 1732.0. Samples: 48930480. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:43,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.800')] +[2023-10-08 19:37:43,818][21194] Updated weights for policy 1, policy_version 95180 (0.0010) +[2023-10-08 19:37:43,896][21195] Updated weights for policy 0, policy_version 95910 (0.0007) +[2023-10-08 19:37:44,172][21194] Updated weights for policy 1, policy_version 95190 (0.0007) +[2023-10-08 19:37:44,273][21195] Updated weights for policy 0, policy_version 95920 (0.0008) +[2023-10-08 19:37:44,542][21194] Updated weights for policy 1, policy_version 95200 (0.0008) +[2023-10-08 19:37:44,636][21195] Updated weights for policy 0, policy_version 95930 (0.0009) +[2023-10-08 19:37:48,470][21194] Updated weights for policy 1, policy_version 95210 (0.0010) +[2023-10-08 19:37:48,657][21195] Updated weights for policy 0, policy_version 95940 (0.0009) +[2023-10-08 19:37:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 195723264. Throughput: 0: 1746.3, 1: 1715.5. Samples: 48945566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:48,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.800')] +[2023-10-08 19:37:48,841][21194] Updated weights for policy 1, policy_version 95220 (0.0009) +[2023-10-08 19:37:49,027][21195] Updated weights for policy 0, policy_version 95950 (0.0009) +[2023-10-08 19:37:49,208][21194] Updated weights for policy 1, policy_version 95230 (0.0010) +[2023-10-08 19:37:49,398][21195] Updated weights for policy 0, policy_version 95960 (0.0008) +[2023-10-08 19:37:52,994][21194] Updated weights for policy 1, policy_version 95240 (0.0008) +[2023-10-08 19:37:53,252][21195] Updated weights for policy 0, policy_version 95970 (0.0008) +[2023-10-08 19:37:53,362][21194] Updated weights for policy 1, policy_version 95250 (0.0007) +[2023-10-08 19:37:53,630][21195] Updated weights for policy 0, policy_version 95980 (0.0008) +[2023-10-08 19:37:53,723][21194] Updated weights for policy 1, policy_version 95260 (0.0007) +[2023-10-08 19:37:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 195788800. Throughput: 0: 1744.0, 1: 1731.3. Samples: 48961384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:53,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.800')] +[2023-10-08 19:37:53,991][21195] Updated weights for policy 0, policy_version 95990 (0.0009) +[2023-10-08 19:37:54,360][21195] Updated weights for policy 0, policy_version 96000 (0.0008) +[2023-10-08 19:37:57,793][21194] Updated weights for policy 1, policy_version 95270 (0.0009) +[2023-10-08 19:37:58,157][21194] Updated weights for policy 1, policy_version 95280 (0.0010) +[2023-10-08 19:37:58,190][21195] Updated weights for policy 0, policy_version 96010 (0.0009) +[2023-10-08 19:37:58,522][21194] Updated weights for policy 1, policy_version 95290 (0.0008) +[2023-10-08 19:37:58,556][21195] Updated weights for policy 0, policy_version 96020 (0.0007) +[2023-10-08 19:37:58,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 195887104. Throughput: 0: 1746.8, 1: 1720.8. Samples: 48982068. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:37:58,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.800')] +[2023-10-08 19:37:58,915][21195] Updated weights for policy 0, policy_version 96030 (0.0008) +[2023-10-08 19:38:02,633][21194] Updated weights for policy 1, policy_version 95300 (0.0008) +[2023-10-08 19:38:02,991][21194] Updated weights for policy 1, policy_version 95310 (0.0008) +[2023-10-08 19:38:03,028][21195] Updated weights for policy 0, policy_version 96040 (0.0008) +[2023-10-08 19:38:03,360][21194] Updated weights for policy 1, policy_version 95320 (0.0008) +[2023-10-08 19:38:03,387][21195] Updated weights for policy 0, policy_version 96050 (0.0009) +[2023-10-08 19:38:03,754][21195] Updated weights for policy 0, policy_version 96060 (0.0010) +[2023-10-08 19:38:03,802][19739] Fps is (10 sec: 16384.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 195952640. Throughput: 0: 1717.4, 1: 1725.1. Samples: 48996484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:03,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.800')] +[2023-10-08 19:38:07,302][21194] Updated weights for policy 1, policy_version 95330 (0.0008) +[2023-10-08 19:38:07,666][21194] Updated weights for policy 1, policy_version 95340 (0.0008) +[2023-10-08 19:38:07,742][21195] Updated weights for policy 0, policy_version 96070 (0.0008) +[2023-10-08 19:38:08,031][21194] Updated weights for policy 1, policy_version 95350 (0.0009) +[2023-10-08 19:38:08,111][21195] Updated weights for policy 0, policy_version 96080 (0.0009) +[2023-10-08 19:38:08,401][21194] Updated weights for policy 1, policy_version 95360 (0.0009) +[2023-10-08 19:38:08,474][21195] Updated weights for policy 0, policy_version 96090 (0.0008) +[2023-10-08 19:38:08,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 196050944. Throughput: 0: 1743.5, 1: 1728.3. Samples: 49012960. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:08,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.710')] +[2023-10-08 19:38:12,354][21195] Updated weights for policy 0, policy_version 96100 (0.0010) +[2023-10-08 19:38:12,360][21194] Updated weights for policy 1, policy_version 95370 (0.0009) +[2023-10-08 19:38:12,719][21194] Updated weights for policy 1, policy_version 95380 (0.0008) +[2023-10-08 19:38:12,721][21195] Updated weights for policy 0, policy_version 96110 (0.0008) +[2023-10-08 19:38:13,091][21195] Updated weights for policy 0, policy_version 96120 (0.0008) +[2023-10-08 19:38:13,095][21194] Updated weights for policy 1, policy_version 95390 (0.0007) +[2023-10-08 19:38:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 196116480. Throughput: 0: 1726.4, 1: 1705.2. Samples: 49032656. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:13,803][19739] Avg episode reward: [(0, '1183.240'), (1, '729.710')] +[2023-10-08 19:38:17,076][21194] Updated weights for policy 1, policy_version 95400 (0.0009) +[2023-10-08 19:38:17,129][21195] Updated weights for policy 0, policy_version 96130 (0.0009) +[2023-10-08 19:38:17,441][21194] Updated weights for policy 1, policy_version 95410 (0.0007) +[2023-10-08 19:38:17,500][21195] Updated weights for policy 0, policy_version 96140 (0.0008) +[2023-10-08 19:38:17,806][21194] Updated weights for policy 1, policy_version 95420 (0.0007) +[2023-10-08 19:38:17,874][21195] Updated weights for policy 0, policy_version 96150 (0.0009) +[2023-10-08 19:38:18,244][21195] Updated weights for policy 0, policy_version 96160 (0.0009) +[2023-10-08 19:38:18,803][19739] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 196182016. Throughput: 0: 1710.9, 1: 1736.2. Samples: 49048444. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:18,804][19739] Avg episode reward: [(0, '1183.240'), (1, '729.710')] +[2023-10-08 19:38:21,752][21194] Updated weights for policy 1, policy_version 95430 (0.0007) +[2023-10-08 19:38:22,107][21194] Updated weights for policy 1, policy_version 95440 (0.0008) +[2023-10-08 19:38:22,236][21195] Updated weights for policy 0, policy_version 96170 (0.0008) +[2023-10-08 19:38:22,474][21194] Updated weights for policy 1, policy_version 95450 (0.0007) +[2023-10-08 19:38:22,605][21195] Updated weights for policy 0, policy_version 96180 (0.0008) +[2023-10-08 19:38:22,971][21195] Updated weights for policy 0, policy_version 96190 (0.0009) +[2023-10-08 19:38:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 196247552. Throughput: 0: 1741.9, 1: 1717.3. Samples: 49064322. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:23,804][19739] Avg episode reward: [(0, '1183.240'), (1, '729.710')] +[2023-10-08 19:38:26,439][21194] Updated weights for policy 1, policy_version 95460 (0.0008) +[2023-10-08 19:38:26,804][21194] Updated weights for policy 1, policy_version 95470 (0.0007) +[2023-10-08 19:38:26,928][21195] Updated weights for policy 0, policy_version 96200 (0.0008) +[2023-10-08 19:38:27,184][21194] Updated weights for policy 1, policy_version 95480 (0.0007) +[2023-10-08 19:38:27,297][21195] Updated weights for policy 0, policy_version 96210 (0.0008) +[2023-10-08 19:38:27,656][21195] Updated weights for policy 0, policy_version 96220 (0.0007) +[2023-10-08 19:38:28,802][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 196313088. Throughput: 0: 1705.5, 1: 1701.1. Samples: 49083774. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:28,803][19739] Avg episode reward: [(0, '1187.910'), (1, '729.710')] +[2023-10-08 19:38:31,003][21194] Updated weights for policy 1, policy_version 95490 (0.0008) +[2023-10-08 19:38:31,371][21194] Updated weights for policy 1, policy_version 95500 (0.0009) +[2023-10-08 19:38:31,450][21195] Updated weights for policy 0, policy_version 96230 (0.0007) +[2023-10-08 19:38:31,744][21194] Updated weights for policy 1, policy_version 95510 (0.0008) +[2023-10-08 19:38:31,817][21195] Updated weights for policy 0, policy_version 96240 (0.0007) +[2023-10-08 19:38:32,097][21194] Updated weights for policy 1, policy_version 95520 (0.0009) +[2023-10-08 19:38:32,184][21195] Updated weights for policy 0, policy_version 96250 (0.0007) +[2023-10-08 19:38:33,803][19739] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 196378624. Throughput: 0: 1713.4, 1: 1729.4. Samples: 49100490. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:33,803][19739] Avg episode reward: [(0, '1187.910'), (1, '714.850')] +[2023-10-08 19:38:36,086][21195] Updated weights for policy 0, policy_version 96260 (0.0007) +[2023-10-08 19:38:36,128][21194] Updated weights for policy 1, policy_version 95530 (0.0009) +[2023-10-08 19:38:36,458][21195] Updated weights for policy 0, policy_version 96270 (0.0009) +[2023-10-08 19:38:36,487][21194] Updated weights for policy 1, policy_version 95540 (0.0008) +[2023-10-08 19:38:36,824][21195] Updated weights for policy 0, policy_version 96280 (0.0007) +[2023-10-08 19:38:36,847][21194] Updated weights for policy 1, policy_version 95550 (0.0008) +[2023-10-08 19:38:38,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13884.7). Total num frames: 196444160. Throughput: 0: 1717.8, 1: 1698.3. Samples: 49115108. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:38,804][19739] Avg episode reward: [(0, '1187.910'), (1, '712.390')] +[2023-10-08 19:38:40,622][21195] Updated weights for policy 0, policy_version 96290 (0.0007) +[2023-10-08 19:38:40,782][21194] Updated weights for policy 1, policy_version 95560 (0.0008) +[2023-10-08 19:38:41,012][21195] Updated weights for policy 0, policy_version 96300 (0.0007) +[2023-10-08 19:38:41,135][21194] Updated weights for policy 1, policy_version 95570 (0.0007) +[2023-10-08 19:38:41,381][21195] Updated weights for policy 0, policy_version 96310 (0.0008) +[2023-10-08 19:38:41,503][21194] Updated weights for policy 1, policy_version 95580 (0.0007) +[2023-10-08 19:38:41,757][21195] Updated weights for policy 0, policy_version 96320 (0.0009) +[2023-10-08 19:38:43,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 196509696. Throughput: 0: 1710.9, 1: 1715.3. Samples: 49136250. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:43,803][19739] Avg episode reward: [(0, '1203.470'), (1, '712.690')] +[2023-10-08 19:38:43,812][20740] Saving new best policy, reward=1203.470! +[2023-10-08 19:38:45,459][21194] Updated weights for policy 1, policy_version 95590 (0.0010) +[2023-10-08 19:38:45,651][21195] Updated weights for policy 0, policy_version 96330 (0.0009) +[2023-10-08 19:38:45,840][21194] Updated weights for policy 1, policy_version 95600 (0.0009) +[2023-10-08 19:38:46,017][21195] Updated weights for policy 0, policy_version 96340 (0.0007) +[2023-10-08 19:38:46,206][21194] Updated weights for policy 1, policy_version 95610 (0.0008) +[2023-10-08 19:38:46,394][21195] Updated weights for policy 0, policy_version 96350 (0.0010) +[2023-10-08 19:38:48,802][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 196575232. Throughput: 0: 1737.1, 1: 1719.1. Samples: 49152012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:48,803][19739] Avg episode reward: [(0, '1203.470'), (1, '698.530')] +[2023-10-08 19:38:50,249][21194] Updated weights for policy 1, policy_version 95620 (0.0009) +[2023-10-08 19:38:50,506][21195] Updated weights for policy 0, policy_version 96360 (0.0007) +[2023-10-08 19:38:50,613][21194] Updated weights for policy 1, policy_version 95630 (0.0008) +[2023-10-08 19:38:50,864][21195] Updated weights for policy 0, policy_version 96370 (0.0010) +[2023-10-08 19:38:50,972][21194] Updated weights for policy 1, policy_version 95640 (0.0007) +[2023-10-08 19:38:51,223][21195] Updated weights for policy 0, policy_version 96380 (0.0009) +[2023-10-08 19:38:53,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 196640768. Throughput: 0: 1710.6, 1: 1705.8. Samples: 49166700. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:53,803][19739] Avg episode reward: [(0, '1218.980'), (1, '684.040')] +[2023-10-08 19:38:53,804][20740] Saving new best policy, reward=1218.980! +[2023-10-08 19:38:55,047][21194] Updated weights for policy 1, policy_version 95650 (0.0007) +[2023-10-08 19:38:55,065][21195] Updated weights for policy 0, policy_version 96390 (0.0007) +[2023-10-08 19:38:55,409][21194] Updated weights for policy 1, policy_version 95660 (0.0007) +[2023-10-08 19:38:55,431][21195] Updated weights for policy 0, policy_version 96400 (0.0009) +[2023-10-08 19:38:55,777][21194] Updated weights for policy 1, policy_version 95670 (0.0007) +[2023-10-08 19:38:55,797][21195] Updated weights for policy 0, policy_version 96410 (0.0009) +[2023-10-08 19:38:56,128][21194] Updated weights for policy 1, policy_version 95680 (0.0008) +[2023-10-08 19:38:58,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 196706304. Throughput: 0: 1726.9, 1: 1727.3. Samples: 49188094. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:38:58,804][19739] Avg episode reward: [(0, '1218.980'), (1, '628.710')] +[2023-10-08 19:38:59,829][21195] Updated weights for policy 0, policy_version 96420 (0.0007) +[2023-10-08 19:39:00,093][21194] Updated weights for policy 1, policy_version 95690 (0.0009) +[2023-10-08 19:39:00,200][21195] Updated weights for policy 0, policy_version 96430 (0.0007) +[2023-10-08 19:39:00,461][21194] Updated weights for policy 1, policy_version 95700 (0.0008) +[2023-10-08 19:39:00,568][21195] Updated weights for policy 0, policy_version 96440 (0.0007) +[2023-10-08 19:39:00,820][21194] Updated weights for policy 1, policy_version 95710 (0.0008) +[2023-10-08 19:39:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 196771840. Throughput: 0: 1744.1, 1: 1699.9. Samples: 49203424. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:39:03,803][19739] Avg episode reward: [(0, '1218.980'), (1, '613.290')] +[2023-10-08 19:39:04,487][21195] Updated weights for policy 0, policy_version 96450 (0.0008) +[2023-10-08 19:39:04,765][21194] Updated weights for policy 1, policy_version 95720 (0.0007) +[2023-10-08 19:39:04,859][21195] Updated weights for policy 0, policy_version 96460 (0.0007) +[2023-10-08 19:39:05,124][21194] Updated weights for policy 1, policy_version 95730 (0.0007) +[2023-10-08 19:39:05,236][21195] Updated weights for policy 0, policy_version 96470 (0.0007) +[2023-10-08 19:39:05,488][21194] Updated weights for policy 1, policy_version 95740 (0.0009) +[2023-10-08 19:39:05,599][21195] Updated weights for policy 0, policy_version 96480 (0.0008) +[2023-10-08 19:39:08,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 196837376. Throughput: 0: 1715.3, 1: 1718.4. Samples: 49218842. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:39:08,803][19739] Avg episode reward: [(0, '1218.980'), (1, '613.520')] +[2023-10-08 19:39:09,321][21195] Updated weights for policy 0, policy_version 96490 (0.0007) +[2023-10-08 19:39:09,579][21194] Updated weights for policy 1, policy_version 95750 (0.0009) +[2023-10-08 19:39:09,684][21195] Updated weights for policy 0, policy_version 96500 (0.0007) +[2023-10-08 19:39:09,933][21194] Updated weights for policy 1, policy_version 95760 (0.0009) +[2023-10-08 19:39:10,055][21195] Updated weights for policy 0, policy_version 96510 (0.0007) +[2023-10-08 19:39:10,294][21194] Updated weights for policy 1, policy_version 95770 (0.0009) +[2023-10-08 19:39:13,803][19739] Fps is (10 sec: 13106.7, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 196902912. Throughput: 0: 1752.3, 1: 1733.2. Samples: 49240624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:39:13,804][19739] Avg episode reward: [(0, '1219.870'), (1, '613.520')] +[2023-10-08 19:39:13,815][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000095776_98074624.pth... +[2023-10-08 19:39:13,836][21195] Updated weights for policy 0, policy_version 96520 (0.0007) +[2023-10-08 19:39:13,851][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000094176_96436224.pth +[2023-10-08 19:39:14,186][21194] Updated weights for policy 1, policy_version 95780 (0.0007) +[2023-10-08 19:39:14,213][21195] Updated weights for policy 0, policy_version 96530 (0.0008) +[2023-10-08 19:39:14,548][21194] Updated weights for policy 1, policy_version 95790 (0.0007) +[2023-10-08 19:39:14,582][21195] Updated weights for policy 0, policy_version 96540 (0.0007) +[2023-10-08 19:39:14,733][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000096544_98861056.pth... +[2023-10-08 19:39:14,767][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000094912_97189888.pth +[2023-10-08 19:39:14,771][20740] Saving new best policy, reward=1219.870! +[2023-10-08 19:39:14,918][21194] Updated weights for policy 1, policy_version 95800 (0.0009) +[2023-10-08 19:39:18,595][21195] Updated weights for policy 0, policy_version 96550 (0.0008) +[2023-10-08 19:39:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 196968448. Throughput: 0: 1739.2, 1: 1702.8. Samples: 49255380. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:39:18,803][19739] Avg episode reward: [(0, '1207.440'), (1, '613.780')] +[2023-10-08 19:39:18,934][21194] Updated weights for policy 1, policy_version 95810 (0.0009) +[2023-10-08 19:39:18,968][21195] Updated weights for policy 0, policy_version 96560 (0.0008) +[2023-10-08 19:39:19,308][21194] Updated weights for policy 1, policy_version 95820 (0.0009) +[2023-10-08 19:39:19,333][21195] Updated weights for policy 0, policy_version 96570 (0.0009) +[2023-10-08 19:39:19,674][21194] Updated weights for policy 1, policy_version 95830 (0.0009) +[2023-10-08 19:39:20,041][21194] Updated weights for policy 1, policy_version 95840 (0.0009) +[2023-10-08 19:39:23,346][21195] Updated weights for policy 0, policy_version 96580 (0.0008) +[2023-10-08 19:39:23,709][21195] Updated weights for policy 0, policy_version 96590 (0.0008) +[2023-10-08 19:39:23,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 197033984. Throughput: 0: 1732.9, 1: 1732.8. Samples: 49271060. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:23,803][19739] Avg episode reward: [(0, '1191.960'), (1, '628.910')] +[2023-10-08 19:39:23,815][21194] Updated weights for policy 1, policy_version 95850 (0.0007) +[2023-10-08 19:39:24,077][21195] Updated weights for policy 0, policy_version 96600 (0.0010) +[2023-10-08 19:39:24,191][21194] Updated weights for policy 1, policy_version 95860 (0.0009) +[2023-10-08 19:39:24,550][21194] Updated weights for policy 1, policy_version 95870 (0.0009) +[2023-10-08 19:39:27,943][21195] Updated weights for policy 0, policy_version 96610 (0.0008) +[2023-10-08 19:39:28,348][21195] Updated weights for policy 0, policy_version 96620 (0.0007) +[2023-10-08 19:39:28,591][21194] Updated weights for policy 1, policy_version 95880 (0.0008) +[2023-10-08 19:39:28,716][21195] Updated weights for policy 0, policy_version 96630 (0.0008) +[2023-10-08 19:39:28,802][19739] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 197099520. Throughput: 0: 1745.2, 1: 1724.8. Samples: 49292404. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:28,803][19739] Avg episode reward: [(0, '1191.960'), (1, '629.070')] +[2023-10-08 19:39:28,964][21194] Updated weights for policy 1, policy_version 95890 (0.0010) +[2023-10-08 19:39:29,081][21195] Updated weights for policy 0, policy_version 96640 (0.0009) +[2023-10-08 19:39:29,331][21194] Updated weights for policy 1, policy_version 95900 (0.0010) +[2023-10-08 19:39:33,103][21195] Updated weights for policy 0, policy_version 96650 (0.0009) +[2023-10-08 19:39:33,225][21194] Updated weights for policy 1, policy_version 95910 (0.0008) +[2023-10-08 19:39:33,476][21195] Updated weights for policy 0, policy_version 96660 (0.0008) +[2023-10-08 19:39:33,582][21194] Updated weights for policy 1, policy_version 95920 (0.0007) +[2023-10-08 19:39:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13662.6). Total num frames: 197165056. Throughput: 0: 1716.2, 1: 1712.7. Samples: 49306312. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:33,803][19739] Avg episode reward: [(0, '1191.800'), (1, '629.070')] +[2023-10-08 19:39:33,837][21195] Updated weights for policy 0, policy_version 96670 (0.0009) +[2023-10-08 19:39:33,948][21194] Updated weights for policy 1, policy_version 95930 (0.0010) +[2023-10-08 19:39:37,741][21195] Updated weights for policy 0, policy_version 96680 (0.0009) +[2023-10-08 19:39:37,741][21194] Updated weights for policy 1, policy_version 95940 (0.0009) +[2023-10-08 19:39:38,103][21195] Updated weights for policy 0, policy_version 96690 (0.0009) +[2023-10-08 19:39:38,107][21194] Updated weights for policy 1, policy_version 95950 (0.0009) +[2023-10-08 19:39:38,472][21195] Updated weights for policy 0, policy_version 96700 (0.0008) +[2023-10-08 19:39:38,473][21194] Updated weights for policy 1, policy_version 95960 (0.0007) +[2023-10-08 19:39:38,803][19739] Fps is (10 sec: 19660.6, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 197296128. Throughput: 0: 1744.4, 1: 1728.0. Samples: 49322956. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:38,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.050')] +[2023-10-08 19:39:42,299][21194] Updated weights for policy 1, policy_version 95970 (0.0008) +[2023-10-08 19:39:42,664][21194] Updated weights for policy 1, policy_version 95980 (0.0008) +[2023-10-08 19:39:42,666][21195] Updated weights for policy 0, policy_version 96710 (0.0008) +[2023-10-08 19:39:43,026][21194] Updated weights for policy 1, policy_version 95990 (0.0007) +[2023-10-08 19:39:43,028][21195] Updated weights for policy 0, policy_version 96720 (0.0008) +[2023-10-08 19:39:43,391][21194] Updated weights for policy 1, policy_version 96000 (0.0007) +[2023-10-08 19:39:43,400][21195] Updated weights for policy 0, policy_version 96730 (0.0009) +[2023-10-08 19:39:43,803][19739] Fps is (10 sec: 19660.5, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 197361664. Throughput: 0: 1728.2, 1: 1717.2. Samples: 49343136. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:43,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:39:47,329][21194] Updated weights for policy 1, policy_version 96010 (0.0008) +[2023-10-08 19:39:47,335][21195] Updated weights for policy 0, policy_version 96740 (0.0010) +[2023-10-08 19:39:47,700][21194] Updated weights for policy 1, policy_version 96020 (0.0007) +[2023-10-08 19:39:47,705][21195] Updated weights for policy 0, policy_version 96750 (0.0009) +[2023-10-08 19:39:48,057][21194] Updated weights for policy 1, policy_version 96030 (0.0008) +[2023-10-08 19:39:48,065][21195] Updated weights for policy 0, policy_version 96760 (0.0008) +[2023-10-08 19:39:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 197427200. Throughput: 0: 1705.8, 1: 1735.9. Samples: 49358298. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:48,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:39:51,968][21195] Updated weights for policy 0, policy_version 96770 (0.0007) +[2023-10-08 19:39:52,282][21194] Updated weights for policy 1, policy_version 96040 (0.0008) +[2023-10-08 19:39:52,339][21195] Updated weights for policy 0, policy_version 96780 (0.0008) +[2023-10-08 19:39:52,657][21194] Updated weights for policy 1, policy_version 96050 (0.0008) +[2023-10-08 19:39:52,699][21195] Updated weights for policy 0, policy_version 96790 (0.0007) +[2023-10-08 19:39:53,018][21194] Updated weights for policy 1, policy_version 96060 (0.0008) +[2023-10-08 19:39:53,059][21195] Updated weights for policy 0, policy_version 96800 (0.0007) +[2023-10-08 19:39:53,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13884.8). Total num frames: 197492736. Throughput: 0: 1736.7, 1: 1728.2. Samples: 49374764. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:53,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:39:56,962][21194] Updated weights for policy 1, policy_version 96070 (0.0008) +[2023-10-08 19:39:56,994][21195] Updated weights for policy 0, policy_version 96810 (0.0008) +[2023-10-08 19:39:57,323][21194] Updated weights for policy 1, policy_version 96080 (0.0007) +[2023-10-08 19:39:57,367][21195] Updated weights for policy 0, policy_version 96820 (0.0008) +[2023-10-08 19:39:57,701][21194] Updated weights for policy 1, policy_version 96090 (0.0008) +[2023-10-08 19:39:57,727][21195] Updated weights for policy 0, policy_version 96830 (0.0008) +[2023-10-08 19:39:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 197558272. Throughput: 0: 1702.3, 1: 1698.1. Samples: 49393642. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:39:58,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:40:01,624][21195] Updated weights for policy 0, policy_version 96840 (0.0008) +[2023-10-08 19:40:01,662][21194] Updated weights for policy 1, policy_version 96100 (0.0009) +[2023-10-08 19:40:01,988][21195] Updated weights for policy 0, policy_version 96850 (0.0007) +[2023-10-08 19:40:02,039][21194] Updated weights for policy 1, policy_version 96110 (0.0007) +[2023-10-08 19:40:02,363][21195] Updated weights for policy 0, policy_version 96860 (0.0008) +[2023-10-08 19:40:02,397][21194] Updated weights for policy 1, policy_version 96120 (0.0008) +[2023-10-08 19:40:03,802][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13884.7). Total num frames: 197623808. Throughput: 0: 1714.9, 1: 1725.9. Samples: 49410218. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:40:03,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:40:06,406][21194] Updated weights for policy 1, policy_version 96130 (0.0010) +[2023-10-08 19:40:06,460][21195] Updated weights for policy 0, policy_version 96870 (0.0008) +[2023-10-08 19:40:06,767][21194] Updated weights for policy 1, policy_version 96140 (0.0007) +[2023-10-08 19:40:06,827][21195] Updated weights for policy 0, policy_version 96880 (0.0008) +[2023-10-08 19:40:07,126][21194] Updated weights for policy 1, policy_version 96150 (0.0008) +[2023-10-08 19:40:07,201][21195] Updated weights for policy 0, policy_version 96890 (0.0009) +[2023-10-08 19:40:07,489][21194] Updated weights for policy 1, policy_version 96160 (0.0008) +[2023-10-08 19:40:08,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13884.8). Total num frames: 197689344. Throughput: 0: 1723.8, 1: 1706.0. Samples: 49425400. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:40:08,804][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:40:11,224][21195] Updated weights for policy 0, policy_version 96900 (0.0009) +[2023-10-08 19:40:11,589][21195] Updated weights for policy 0, policy_version 96910 (0.0008) +[2023-10-08 19:40:11,645][21194] Updated weights for policy 1, policy_version 96170 (0.0010) +[2023-10-08 19:40:11,950][21195] Updated weights for policy 0, policy_version 96920 (0.0007) +[2023-10-08 19:40:12,016][21194] Updated weights for policy 1, policy_version 96180 (0.0009) +[2023-10-08 19:40:12,384][21194] Updated weights for policy 1, policy_version 96190 (0.0009) +[2023-10-08 19:40:13,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 197754880. Throughput: 0: 1700.9, 1: 1695.2. Samples: 49445230. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:40:13,803][19739] Avg episode reward: [(0, '1191.800'), (1, '630.400')] +[2023-10-08 19:40:15,867][21195] Updated weights for policy 0, policy_version 96930 (0.0007) +[2023-10-08 19:40:16,269][21195] Updated weights for policy 0, policy_version 96940 (0.0009) +[2023-10-08 19:40:16,436][21194] Updated weights for policy 1, policy_version 96200 (0.0008) +[2023-10-08 19:40:16,632][21195] Updated weights for policy 0, policy_version 96950 (0.0007) +[2023-10-08 19:40:16,807][21194] Updated weights for policy 1, policy_version 96210 (0.0009) +[2023-10-08 19:40:16,998][21195] Updated weights for policy 0, policy_version 96960 (0.0009) +[2023-10-08 19:40:17,174][21194] Updated weights for policy 1, policy_version 96220 (0.0008) +[2023-10-08 19:40:18,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 197820416. Throughput: 0: 1728.7, 1: 1721.4. Samples: 49461566. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 19:40:18,803][19739] Avg episode reward: [(0, '1203.200'), (1, '630.400')] +[2023-10-08 19:40:21,020][21195] Updated weights for policy 0, policy_version 96970 (0.0009) +[2023-10-08 19:40:21,160][21194] Updated weights for policy 1, policy_version 96230 (0.0008) +[2023-10-08 19:40:21,381][21195] Updated weights for policy 0, policy_version 96980 (0.0007) +[2023-10-08 19:40:21,535][21194] Updated weights for policy 1, policy_version 96240 (0.0008) +[2023-10-08 19:40:21,747][21195] Updated weights for policy 0, policy_version 96990 (0.0007) +[2023-10-08 19:40:21,890][21194] Updated weights for policy 1, policy_version 96250 (0.0009) +[2023-10-08 19:40:23,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 197885952. Throughput: 0: 1702.1, 1: 1691.7. Samples: 49475680. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:23,803][19739] Avg episode reward: [(0, '1203.200'), (1, '630.520')] +[2023-10-08 19:40:25,554][21195] Updated weights for policy 0, policy_version 97000 (0.0008) +[2023-10-08 19:40:25,928][21195] Updated weights for policy 0, policy_version 97010 (0.0009) +[2023-10-08 19:40:25,978][21194] Updated weights for policy 1, policy_version 96260 (0.0009) +[2023-10-08 19:40:26,293][21195] Updated weights for policy 0, policy_version 97020 (0.0008) +[2023-10-08 19:40:26,342][21194] Updated weights for policy 1, policy_version 96270 (0.0007) +[2023-10-08 19:40:26,719][21194] Updated weights for policy 1, policy_version 96280 (0.0010) +[2023-10-08 19:40:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 197951488. Throughput: 0: 1718.0, 1: 1700.0. Samples: 49496944. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:28,803][19739] Avg episode reward: [(0, '1203.200'), (1, '630.520')] +[2023-10-08 19:40:30,053][21195] Updated weights for policy 0, policy_version 97030 (0.0007) +[2023-10-08 19:40:30,425][21195] Updated weights for policy 0, policy_version 97040 (0.0008) +[2023-10-08 19:40:30,650][21194] Updated weights for policy 1, policy_version 96290 (0.0008) +[2023-10-08 19:40:30,786][21195] Updated weights for policy 0, policy_version 97050 (0.0009) +[2023-10-08 19:40:31,017][21194] Updated weights for policy 1, policy_version 96300 (0.0008) +[2023-10-08 19:40:31,393][21194] Updated weights for policy 1, policy_version 96310 (0.0008) +[2023-10-08 19:40:31,753][21194] Updated weights for policy 1, policy_version 96320 (0.0009) +[2023-10-08 19:40:33,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 198017024. Throughput: 0: 1741.2, 1: 1703.4. Samples: 49513304. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:33,803][19739] Avg episode reward: [(0, '1218.560'), (1, '630.520')] +[2023-10-08 19:40:34,720][21195] Updated weights for policy 0, policy_version 97060 (0.0008) +[2023-10-08 19:40:35,092][21195] Updated weights for policy 0, policy_version 97070 (0.0008) +[2023-10-08 19:40:35,458][21195] Updated weights for policy 0, policy_version 97080 (0.0008) +[2023-10-08 19:40:35,642][21194] Updated weights for policy 1, policy_version 96330 (0.0008) +[2023-10-08 19:40:36,000][21194] Updated weights for policy 1, policy_version 96340 (0.0008) +[2023-10-08 19:40:36,369][21194] Updated weights for policy 1, policy_version 96350 (0.0008) +[2023-10-08 19:40:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198082560. Throughput: 0: 1709.3, 1: 1690.6. Samples: 49527758. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:38,803][19739] Avg episode reward: [(0, '1218.020'), (1, '630.520')] +[2023-10-08 19:40:39,465][21195] Updated weights for policy 0, policy_version 97090 (0.0008) +[2023-10-08 19:40:39,826][21195] Updated weights for policy 0, policy_version 97100 (0.0007) +[2023-10-08 19:40:40,195][21195] Updated weights for policy 0, policy_version 97110 (0.0009) +[2023-10-08 19:40:40,372][21194] Updated weights for policy 1, policy_version 96360 (0.0008) +[2023-10-08 19:40:40,561][21195] Updated weights for policy 0, policy_version 97120 (0.0007) +[2023-10-08 19:40:40,748][21194] Updated weights for policy 1, policy_version 96370 (0.0008) +[2023-10-08 19:40:41,113][21194] Updated weights for policy 1, policy_version 96380 (0.0008) +[2023-10-08 19:40:43,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198148096. Throughput: 0: 1728.7, 1: 1716.4. Samples: 49548670. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:43,803][19739] Avg episode reward: [(0, '1218.020'), (1, '630.520')] +[2023-10-08 19:40:44,486][21195] Updated weights for policy 0, policy_version 97130 (0.0008) +[2023-10-08 19:40:44,856][21195] Updated weights for policy 0, policy_version 97140 (0.0007) +[2023-10-08 19:40:45,055][21194] Updated weights for policy 1, policy_version 96390 (0.0008) +[2023-10-08 19:40:45,220][21195] Updated weights for policy 0, policy_version 97150 (0.0008) +[2023-10-08 19:40:45,419][21194] Updated weights for policy 1, policy_version 96400 (0.0010) +[2023-10-08 19:40:45,792][21194] Updated weights for policy 1, policy_version 96410 (0.0010) +[2023-10-08 19:40:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198213632. Throughput: 0: 1733.0, 1: 1690.8. Samples: 49564290. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:48,803][19739] Avg episode reward: [(0, '1218.020'), (1, '630.520')] +[2023-10-08 19:40:49,095][21195] Updated weights for policy 0, policy_version 97160 (0.0009) +[2023-10-08 19:40:49,466][21195] Updated weights for policy 0, policy_version 97170 (0.0008) +[2023-10-08 19:40:49,772][21194] Updated weights for policy 1, policy_version 96420 (0.0009) +[2023-10-08 19:40:49,839][21195] Updated weights for policy 0, policy_version 97180 (0.0007) +[2023-10-08 19:40:50,140][21194] Updated weights for policy 1, policy_version 96430 (0.0009) +[2023-10-08 19:40:50,506][21194] Updated weights for policy 1, policy_version 96440 (0.0009) +[2023-10-08 19:40:53,776][21195] Updated weights for policy 0, policy_version 97190 (0.0008) +[2023-10-08 19:40:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198279168. Throughput: 0: 1718.5, 1: 1704.2. Samples: 49579420. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:53,803][19739] Avg episode reward: [(0, '1218.020'), (1, '630.520')] +[2023-10-08 19:40:54,144][21195] Updated weights for policy 0, policy_version 97200 (0.0008) +[2023-10-08 19:40:54,512][21195] Updated weights for policy 0, policy_version 97210 (0.0007) +[2023-10-08 19:40:54,562][21194] Updated weights for policy 1, policy_version 96450 (0.0008) +[2023-10-08 19:40:54,923][21194] Updated weights for policy 1, policy_version 96460 (0.0007) +[2023-10-08 19:40:55,288][21194] Updated weights for policy 1, policy_version 96470 (0.0008) +[2023-10-08 19:40:55,650][21194] Updated weights for policy 1, policy_version 96480 (0.0009) +[2023-10-08 19:40:58,399][21195] Updated weights for policy 0, policy_version 97220 (0.0008) +[2023-10-08 19:40:58,773][21195] Updated weights for policy 0, policy_version 97230 (0.0009) +[2023-10-08 19:40:58,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198344704. Throughput: 0: 1739.5, 1: 1720.8. Samples: 49600944. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:40:58,803][19739] Avg episode reward: [(0, '1218.020'), (1, '630.520')] +[2023-10-08 19:40:59,139][21195] Updated weights for policy 0, policy_version 97240 (0.0008) +[2023-10-08 19:40:59,638][21194] Updated weights for policy 1, policy_version 96490 (0.0009) +[2023-10-08 19:41:00,005][21194] Updated weights for policy 1, policy_version 96500 (0.0010) +[2023-10-08 19:41:00,377][21194] Updated weights for policy 1, policy_version 96510 (0.0008) +[2023-10-08 19:41:03,092][21195] Updated weights for policy 0, policy_version 97250 (0.0009) +[2023-10-08 19:41:03,485][21195] Updated weights for policy 0, policy_version 97260 (0.0009) +[2023-10-08 19:41:03,802][19739] Fps is (10 sec: 13107.3, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198410240. Throughput: 0: 1725.1, 1: 1694.2. Samples: 49615436. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:41:03,803][19739] Avg episode reward: [(0, '1218.020'), (1, '630.520')] +[2023-10-08 19:41:03,855][21195] Updated weights for policy 0, policy_version 97270 (0.0010) +[2023-10-08 19:41:04,226][21195] Updated weights for policy 0, policy_version 97280 (0.0009) +[2023-10-08 19:41:04,357][21194] Updated weights for policy 1, policy_version 96520 (0.0007) +[2023-10-08 19:41:04,739][21194] Updated weights for policy 1, policy_version 96530 (0.0008) +[2023-10-08 19:41:05,110][21194] Updated weights for policy 1, policy_version 96540 (0.0009) +[2023-10-08 19:41:08,075][21195] Updated weights for policy 0, policy_version 97290 (0.0008) +[2023-10-08 19:41:08,442][21195] Updated weights for policy 0, policy_version 97300 (0.0008) +[2023-10-08 19:41:08,802][19739] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 198475776. Throughput: 0: 1746.5, 1: 1722.1. Samples: 49631768. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:41:08,803][19739] Avg episode reward: [(0, '1218.020'), (1, '645.890')] +[2023-10-08 19:41:08,816][21195] Updated weights for policy 0, policy_version 97310 (0.0007) +[2023-10-08 19:41:09,017][21194] Updated weights for policy 1, policy_version 96550 (0.0009) +[2023-10-08 19:41:09,378][21194] Updated weights for policy 1, policy_version 96560 (0.0010) +[2023-10-08 19:41:09,745][21194] Updated weights for policy 1, policy_version 96570 (0.0008) +[2023-10-08 19:41:12,808][21195] Updated weights for policy 0, policy_version 97320 (0.0009) +[2023-10-08 19:41:13,175][21195] Updated weights for policy 0, policy_version 97330 (0.0009) +[2023-10-08 19:41:13,540][21195] Updated weights for policy 0, policy_version 97340 (0.0009) +[2023-10-08 19:41:13,793][21194] Updated weights for policy 1, policy_version 96580 (0.0008) +[2023-10-08 19:41:13,803][19739] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 198574080. Throughput: 0: 1736.0, 1: 1725.2. Samples: 49652698. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:41:13,803][19739] Avg episode reward: [(0, '1218.020'), (1, '645.890')] +[2023-10-08 19:41:13,812][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000097344_99680256.pth... +[2023-10-08 19:41:13,842][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000095712_98009088.pth +[2023-10-08 19:41:13,845][20740] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p0/milestones/checkpoint_000097344_99680256.pth +[2023-10-08 19:41:14,156][21194] Updated weights for policy 1, policy_version 96590 (0.0010) +[2023-10-08 19:41:14,518][21194] Updated weights for policy 1, policy_version 96600 (0.0008) +[2023-10-08 19:41:14,806][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000096608_98926592.pth... +[2023-10-08 19:41:14,834][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000094976_97255424.pth +[2023-10-08 19:41:14,838][20836] Saving a milestone ./train_atari/atari_atlantis_APPO/checkpoint_p1/milestones/checkpoint_000096608_98926592.pth +[2023-10-08 19:41:17,539][21195] Updated weights for policy 0, policy_version 97350 (0.0010) +[2023-10-08 19:41:17,916][21195] Updated weights for policy 0, policy_version 97360 (0.0012) +[2023-10-08 19:41:18,285][21195] Updated weights for policy 0, policy_version 97370 (0.0010) +[2023-10-08 19:41:18,479][21194] Updated weights for policy 1, policy_version 96610 (0.0010) +[2023-10-08 19:41:18,802][19739] Fps is (10 sec: 16384.0, 60 sec: 13653.4, 300 sec: 13773.7). Total num frames: 198639616. Throughput: 0: 1711.4, 1: 1704.9. Samples: 49667038. Policy #0 lag: (min: 5.0, avg: 5.7, max: 24.0) +[2023-10-08 19:41:18,803][19739] Avg episode reward: [(0, '1218.020'), (1, '650.210')] +[2023-10-08 19:41:18,852][21194] Updated weights for policy 1, policy_version 96620 (0.0007) +[2023-10-08 19:41:19,212][21194] Updated weights for policy 1, policy_version 96630 (0.0008) +[2023-10-08 19:41:19,588][21194] Updated weights for policy 1, policy_version 96640 (0.0008) +[2023-10-08 19:41:22,331][21195] Updated weights for policy 0, policy_version 97380 (0.0009) +[2023-10-08 19:41:22,691][21195] Updated weights for policy 0, policy_version 97390 (0.0007) +[2023-10-08 19:41:23,066][21195] Updated weights for policy 0, policy_version 97400 (0.0010) +[2023-10-08 19:41:23,522][21194] Updated weights for policy 1, policy_version 96650 (0.0009) +[2023-10-08 19:41:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 198705152. Throughput: 0: 1736.8, 1: 1730.2. Samples: 49683776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:23,803][19739] Avg episode reward: [(0, '1217.920'), (1, '636.040')] +[2023-10-08 19:41:23,894][21194] Updated weights for policy 1, policy_version 96660 (0.0010) +[2023-10-08 19:41:24,264][21194] Updated weights for policy 1, policy_version 96670 (0.0007) +[2023-10-08 19:41:26,950][21195] Updated weights for policy 0, policy_version 97410 (0.0009) +[2023-10-08 19:41:27,325][21195] Updated weights for policy 0, policy_version 97420 (0.0007) +[2023-10-08 19:41:27,696][21195] Updated weights for policy 0, policy_version 97430 (0.0007) +[2023-10-08 19:41:28,057][21195] Updated weights for policy 0, policy_version 97440 (0.0008) +[2023-10-08 19:41:28,249][21194] Updated weights for policy 1, policy_version 96680 (0.0008) +[2023-10-08 19:41:28,615][21194] Updated weights for policy 1, policy_version 96690 (0.0007) +[2023-10-08 19:41:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 198770688. Throughput: 0: 1724.0, 1: 1735.4. Samples: 49704342. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:28,803][19739] Avg episode reward: [(0, '1217.920'), (1, '636.040')] +[2023-10-08 19:41:28,973][21194] Updated weights for policy 1, policy_version 96700 (0.0008) +[2023-10-08 19:41:31,779][21195] Updated weights for policy 0, policy_version 97450 (0.0008) +[2023-10-08 19:41:32,148][21195] Updated weights for policy 0, policy_version 97460 (0.0010) +[2023-10-08 19:41:32,521][21195] Updated weights for policy 0, policy_version 97470 (0.0009) +[2023-10-08 19:41:32,829][21194] Updated weights for policy 1, policy_version 96710 (0.0007) +[2023-10-08 19:41:33,202][21194] Updated weights for policy 1, policy_version 96720 (0.0008) +[2023-10-08 19:41:33,571][21194] Updated weights for policy 1, policy_version 96730 (0.0009) +[2023-10-08 19:41:33,803][19739] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 198868992. Throughput: 0: 1716.5, 1: 1734.8. Samples: 49719602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:33,804][19739] Avg episode reward: [(0, '1217.920'), (1, '636.040')] +[2023-10-08 19:41:36,619][21195] Updated weights for policy 0, policy_version 97480 (0.0010) +[2023-10-08 19:41:36,989][21195] Updated weights for policy 0, policy_version 97490 (0.0011) +[2023-10-08 19:41:37,357][21195] Updated weights for policy 0, policy_version 97500 (0.0009) +[2023-10-08 19:41:37,375][21194] Updated weights for policy 1, policy_version 96740 (0.0007) +[2023-10-08 19:41:37,751][21194] Updated weights for policy 1, policy_version 96750 (0.0007) +[2023-10-08 19:41:38,112][21194] Updated weights for policy 1, policy_version 96760 (0.0008) +[2023-10-08 19:41:38,802][19739] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 198934528. Throughput: 0: 1733.1, 1: 1745.6. Samples: 49735958. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:38,803][19739] Avg episode reward: [(0, '1217.920'), (1, '636.890')] +[2023-10-08 19:41:41,245][21195] Updated weights for policy 0, policy_version 97510 (0.0007) +[2023-10-08 19:41:41,614][21195] Updated weights for policy 0, policy_version 97520 (0.0007) +[2023-10-08 19:41:41,922][21194] Updated weights for policy 1, policy_version 96770 (0.0008) +[2023-10-08 19:41:41,989][21195] Updated weights for policy 0, policy_version 97530 (0.0009) +[2023-10-08 19:41:42,280][21194] Updated weights for policy 1, policy_version 96780 (0.0008) +[2023-10-08 19:41:42,650][21194] Updated weights for policy 1, policy_version 96790 (0.0007) +[2023-10-08 19:41:43,006][21194] Updated weights for policy 1, policy_version 96800 (0.0007) +[2023-10-08 19:41:43,803][19739] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 199000064. Throughput: 0: 1716.6, 1: 1715.8. Samples: 49755402. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:43,803][19739] Avg episode reward: [(0, '1238.090'), (1, '651.720')] +[2023-10-08 19:41:43,809][20740] Saving new best policy, reward=1238.090! +[2023-10-08 19:41:45,880][21195] Updated weights for policy 0, policy_version 97540 (0.0008) +[2023-10-08 19:41:46,248][21195] Updated weights for policy 0, policy_version 97550 (0.0007) +[2023-10-08 19:41:46,611][21195] Updated weights for policy 0, policy_version 97560 (0.0007) +[2023-10-08 19:41:46,878][21194] Updated weights for policy 1, policy_version 96810 (0.0007) +[2023-10-08 19:41:47,249][21194] Updated weights for policy 1, policy_version 96820 (0.0011) +[2023-10-08 19:41:47,607][21194] Updated weights for policy 1, policy_version 96830 (0.0009) +[2023-10-08 19:41:48,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 199065600. Throughput: 0: 1733.1, 1: 1741.9. Samples: 49771810. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:48,803][19739] Avg episode reward: [(0, '1238.090'), (1, '651.720')] +[2023-10-08 19:41:50,362][21195] Updated weights for policy 0, policy_version 97570 (0.0008) +[2023-10-08 19:41:50,724][21195] Updated weights for policy 0, policy_version 97580 (0.0011) +[2023-10-08 19:41:51,086][21195] Updated weights for policy 0, policy_version 97590 (0.0011) +[2023-10-08 19:41:51,450][21195] Updated weights for policy 0, policy_version 97600 (0.0010) +[2023-10-08 19:41:51,719][21194] Updated weights for policy 1, policy_version 96840 (0.0008) +[2023-10-08 19:41:52,080][21194] Updated weights for policy 1, policy_version 96850 (0.0010) +[2023-10-08 19:41:52,445][21194] Updated weights for policy 1, policy_version 96860 (0.0010) +[2023-10-08 19:41:53,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 199131136. Throughput: 0: 1711.9, 1: 1727.3. Samples: 49786532. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:53,803][19739] Avg episode reward: [(0, '1238.090'), (1, '666.660')] +[2023-10-08 19:41:55,643][21195] Updated weights for policy 0, policy_version 97610 (0.0010) +[2023-10-08 19:41:56,018][21195] Updated weights for policy 0, policy_version 97620 (0.0011) +[2023-10-08 19:41:56,172][21194] Updated weights for policy 1, policy_version 96870 (0.0008) +[2023-10-08 19:41:56,381][21195] Updated weights for policy 0, policy_version 97630 (0.0009) +[2023-10-08 19:41:56,538][21194] Updated weights for policy 1, policy_version 96880 (0.0009) +[2023-10-08 19:41:56,893][21194] Updated weights for policy 1, policy_version 96890 (0.0007) +[2023-10-08 19:41:58,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 199196672. Throughput: 0: 1717.9, 1: 1720.5. Samples: 49807428. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:41:58,803][19739] Avg episode reward: [(0, '1238.090'), (1, '666.660')] +[2023-10-08 19:42:00,327][21195] Updated weights for policy 0, policy_version 97640 (0.0009) +[2023-10-08 19:42:00,693][21195] Updated weights for policy 0, policy_version 97650 (0.0009) +[2023-10-08 19:42:00,768][21194] Updated weights for policy 1, policy_version 96900 (0.0009) +[2023-10-08 19:42:01,062][21195] Updated weights for policy 0, policy_version 97660 (0.0008) +[2023-10-08 19:42:01,120][21194] Updated weights for policy 1, policy_version 96910 (0.0009) +[2023-10-08 19:42:01,481][21194] Updated weights for policy 1, policy_version 96920 (0.0007) +[2023-10-08 19:42:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 199262208. Throughput: 0: 1738.5, 1: 1741.0. Samples: 49823616. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:42:03,803][19739] Avg episode reward: [(0, '1238.090'), (1, '666.660')] +[2023-10-08 19:42:05,020][21195] Updated weights for policy 0, policy_version 97670 (0.0008) +[2023-10-08 19:42:05,385][21195] Updated weights for policy 0, policy_version 97680 (0.0008) +[2023-10-08 19:42:05,577][21194] Updated weights for policy 1, policy_version 96930 (0.0008) +[2023-10-08 19:42:05,753][21195] Updated weights for policy 0, policy_version 97690 (0.0009) +[2023-10-08 19:42:05,946][21194] Updated weights for policy 1, policy_version 96940 (0.0007) +[2023-10-08 19:42:06,317][21194] Updated weights for policy 1, policy_version 96950 (0.0010) +[2023-10-08 19:42:06,681][21194] Updated weights for policy 1, policy_version 96960 (0.0011) +[2023-10-08 19:42:08,803][19739] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 199327744. Throughput: 0: 1715.2, 1: 1715.4. Samples: 49838152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:42:08,803][19739] Avg episode reward: [(0, '1238.090'), (1, '666.660')] +[2023-10-08 19:42:09,741][21195] Updated weights for policy 0, policy_version 97700 (0.0007) +[2023-10-08 19:42:10,100][21195] Updated weights for policy 0, policy_version 97710 (0.0007) +[2023-10-08 19:42:10,471][21195] Updated weights for policy 0, policy_version 97720 (0.0008) +[2023-10-08 19:42:10,576][21194] Updated weights for policy 1, policy_version 96970 (0.0008) +[2023-10-08 19:42:10,951][21194] Updated weights for policy 1, policy_version 96980 (0.0008) +[2023-10-08 19:42:11,312][21194] Updated weights for policy 1, policy_version 96990 (0.0008) +[2023-10-08 19:42:13,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 199393280. Throughput: 0: 1736.7, 1: 1718.9. Samples: 49859844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:42:13,803][19739] Avg episode reward: [(0, '1238.090'), (1, '681.890')] +[2023-10-08 19:42:14,192][21195] Updated weights for policy 0, policy_version 97730 (0.0008) +[2023-10-08 19:42:14,560][21195] Updated weights for policy 0, policy_version 97740 (0.0007) +[2023-10-08 19:42:14,919][21195] Updated weights for policy 0, policy_version 97750 (0.0009) +[2023-10-08 19:42:15,294][21195] Updated weights for policy 0, policy_version 97760 (0.0011) +[2023-10-08 19:42:15,466][21194] Updated weights for policy 1, policy_version 97000 (0.0010) +[2023-10-08 19:42:15,835][21194] Updated weights for policy 1, policy_version 97010 (0.0008) +[2023-10-08 19:42:16,201][21194] Updated weights for policy 1, policy_version 97020 (0.0009) +[2023-10-08 19:42:18,803][19739] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 199458816. Throughput: 0: 1743.1, 1: 1726.5. Samples: 49875734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:42:18,803][19739] Avg episode reward: [(0, '1238.090'), (1, '683.060')] +[2023-10-08 19:42:19,408][21195] Updated weights for policy 0, policy_version 97770 (0.0008) +[2023-10-08 19:42:19,776][21195] Updated weights for policy 0, policy_version 97780 (0.0008) +[2023-10-08 19:42:19,955][21194] Updated weights for policy 1, policy_version 97030 (0.0007) +[2023-10-08 19:42:20,142][21195] Updated weights for policy 0, policy_version 97790 (0.0009) +[2023-10-08 19:42:20,323][21194] Updated weights for policy 1, policy_version 97040 (0.0009) +[2023-10-08 19:42:20,698][21194] Updated weights for policy 1, policy_version 97050 (0.0009) +[2023-10-08 19:42:23,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 199524352. Throughput: 0: 1727.6, 1: 1714.4. Samples: 49890850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 19:42:23,803][19739] Avg episode reward: [(0, '1238.090'), (1, '683.060')] +[2023-10-08 19:42:23,950][21195] Updated weights for policy 0, policy_version 97800 (0.0010) +[2023-10-08 19:42:24,320][21195] Updated weights for policy 0, policy_version 97810 (0.0010) +[2023-10-08 19:42:24,688][21195] Updated weights for policy 0, policy_version 97820 (0.0010) +[2023-10-08 19:42:24,758][21194] Updated weights for policy 1, policy_version 97060 (0.0009) +[2023-10-08 19:42:25,122][21194] Updated weights for policy 1, policy_version 97070 (0.0009) +[2023-10-08 19:42:25,489][21194] Updated weights for policy 1, policy_version 97080 (0.0008) +[2023-10-08 19:42:28,465][21195] Updated weights for policy 0, policy_version 97830 (0.0007) +[2023-10-08 19:42:28,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 199589888. Throughput: 0: 1752.0, 1: 1744.0. Samples: 49912720. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:28,803][19739] Avg episode reward: [(0, '1238.090'), (1, '683.060')] +[2023-10-08 19:42:28,835][21195] Updated weights for policy 0, policy_version 97840 (0.0007) +[2023-10-08 19:42:29,208][21195] Updated weights for policy 0, policy_version 97850 (0.0008) +[2023-10-08 19:42:29,489][21194] Updated weights for policy 1, policy_version 97090 (0.0009) +[2023-10-08 19:42:29,857][21194] Updated weights for policy 1, policy_version 97100 (0.0009) +[2023-10-08 19:42:30,233][21194] Updated weights for policy 1, policy_version 97110 (0.0010) +[2023-10-08 19:42:30,597][21194] Updated weights for policy 1, policy_version 97120 (0.0008) +[2023-10-08 19:42:32,890][21195] Updated weights for policy 0, policy_version 97860 (0.0008) +[2023-10-08 19:42:33,261][21195] Updated weights for policy 0, policy_version 97870 (0.0010) +[2023-10-08 19:42:33,632][21195] Updated weights for policy 0, policy_version 97880 (0.0010) +[2023-10-08 19:42:33,803][19739] Fps is (10 sec: 13106.8, 60 sec: 13107.2, 300 sec: 13773.7). Total num frames: 199655424. Throughput: 0: 1734.2, 1: 1718.6. Samples: 49927184. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:33,804][19739] Avg episode reward: [(0, '1238.090'), (1, '683.060')] +[2023-10-08 19:42:34,489][21194] Updated weights for policy 1, policy_version 97130 (0.0008) +[2023-10-08 19:42:34,846][21194] Updated weights for policy 1, policy_version 97140 (0.0010) +[2023-10-08 19:42:35,205][21194] Updated weights for policy 1, policy_version 97150 (0.0011) +[2023-10-08 19:42:37,439][21195] Updated weights for policy 0, policy_version 97890 (0.0008) +[2023-10-08 19:42:37,809][21195] Updated weights for policy 0, policy_version 97900 (0.0009) +[2023-10-08 19:42:38,170][21195] Updated weights for policy 0, policy_version 97910 (0.0007) +[2023-10-08 19:42:38,534][21195] Updated weights for policy 0, policy_version 97920 (0.0008) +[2023-10-08 19:42:38,803][19739] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 199753728. Throughput: 0: 1759.3, 1: 1734.9. Samples: 49943774. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:38,803][19739] Avg episode reward: [(0, '1246.600'), (1, '683.060')] +[2023-10-08 19:42:38,804][20740] Saving new best policy, reward=1246.600! +[2023-10-08 19:42:39,158][21194] Updated weights for policy 1, policy_version 97160 (0.0007) +[2023-10-08 19:42:39,524][21194] Updated weights for policy 1, policy_version 97170 (0.0009) +[2023-10-08 19:42:39,880][21194] Updated weights for policy 1, policy_version 97180 (0.0009) +[2023-10-08 19:42:42,552][21195] Updated weights for policy 0, policy_version 97930 (0.0009) +[2023-10-08 19:42:42,916][21195] Updated weights for policy 0, policy_version 97940 (0.0007) +[2023-10-08 19:42:43,290][21195] Updated weights for policy 0, policy_version 97950 (0.0008) +[2023-10-08 19:42:43,713][21194] Updated weights for policy 1, policy_version 97190 (0.0009) +[2023-10-08 19:42:43,803][19739] Fps is (10 sec: 16384.5, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 199819264. Throughput: 0: 1744.1, 1: 1746.9. Samples: 49964524. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:43,803][19739] Avg episode reward: [(0, '1231.020'), (1, '683.060')] +[2023-10-08 19:42:44,078][21194] Updated weights for policy 1, policy_version 97200 (0.0010) +[2023-10-08 19:42:44,431][21194] Updated weights for policy 1, policy_version 97210 (0.0008) +[2023-10-08 19:42:47,130][21195] Updated weights for policy 0, policy_version 97960 (0.0008) +[2023-10-08 19:42:47,494][21195] Updated weights for policy 0, policy_version 97970 (0.0009) +[2023-10-08 19:42:47,862][21195] Updated weights for policy 0, policy_version 97980 (0.0008) +[2023-10-08 19:42:48,498][21194] Updated weights for policy 1, policy_version 97220 (0.0008) +[2023-10-08 19:42:48,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13884.7). Total num frames: 199884800. Throughput: 0: 1739.8, 1: 1725.8. Samples: 49979570. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:48,803][19739] Avg episode reward: [(0, '1226.000'), (1, '683.060')] +[2023-10-08 19:42:48,860][21194] Updated weights for policy 1, policy_version 97230 (0.0008) +[2023-10-08 19:42:49,234][21194] Updated weights for policy 1, policy_version 97240 (0.0009) +[2023-10-08 19:42:51,692][21195] Updated weights for policy 0, policy_version 97990 (0.0010) +[2023-10-08 19:42:52,053][21195] Updated weights for policy 0, policy_version 98000 (0.0008) +[2023-10-08 19:42:52,422][21195] Updated weights for policy 0, policy_version 98010 (0.0007) +[2023-10-08 19:42:53,122][21194] Updated weights for policy 1, policy_version 97250 (0.0010) +[2023-10-08 19:42:53,478][21194] Updated weights for policy 1, policy_version 97260 (0.0009) +[2023-10-08 19:42:53,803][19739] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 199950336. Throughput: 0: 1765.4, 1: 1744.8. Samples: 49996112. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:53,803][19739] Avg episode reward: [(0, '1226.000'), (1, '683.060')] +[2023-10-08 19:42:53,849][21194] Updated weights for policy 1, policy_version 97270 (0.0008) +[2023-10-08 19:42:54,218][21194] Updated weights for policy 1, policy_version 97280 (0.0007) +[2023-10-08 19:42:56,322][21195] Updated weights for policy 0, policy_version 98020 (0.0007) +[2023-10-08 19:42:56,689][21195] Updated weights for policy 0, policy_version 98030 (0.0009) +[2023-10-08 19:42:57,058][21195] Updated weights for policy 0, policy_version 98040 (0.0008) +[2023-10-08 19:42:58,270][21194] Updated weights for policy 1, policy_version 97290 (0.0009) +[2023-10-08 19:42:58,640][21194] Updated weights for policy 1, policy_version 97300 (0.0009) +[2023-10-08 19:42:58,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 200015872. Throughput: 0: 1743.9, 1: 1737.9. Samples: 50016524. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:42:58,803][19739] Avg episode reward: [(0, '1226.000'), (1, '683.060')] +[2023-10-08 19:42:59,010][21194] Updated weights for policy 1, policy_version 97310 (0.0009) +[2023-10-08 19:43:00,756][21195] Updated weights for policy 0, policy_version 98050 (0.0008) +[2023-10-08 19:43:01,137][21195] Updated weights for policy 0, policy_version 98060 (0.0009) +[2023-10-08 19:43:01,495][21195] Updated weights for policy 0, policy_version 98070 (0.0011) +[2023-10-08 19:43:01,862][21195] Updated weights for policy 0, policy_version 98080 (0.0010) +[2023-10-08 19:43:03,150][21194] Updated weights for policy 1, policy_version 97320 (0.0010) +[2023-10-08 19:43:03,516][21194] Updated weights for policy 1, policy_version 97330 (0.0007) +[2023-10-08 19:43:03,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13662.6). Total num frames: 200081408. Throughput: 0: 1748.6, 1: 1731.5. Samples: 50032340. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:43:03,803][19739] Avg episode reward: [(0, '1232.150'), (1, '712.050')] +[2023-10-08 19:43:03,879][21194] Updated weights for policy 1, policy_version 97340 (0.0009) +[2023-10-08 19:43:05,782][21195] Updated weights for policy 0, policy_version 98090 (0.0009) +[2023-10-08 19:43:06,150][21195] Updated weights for policy 0, policy_version 98100 (0.0009) +[2023-10-08 19:43:06,516][21195] Updated weights for policy 0, policy_version 98110 (0.0007) +[2023-10-08 19:43:07,714][21194] Updated weights for policy 1, policy_version 97350 (0.0008) +[2023-10-08 19:43:08,076][21194] Updated weights for policy 1, policy_version 97360 (0.0008) +[2023-10-08 19:43:08,445][21194] Updated weights for policy 1, policy_version 97370 (0.0007) +[2023-10-08 19:43:08,803][19739] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 200179712. Throughput: 0: 1748.4, 1: 1735.6. Samples: 50047630. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:43:08,803][19739] Avg episode reward: [(0, '1232.150'), (1, '710.840')] +[2023-10-08 19:43:10,441][21195] Updated weights for policy 0, policy_version 98120 (0.0007) +[2023-10-08 19:43:10,807][21195] Updated weights for policy 0, policy_version 98130 (0.0008) +[2023-10-08 19:43:11,176][21195] Updated weights for policy 0, policy_version 98140 (0.0011) +[2023-10-08 19:43:12,292][21194] Updated weights for policy 1, policy_version 97380 (0.0009) +[2023-10-08 19:43:12,654][21194] Updated weights for policy 1, policy_version 97390 (0.0008) +[2023-10-08 19:43:13,018][21194] Updated weights for policy 1, policy_version 97400 (0.0007) +[2023-10-08 19:43:13,803][19739] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 13773.7). Total num frames: 200245248. Throughput: 0: 1740.7, 1: 1714.7. Samples: 50068212. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:43:13,803][19739] Avg episode reward: [(0, '1232.150'), (1, '710.840')] +[2023-10-08 19:43:13,811][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000098144_100499456.pth... +[2023-10-08 19:43:13,811][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000097408_99745792.pth... +[2023-10-08 19:43:13,842][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000096544_98861056.pth +[2023-10-08 19:43:13,848][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000095776_98074624.pth +[2023-10-08 19:43:15,064][21195] Updated weights for policy 0, policy_version 98150 (0.0010) +[2023-10-08 19:43:15,432][21195] Updated weights for policy 0, policy_version 98160 (0.0011) +[2023-10-08 19:43:15,795][21195] Updated weights for policy 0, policy_version 98170 (0.0009) +[2023-10-08 19:43:16,948][21194] Updated weights for policy 1, policy_version 97410 (0.0008) +[2023-10-08 19:43:17,324][21194] Updated weights for policy 1, policy_version 97420 (0.0008) +[2023-10-08 19:43:17,697][21194] Updated weights for policy 1, policy_version 97430 (0.0007) +[2023-10-08 19:43:18,056][21194] Updated weights for policy 1, policy_version 97440 (0.0009) +[2023-10-08 19:43:18,802][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 200310784. Throughput: 0: 1765.0, 1: 1736.7. Samples: 50084758. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:43:18,803][19739] Avg episode reward: [(0, '1232.150'), (1, '711.420')] +[2023-10-08 19:43:19,629][21195] Updated weights for policy 0, policy_version 98180 (0.0010) +[2023-10-08 19:43:19,992][21195] Updated weights for policy 0, policy_version 98190 (0.0010) +[2023-10-08 19:43:20,363][21195] Updated weights for policy 0, policy_version 98200 (0.0007) +[2023-10-08 19:43:21,945][21194] Updated weights for policy 1, policy_version 97450 (0.0009) +[2023-10-08 19:43:22,318][21194] Updated weights for policy 1, policy_version 97460 (0.0008) +[2023-10-08 19:43:22,677][21194] Updated weights for policy 1, policy_version 97470 (0.0008) +[2023-10-08 19:43:23,803][19739] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 200376320. Throughput: 0: 1736.4, 1: 1725.0. Samples: 50099538. Policy #0 lag: (min: 30.0, avg: 42.4, max: 62.0) +[2023-10-08 19:43:23,803][19739] Avg episode reward: [(0, '1232.320'), (1, '696.940')] +[2023-10-08 19:43:24,534][21195] Updated weights for policy 0, policy_version 98210 (0.0007) +[2023-10-08 19:43:24,905][21195] Updated weights for policy 0, policy_version 98220 (0.0008) +[2023-10-08 19:43:25,271][21195] Updated weights for policy 0, policy_version 98230 (0.0009) +[2023-10-08 19:43:25,644][21195] Updated weights for policy 0, policy_version 98240 (0.0011) +[2023-10-08 19:43:26,735][21194] Updated weights for policy 1, policy_version 97480 (0.0009) +[2023-10-08 19:43:27,097][21194] Updated weights for policy 1, policy_version 97490 (0.0008) +[2023-10-08 19:43:27,468][21194] Updated weights for policy 1, policy_version 97500 (0.0007) +[2023-10-08 19:43:28,803][19739] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 200441856. Throughput: 0: 1761.2, 1: 1699.0. Samples: 50120234. Policy #0 lag: (min: 31.0, avg: 36.9, max: 63.0) +[2023-10-08 19:43:28,803][19739] Avg episode reward: [(0, '1232.130'), (1, '696.940')] +[2023-10-08 19:43:29,510][21195] Updated weights for policy 0, policy_version 98250 (0.0007) +[2023-10-08 19:43:29,877][21195] Updated weights for policy 0, policy_version 98260 (0.0008) +[2023-10-08 19:43:30,245][21195] Updated weights for policy 0, policy_version 98270 (0.0007) +[2023-10-08 19:43:31,464][21194] Updated weights for policy 1, policy_version 97510 (0.0009) +[2023-10-08 19:43:31,824][21194] Updated weights for policy 1, policy_version 97520 (0.0009) +[2023-10-08 19:43:32,184][21194] Updated weights for policy 1, policy_version 97530 (0.0008) +[2023-10-08 19:43:33,803][19739] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13773.7). Total num frames: 200507392. Throughput: 0: 1776.3, 1: 1728.1. Samples: 50137270. Policy #0 lag: (min: 31.0, avg: 36.9, max: 63.0) +[2023-10-08 19:43:33,804][19739] Avg episode reward: [(0, '1232.130'), (1, '697.580')] +[2023-10-08 19:43:34,054][21195] Updated weights for policy 0, policy_version 98280 (0.0010) +[2023-10-08 19:43:34,418][21195] Updated weights for policy 0, policy_version 98290 (0.0010) +[2023-10-08 19:43:34,787][21195] Updated weights for policy 0, policy_version 98300 (0.0011) +[2023-10-08 19:43:36,018][21194] Updated weights for policy 1, policy_version 97540 (0.0009) +[2023-10-08 19:43:36,385][21194] Updated weights for policy 1, policy_version 97550 (0.0007) +[2023-10-08 19:43:36,761][21194] Updated weights for policy 1, policy_version 97560 (0.0009) +[2023-10-08 19:43:38,594][21195] Updated weights for policy 0, policy_version 98310 (0.0009) +[2023-10-08 19:43:38,803][19739] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 200572928. Throughput: 0: 1751.2, 1: 1704.0. Samples: 50151594. Policy #0 lag: (min: 31.0, avg: 36.9, max: 63.0) +[2023-10-08 19:43:38,803][19739] Avg episode reward: [(0, '1231.950'), (1, '697.640')] +[2023-10-08 19:43:38,965][21195] Updated weights for policy 0, policy_version 98320 (0.0007) +[2023-10-08 19:43:39,339][21195] Updated weights for policy 0, policy_version 98330 (0.0010) +[2023-10-08 19:43:40,747][21194] Updated weights for policy 1, policy_version 97570 (0.0008) +[2023-10-08 19:43:41,111][21194] Updated weights for policy 1, policy_version 97580 (0.0011) +[2023-10-08 19:43:41,478][21194] Updated weights for policy 1, policy_version 97590 (0.0007) +[2023-10-08 19:43:41,841][21194] Updated weights for policy 1, policy_version 97600 (0.0010) +[2023-10-08 19:43:43,087][21195] Updated weights for policy 0, policy_version 98340 (0.0009) +[2023-10-08 19:43:43,456][21195] Updated weights for policy 0, policy_version 98350 (0.0009) +[2023-10-08 19:43:43,803][19739] Fps is (10 sec: 13107.6, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 200638464. Throughput: 0: 1773.6, 1: 1706.7. Samples: 50173136. Policy #0 lag: (min: 31.0, avg: 36.9, max: 63.0) +[2023-10-08 19:43:43,803][19739] Avg episode reward: [(0, '1228.270'), (1, '707.460')] +[2023-10-08 19:43:43,817][21195] Updated weights for policy 0, policy_version 98360 (0.0009) +[2023-10-08 19:43:45,756][21194] Updated weights for policy 1, policy_version 97610 (0.0010) +[2023-10-08 19:43:46,119][21194] Updated weights for policy 1, policy_version 97620 (0.0009) +[2023-10-08 19:43:46,483][21194] Updated weights for policy 1, policy_version 97630 (0.0011) +[2023-10-08 19:43:47,755][21195] Updated weights for policy 0, policy_version 98370 (0.0010) +[2023-10-08 19:43:48,124][21195] Updated weights for policy 0, policy_version 98380 (0.0008) +[2023-10-08 19:43:48,484][21195] Updated weights for policy 0, policy_version 98390 (0.0009) +[2023-10-08 19:43:48,803][19739] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 13773.7). Total num frames: 200704000. Throughput: 0: 1738.7, 1: 1718.1. Samples: 50187898. Policy #0 lag: (min: 31.0, avg: 36.9, max: 63.0) +[2023-10-08 19:43:48,804][19739] Avg episode reward: [(0, '1228.270'), (1, '707.460')] +[2023-10-08 19:43:48,849][21195] Updated weights for policy 0, policy_version 98400 (0.0009) +[2023-10-08 19:43:50,429][21194] Updated weights for policy 1, policy_version 97640 (0.0010) +[2023-10-08 19:43:50,798][21194] Updated weights for policy 1, policy_version 97650 (0.0010) +[2023-10-08 19:43:51,163][21194] Updated weights for policy 1, policy_version 97660 (0.0010) +[2023-10-08 19:43:52,835][21195] Updated weights for policy 0, policy_version 98410 (0.0008) +[2023-10-08 19:43:53,205][21195] Updated weights for policy 0, policy_version 98420 (0.0007) +[2023-10-08 19:43:53,579][21195] Updated weights for policy 0, policy_version 98430 (0.0009) +[2023-10-08 19:43:53,645][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000098432_100794368.pth... +[2023-10-08 19:43:53,645][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000097664_100007936.pth... +[2023-10-08 19:43:53,645][21229] Stopping RolloutWorker_w1... +[2023-10-08 19:43:53,645][21240] Stopping RolloutWorker_w11... +[2023-10-08 19:43:53,645][21229] Loop rollout_proc1_evt_loop terminating... +[2023-10-08 19:43:53,646][21240] Loop rollout_proc11_evt_loop terminating... +[2023-10-08 19:43:53,646][21924] Stopping RolloutWorker_w15... +[2023-10-08 19:43:53,646][21239] Stopping RolloutWorker_w9... +[2023-10-08 19:43:53,646][19739] Component RolloutWorker_w1 stopped! +[2023-10-08 19:43:53,646][21924] Loop rollout_proc15_evt_loop terminating... +[2023-10-08 19:43:53,646][21239] Loop rollout_proc9_evt_loop terminating... +[2023-10-08 19:43:53,647][21237] Stopping RolloutWorker_w6... +[2023-10-08 19:43:53,647][21237] Loop rollout_proc6_evt_loop terminating... +[2023-10-08 19:43:53,647][21232] Stopping RolloutWorker_w2... +[2023-10-08 19:43:53,647][21233] Stopping RolloutWorker_w7... +[2023-10-08 19:43:53,647][19739] Component RolloutWorker_w11 stopped! +[2023-10-08 19:43:53,647][21232] Loop rollout_proc2_evt_loop terminating... +[2023-10-08 19:43:53,648][21233] Loop rollout_proc7_evt_loop terminating... +[2023-10-08 19:43:53,647][21234] Stopping RolloutWorker_w0... +[2023-10-08 19:43:53,648][21886] Stopping RolloutWorker_w14... +[2023-10-08 19:43:53,648][21234] Loop rollout_proc0_evt_loop terminating... +[2023-10-08 19:43:53,648][21886] Loop rollout_proc14_evt_loop terminating... +[2023-10-08 19:43:53,648][21230] Stopping RolloutWorker_w3... +[2023-10-08 19:43:53,648][19739] Component RolloutWorker_w15 stopped! +[2023-10-08 19:43:53,649][21230] Loop rollout_proc3_evt_loop terminating... +[2023-10-08 19:43:53,649][21242] Stopping RolloutWorker_w12... +[2023-10-08 19:43:53,649][21235] Stopping RolloutWorker_w4... +[2023-10-08 19:43:53,649][19739] Component RolloutWorker_w9 stopped! +[2023-10-08 19:43:53,649][21235] Loop rollout_proc4_evt_loop terminating... +[2023-10-08 19:43:53,649][21242] Loop rollout_proc12_evt_loop terminating... +[2023-10-08 19:43:53,649][21241] Stopping RolloutWorker_w10... +[2023-10-08 19:43:53,650][21241] Loop rollout_proc10_evt_loop terminating... +[2023-10-08 19:43:53,649][19739] Component RolloutWorker_w6 stopped! +[2023-10-08 19:43:53,650][19739] Component RolloutWorker_w2 stopped! +[2023-10-08 19:43:53,651][19739] Component RolloutWorker_w7 stopped! +[2023-10-08 19:43:53,652][21236] Stopping RolloutWorker_w5... +[2023-10-08 19:43:53,652][21243] Stopping RolloutWorker_w13... +[2023-10-08 19:43:53,652][21238] Stopping RolloutWorker_w8... +[2023-10-08 19:43:53,651][19739] Component RolloutWorker_w0 stopped! +[2023-10-08 19:43:53,652][20836] Stopping Batcher_1... +[2023-10-08 19:43:53,652][21238] Loop rollout_proc8_evt_loop terminating... +[2023-10-08 19:43:53,652][21243] Loop rollout_proc13_evt_loop terminating... +[2023-10-08 19:43:53,652][21236] Loop rollout_proc5_evt_loop terminating... +[2023-10-08 19:43:53,652][19739] Component RolloutWorker_w14 stopped! +[2023-10-08 19:43:53,653][19739] Component RolloutWorker_w3 stopped! +[2023-10-08 19:43:53,654][19739] Component RolloutWorker_w12 stopped! +[2023-10-08 19:43:53,654][19739] Component RolloutWorker_w4 stopped! +[2023-10-08 19:43:53,654][19739] Component RolloutWorker_w10 stopped! +[2023-10-08 19:43:53,654][19739] Component RolloutWorker_w5 stopped! +[2023-10-08 19:43:53,655][19739] Component RolloutWorker_w13 stopped! +[2023-10-08 19:43:53,655][19739] Component RolloutWorker_w8 stopped! +[2023-10-08 19:43:53,655][19739] Component Batcher_1 stopped! +[2023-10-08 19:43:53,656][19739] Component Batcher_0 stopped! +[2023-10-08 19:43:53,673][21194] Weights refcount: 2 0 +[2023-10-08 19:43:53,675][21194] Stopping InferenceWorker_p1-w0... +[2023-10-08 19:43:53,676][21194] Loop inference_proc1-0_evt_loop terminating... +[2023-10-08 19:43:53,675][19739] Component InferenceWorker_p1-w0 stopped! +[2023-10-08 19:43:53,667][20740] Stopping Batcher_0... +[2023-10-08 19:43:53,678][20740] Loop batcher_evt_loop terminating... +[2023-10-08 19:43:53,679][20740] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000097344_99680256.pth +[2023-10-08 19:43:53,667][20836] Loop batcher_evt_loop terminating... +[2023-10-08 19:43:53,681][21195] Weights refcount: 2 0 +[2023-10-08 19:43:53,683][21195] Stopping InferenceWorker_p0-w0... +[2023-10-08 19:43:53,684][21195] Loop inference_proc0-0_evt_loop terminating... +[2023-10-08 19:43:53,684][20740] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p0/checkpoint_000098432_100794368.pth... +[2023-10-08 19:43:53,683][19739] Component InferenceWorker_p0-w0 stopped! +[2023-10-08 19:43:53,695][20836] Removing ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000096608_98926592.pth +[2023-10-08 19:43:53,701][20836] Saving ./train_atari/atari_atlantis_APPO/checkpoint_p1/checkpoint_000097664_100007936.pth... +[2023-10-08 19:43:53,741][20740] Stopping LearnerWorker_p0... +[2023-10-08 19:43:53,742][20740] Loop learner_proc0_evt_loop terminating... +[2023-10-08 19:43:53,742][19739] Component LearnerWorker_p0 stopped! +[2023-10-08 19:43:53,756][20836] Stopping LearnerWorker_p1... +[2023-10-08 19:43:53,757][20836] Loop learner_proc1_evt_loop terminating... +[2023-10-08 19:43:53,757][19739] Component LearnerWorker_p1 stopped! +[2023-10-08 19:43:53,758][19739] Waiting for process learner_proc0 to stop... +[2023-10-08 19:43:54,603][19739] Waiting for process learner_proc1 to stop... +[2023-10-08 19:43:54,635][19739] Waiting for process inference_proc0-0 to join... +[2023-10-08 19:43:54,635][19739] Waiting for process inference_proc1-0 to join... +[2023-10-08 19:43:54,636][19739] Waiting for process rollout_proc0 to join... +[2023-10-08 19:43:54,637][19739] Waiting for process rollout_proc1 to join... +[2023-10-08 19:43:54,638][19739] Waiting for process rollout_proc2 to join... +[2023-10-08 19:43:54,638][19739] Waiting for process rollout_proc3 to join... +[2023-10-08 19:43:54,639][19739] Waiting for process rollout_proc4 to join... +[2023-10-08 19:43:54,639][19739] Waiting for process rollout_proc5 to join... +[2023-10-08 19:43:54,640][19739] Waiting for process rollout_proc6 to join... +[2023-10-08 19:43:54,641][19739] Waiting for process rollout_proc7 to join... +[2023-10-08 19:43:54,641][19739] Waiting for process rollout_proc8 to join... +[2023-10-08 19:43:54,642][19739] Waiting for process rollout_proc9 to join... +[2023-10-08 19:43:54,643][19739] Waiting for process rollout_proc10 to join... +[2023-10-08 19:43:54,643][19739] Waiting for process rollout_proc11 to join... +[2023-10-08 19:43:54,643][19739] Waiting for process rollout_proc12 to join... +[2023-10-08 19:43:54,644][19739] Waiting for process rollout_proc13 to join... +[2023-10-08 19:43:54,644][19739] Waiting for process rollout_proc14 to join... +[2023-10-08 19:43:54,645][19739] Waiting for process rollout_proc15 to join... +[2023-10-08 19:43:54,645][19739] Batcher 0 profile tree view: +batching: 170.1098, releasing_batches: 0.0893 +[2023-10-08 19:43:54,645][19739] Batcher 1 profile tree view: +batching: 168.2526, releasing_batches: 0.0902 +[2023-10-08 19:43:54,645][19739] InferenceWorker_p0-w0 profile tree view: +wait_policy: 0.0001 + wait_policy_total: 2361.5568 +update_model: 201.2080 + weight_update: 0.0010 +one_step: 0.0035 + handle_policy_step: 11299.1360 + deserialize: 63.7486, stack: 195.6376, obs_to_device_normalize: 2527.0382, forward: 5096.0262, prepare_outputs: 2465.9282, send_messages: 463.7048 +[2023-10-08 19:43:54,646][19739] InferenceWorker_p1-w0 profile tree view: +wait_policy: 0.0000 + wait_policy_total: 2399.7468 +update_model: 202.9519 + weight_update: 0.0010 +one_step: 0.0023 + handle_policy_step: 11261.3325 + deserialize: 63.2959, stack: 193.3789, obs_to_device_normalize: 2526.0325, forward: 5091.8727, prepare_outputs: 2434.7968, send_messages: 460.8200 +[2023-10-08 19:43:54,646][19739] Learner 0 profile tree view: +misc: 0.0195, prepare_batch: 263.5477 +train: 3648.1710 + epoch_init: 0.1937, minibatch_init: 13.3461, losses_postprocess: 894.9374, kl_divergence: 30.8972, update: 384.3450, after_optimizer: 2140.3059 + calculate_losses: 167.4775 + losses_init: 0.3785, forward_head: 56.3126, bptt_initial: 1.4310, bptt: 1.9914, tail: 38.3027, advantages_returns: 11.1516, losses: 44.2689 +[2023-10-08 19:43:54,646][19739] Learner 1 profile tree view: +misc: 0.0193, prepare_batch: 261.4445 +train: 3592.8294 + epoch_init: 0.1873, minibatch_init: 13.1474, losses_postprocess: 879.9661, kl_divergence: 31.2447, update: 382.4236, after_optimizer: 2102.6647 + calculate_losses: 166.3988 + losses_init: 0.5345, forward_head: 55.8964, bptt_initial: 1.3970, bptt: 1.9202, tail: 37.9139, advantages_returns: 11.1002, losses: 43.9372 +[2023-10-08 19:43:54,647][19739] RolloutWorker_w0 profile tree view: +wait_for_trajectories: 1.2354, enqueue_policy_requests: 410.5443, process_policy_outputs: 192.9268, env_step: 7258.4229, finalize_trajectories: 3.5970, complete_rollouts: 2.9438 +post_env_step: 376.6819 + process_env_step: 83.2042 +[2023-10-08 19:43:54,647][19739] RolloutWorker_w15 profile tree view: +wait_for_trajectories: 1.2554, enqueue_policy_requests: 408.4870, process_policy_outputs: 190.5457, env_step: 7314.7473, finalize_trajectories: 3.4175, complete_rollouts: 2.9836 +post_env_step: 372.7387 + process_env_step: 83.2993 +[2023-10-08 19:43:54,647][19739] Loop Runner_EvtLoop terminating... +[2023-10-08 19:43:54,648][19739] Runner profile tree view: +main_loop: 14556.4070 +[2023-10-08 19:43:54,648][19739] Collected {0: 100794368, 1: 100007936}, FPS: 13794.8