diff --git "a/sf_log.txt" "b/sf_log.txt" new file mode 100644--- /dev/null +++ "b/sf_log.txt" @@ -0,0 +1,26140 @@ +[2023-10-08 11:46:20,747][101941] Saving configuration to ./train_atari/atari_asteroid_APPO/config.json... +[2023-10-08 11:46:21,063][101941] Rollout worker 0 uses device cpu +[2023-10-08 11:46:21,064][101941] Rollout worker 1 uses device cpu +[2023-10-08 11:46:21,065][101941] Rollout worker 2 uses device cpu +[2023-10-08 11:46:21,065][101941] Rollout worker 3 uses device cpu +[2023-10-08 11:46:21,066][101941] Rollout worker 4 uses device cpu +[2023-10-08 11:46:21,066][101941] Rollout worker 5 uses device cpu +[2023-10-08 11:46:21,066][101941] Rollout worker 6 uses device cpu +[2023-10-08 11:46:21,067][101941] Rollout worker 7 uses device cpu +[2023-10-08 11:46:21,067][101941] Rollout worker 8 uses device cpu +[2023-10-08 11:46:21,068][101941] Rollout worker 9 uses device cpu +[2023-10-08 11:46:21,068][101941] Rollout worker 10 uses device cpu +[2023-10-08 11:46:21,069][101941] Rollout worker 11 uses device cpu +[2023-10-08 11:46:21,069][101941] Rollout worker 12 uses device cpu +[2023-10-08 11:46:21,069][101941] Rollout worker 13 uses device cpu +[2023-10-08 11:46:21,070][101941] Rollout worker 14 uses device cpu +[2023-10-08 11:46:21,070][101941] Rollout worker 15 uses device cpu +[2023-10-08 11:46:21,356][101941] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 11:46:21,357][101941] InferenceWorker_p0-w0: min num requests: 2 +[2023-10-08 11:46:21,360][101941] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-10-08 11:46:21,360][101941] InferenceWorker_p1-w0: min num requests: 2 +[2023-10-08 11:46:21,406][101941] Starting all processes... +[2023-10-08 11:46:21,406][101941] Starting process learner_proc0 +[2023-10-08 11:46:23,112][101941] Starting process learner_proc1 +[2023-10-08 11:46:23,115][102634] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 11:46:23,116][102634] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-10-08 11:46:23,133][102634] Num visible devices: 1 +[2023-10-08 11:46:23,153][102634] Setting fixed seed 1234 +[2023-10-08 11:46:23,154][102634] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 11:46:23,154][102634] Initializing actor-critic model on device cuda:0 +[2023-10-08 11:46:23,155][102634] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 11:46:23,155][102634] RunningMeanStd input shape: (1,) +[2023-10-08 11:46:23,167][102634] ConvEncoder: input_channels=4 +[2023-10-08 11:46:23,321][102634] Conv encoder output size: 512 +[2023-10-08 11:46:23,322][102634] Created Actor Critic model with architecture: +[2023-10-08 11:46:23,323][102634] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): MultiInputEncoder( + (encoders): ModuleDict( + (obs): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ReLU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ReLU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ReLU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ReLU) + ) + ) + ) + ) + ) + (core): ModelCoreIdentity() + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=14, bias=True) + ) +) +[2023-10-08 11:46:23,887][102634] Using optimizer +[2023-10-08 11:46:23,888][102634] No checkpoints found +[2023-10-08 11:46:23,888][102634] Did not load from checkpoint, starting from scratch! +[2023-10-08 11:46:23,889][102634] Initialized policy 0 weights for model version 0 +[2023-10-08 11:46:23,891][102634] LearnerWorker_p0 finished initialization! +[2023-10-08 11:46:23,891][102634] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 11:46:24,909][101941] Starting all processes... +[2023-10-08 11:46:24,912][102760] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-10-08 11:46:24,912][102760] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-10-08 11:46:24,917][101941] Starting process inference_proc0-0 +[2023-10-08 11:46:24,917][101941] Starting process inference_proc1-0 +[2023-10-08 11:46:24,918][101941] Starting process rollout_proc0 +[2023-10-08 11:46:24,931][102760] Num visible devices: 1 +[2023-10-08 11:46:24,918][101941] Starting process rollout_proc1 +[2023-10-08 11:46:24,918][101941] Starting process rollout_proc2 +[2023-10-08 11:46:24,919][101941] Starting process rollout_proc3 +[2023-10-08 11:46:24,948][102760] Setting fixed seed 1234 +[2023-10-08 11:46:24,924][101941] Starting process rollout_proc4 +[2023-10-08 11:46:24,950][102760] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-10-08 11:46:24,950][102760] Initializing actor-critic model on device cuda:0 +[2023-10-08 11:46:24,950][102760] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 11:46:24,951][102760] RunningMeanStd input shape: (1,) +[2023-10-08 11:46:24,925][101941] Starting process rollout_proc5 +[2023-10-08 11:46:24,929][101941] Starting process rollout_proc6 +[2023-10-08 11:46:24,929][101941] Starting process rollout_proc7 +[2023-10-08 11:46:24,930][101941] Starting process rollout_proc8 +[2023-10-08 11:46:24,963][102760] ConvEncoder: input_channels=4 +[2023-10-08 11:46:24,930][101941] Starting process rollout_proc9 +[2023-10-08 11:46:24,932][101941] Starting process rollout_proc10 +[2023-10-08 11:46:24,932][101941] Starting process rollout_proc11 +[2023-10-08 11:46:24,934][101941] Starting process rollout_proc12 +[2023-10-08 11:46:24,938][101941] Starting process rollout_proc13 +[2023-10-08 11:46:25,482][102760] Conv encoder output size: 512 +[2023-10-08 11:46:25,484][102760] Created Actor Critic model with architecture: +[2023-10-08 11:46:25,484][102760] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): MultiInputEncoder( + (encoders): ModuleDict( + (obs): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ReLU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ReLU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ReLU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ReLU) + ) + ) + ) + ) + ) + (core): ModelCoreIdentity() + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=14, bias=True) + ) +) +[2023-10-08 11:46:26,355][102760] Using optimizer +[2023-10-08 11:46:26,356][102760] No checkpoints found +[2023-10-08 11:46:26,356][102760] Did not load from checkpoint, starting from scratch! +[2023-10-08 11:46:26,356][102760] Initialized policy 1 weights for model version 0 +[2023-10-08 11:46:26,358][102760] LearnerWorker_p1 finished initialization! +[2023-10-08 11:46:26,359][102760] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-10-08 11:46:27,188][101941] Starting process rollout_proc14 +[2023-10-08 11:46:27,194][102938] Worker 7 uses CPU cores [14, 15] +[2023-10-08 11:46:27,205][101941] Starting process rollout_proc15 +[2023-10-08 11:46:27,210][102944] Worker 13 uses CPU cores [26, 27] +[2023-10-08 11:46:27,212][102942] Worker 11 uses CPU cores [22, 23] +[2023-10-08 11:46:27,217][102941] Worker 10 uses CPU cores [20, 21] +[2023-10-08 11:46:27,416][102935] Worker 2 uses CPU cores [4, 5] +[2023-10-08 11:46:27,456][102940] Worker 9 uses CPU cores [18, 19] +[2023-10-08 11:46:27,499][102932] Worker 3 uses CPU cores [6, 7] +[2023-10-08 11:46:27,505][102937] Worker 6 uses CPU cores [12, 13] +[2023-10-08 11:46:27,515][102943] Worker 12 uses CPU cores [24, 25] +[2023-10-08 11:46:27,518][102934] Worker 4 uses CPU cores [8, 9] +[2023-10-08 11:46:27,530][102897] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-10-08 11:46:27,531][102897] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-10-08 11:46:27,538][102898] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-10-08 11:46:27,538][102898] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-10-08 11:46:27,549][102897] Num visible devices: 1 +[2023-10-08 11:46:27,557][102898] Num visible devices: 1 +[2023-10-08 11:46:27,627][102933] Worker 1 uses CPU cores [2, 3] +[2023-10-08 11:46:27,664][102939] Worker 8 uses CPU cores [16, 17] +[2023-10-08 11:46:27,676][102936] Worker 5 uses CPU cores [10, 11] +[2023-10-08 11:46:27,810][102930] Worker 0 uses CPU cores [0, 1] +[2023-10-08 11:46:28,187][102897] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 11:46:28,187][102897] RunningMeanStd input shape: (1,) +[2023-10-08 11:46:28,199][102897] ConvEncoder: input_channels=4 +[2023-10-08 11:46:28,241][102898] RunningMeanStd input shape: (4, 84, 84) +[2023-10-08 11:46:28,242][102898] RunningMeanStd input shape: (1,) +[2023-10-08 11:46:28,261][102898] ConvEncoder: input_channels=4 +[2023-10-08 11:46:28,305][102897] Conv encoder output size: 512 +[2023-10-08 11:46:28,378][102898] Conv encoder output size: 512 +[2023-10-08 11:46:29,112][103679] Worker 15 uses CPU cores [30, 31] +[2023-10-08 11:46:29,118][101941] Inference worker 0-0 is ready! +[2023-10-08 11:46:29,119][101941] Inference worker 1-0 is ready! +[2023-10-08 11:46:29,119][103647] Worker 14 uses CPU cores [28, 29] +[2023-10-08 11:46:29,120][101941] All inference workers are ready! Signal rollout workers to start! +[2023-10-08 11:46:29,121][102935] EnvRunner 2-0 uses policy 0 +[2023-10-08 11:46:29,121][102933] EnvRunner 1-0 uses policy 1 +[2023-10-08 11:46:29,121][102930] EnvRunner 0-0 uses policy 0 +[2023-10-08 11:46:29,121][102944] EnvRunner 13-0 uses policy 1 +[2023-10-08 11:46:29,121][102943] EnvRunner 12-0 uses policy 0 +[2023-10-08 11:46:29,121][102940] EnvRunner 9-0 uses policy 1 +[2023-10-08 11:46:29,121][102942] EnvRunner 11-0 uses policy 1 +[2023-10-08 11:46:29,121][102939] EnvRunner 8-0 uses policy 0 +[2023-10-08 11:46:29,122][102938] EnvRunner 7-0 uses policy 1 +[2023-10-08 11:46:29,121][102937] EnvRunner 6-0 uses policy 0 +[2023-10-08 11:46:29,122][102934] EnvRunner 4-0 uses policy 0 +[2023-10-08 11:46:29,122][102941] EnvRunner 10-0 uses policy 0 +[2023-10-08 11:46:29,122][102936] EnvRunner 5-0 uses policy 1 +[2023-10-08 11:46:29,122][102932] EnvRunner 3-0 uses policy 1 +[2023-10-08 11:46:29,122][101941] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-10-08 11:46:29,296][103679] EnvRunner 15-0 uses policy 1 +[2023-10-08 11:46:29,304][103647] EnvRunner 14-0 uses policy 0 +[2023-10-08 11:46:31,344][101941] Heartbeat connected on Batcher_0 +[2023-10-08 11:46:31,347][101941] Heartbeat connected on LearnerWorker_p0 +[2023-10-08 11:46:31,350][101941] Heartbeat connected on Batcher_1 +[2023-10-08 11:46:31,352][101941] Heartbeat connected on LearnerWorker_p1 +[2023-10-08 11:46:31,359][101941] Heartbeat connected on InferenceWorker_p0-w0 +[2023-10-08 11:46:31,363][101941] Heartbeat connected on InferenceWorker_p1-w0 +[2023-10-08 11:46:31,364][101941] Heartbeat connected on RolloutWorker_w0 +[2023-10-08 11:46:31,368][101941] Heartbeat connected on RolloutWorker_w1 +[2023-10-08 11:46:31,373][101941] Heartbeat connected on RolloutWorker_w2 +[2023-10-08 11:46:31,374][101941] Heartbeat connected on RolloutWorker_w3 +[2023-10-08 11:46:31,378][101941] Heartbeat connected on RolloutWorker_w4 +[2023-10-08 11:46:31,379][101941] Heartbeat connected on RolloutWorker_w5 +[2023-10-08 11:46:31,382][101941] Heartbeat connected on RolloutWorker_w6 +[2023-10-08 11:46:31,386][101941] Heartbeat connected on RolloutWorker_w7 +[2023-10-08 11:46:31,389][101941] Heartbeat connected on RolloutWorker_w8 +[2023-10-08 11:46:31,389][101941] Heartbeat connected on RolloutWorker_w9 +[2023-10-08 11:46:31,392][101941] Heartbeat connected on RolloutWorker_w10 +[2023-10-08 11:46:31,396][101941] Heartbeat connected on RolloutWorker_w12 +[2023-10-08 11:46:31,399][101941] Heartbeat connected on RolloutWorker_w11 +[2023-10-08 11:46:31,400][101941] Heartbeat connected on RolloutWorker_w13 +[2023-10-08 11:46:31,402][101941] Heartbeat connected on RolloutWorker_w14 +[2023-10-08 11:46:31,407][101941] Heartbeat connected on RolloutWorker_w15 +[2023-10-08 11:46:31,875][101941] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 593.4, 1: 631.9. Samples: 3374. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-10-08 11:46:31,876][101941] Avg episode reward: [(0, '2.667'), (1, '1.750')] +[2023-10-08 11:46:36,875][101941] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 1018.4, 1: 1025.4. Samples: 15846. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-10-08 11:46:36,876][101941] Avg episode reward: [(0, '3.113'), (1, '3.016')] +[2023-10-08 11:46:38,904][102897] Updated weights for policy 0, policy_version 10 (0.0009) +[2023-10-08 11:46:38,944][102898] Updated weights for policy 1, policy_version 10 (0.0008) +[2023-10-08 11:46:39,270][102897] Updated weights for policy 0, policy_version 20 (0.0008) +[2023-10-08 11:46:39,306][102898] Updated weights for policy 1, policy_version 20 (0.0008) +[2023-10-08 11:46:39,635][102897] Updated weights for policy 0, policy_version 30 (0.0007) +[2023-10-08 11:46:39,678][102898] Updated weights for policy 1, policy_version 30 (0.0009) +[2023-10-08 11:46:41,875][101941] Fps is (10 sec: 6553.7, 60 sec: 5138.7, 300 sec: 5138.7). Total num frames: 65536. Throughput: 0: 1301.5, 1: 1300.2. Samples: 33180. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 11:46:41,876][101941] Avg episode reward: [(0, '3.230'), (1, '3.178')] +[2023-10-08 11:46:42,051][102897] Updated weights for policy 0, policy_version 40 (0.0008) +[2023-10-08 11:46:42,101][102898] Updated weights for policy 1, policy_version 40 (0.0010) +[2023-10-08 11:46:42,427][102897] Updated weights for policy 0, policy_version 50 (0.0010) +[2023-10-08 11:46:42,466][102898] Updated weights for policy 1, policy_version 50 (0.0008) +[2023-10-08 11:46:42,805][102897] Updated weights for policy 0, policy_version 60 (0.0009) +[2023-10-08 11:46:42,826][102898] Updated weights for policy 1, policy_version 60 (0.0009) +[2023-10-08 11:46:46,079][102897] Updated weights for policy 0, policy_version 70 (0.0007) +[2023-10-08 11:46:46,089][102898] Updated weights for policy 1, policy_version 70 (0.0008) +[2023-10-08 11:46:46,447][102897] Updated weights for policy 0, policy_version 80 (0.0008) +[2023-10-08 11:46:46,451][102898] Updated weights for policy 1, policy_version 80 (0.0008) +[2023-10-08 11:46:46,815][102898] Updated weights for policy 1, policy_version 90 (0.0009) +[2023-10-08 11:46:46,821][102897] Updated weights for policy 0, policy_version 90 (0.0008) +[2023-10-08 11:46:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 7383.0, 300 sec: 7383.0). Total num frames: 131072. Throughput: 0: 1512.6, 1: 1504.5. Samples: 53564. Policy #0 lag: (min: 33.0, avg: 33.0, max: 33.0) +[2023-10-08 11:46:46,875][101941] Avg episode reward: [(0, '3.430'), (1, '3.600')] +[2023-10-08 11:46:50,105][102898] Updated weights for policy 1, policy_version 100 (0.0008) +[2023-10-08 11:46:50,270][102897] Updated weights for policy 0, policy_version 100 (0.0008) +[2023-10-08 11:46:50,465][102898] Updated weights for policy 1, policy_version 110 (0.0007) +[2023-10-08 11:46:50,643][102897] Updated weights for policy 0, policy_version 110 (0.0008) +[2023-10-08 11:46:50,838][102898] Updated weights for policy 1, policy_version 120 (0.0008) +[2023-10-08 11:46:51,010][102897] Updated weights for policy 0, policy_version 120 (0.0008) +[2023-10-08 11:46:51,875][101941] Fps is (10 sec: 19661.0, 60 sec: 11521.2, 300 sec: 11521.2). Total num frames: 262144. Throughput: 0: 1410.6, 1: 1415.8. Samples: 64310. Policy #0 lag: (min: 22.0, avg: 29.9, max: 54.0) +[2023-10-08 11:46:51,875][101941] Avg episode reward: [(0, '3.990'), (1, '3.520')] +[2023-10-08 11:46:51,876][102634] Saving new best policy, reward=3.990! +[2023-10-08 11:46:51,876][102760] Saving new best policy, reward=3.520! +[2023-10-08 11:46:54,858][102898] Updated weights for policy 1, policy_version 130 (0.0008) +[2023-10-08 11:46:54,886][102897] Updated weights for policy 0, policy_version 130 (0.0009) +[2023-10-08 11:46:55,227][102898] Updated weights for policy 1, policy_version 140 (0.0007) +[2023-10-08 11:46:55,258][102897] Updated weights for policy 0, policy_version 140 (0.0007) +[2023-10-08 11:46:55,587][102898] Updated weights for policy 1, policy_version 150 (0.0008) +[2023-10-08 11:46:55,613][102897] Updated weights for policy 0, policy_version 150 (0.0009) +[2023-10-08 11:46:55,946][102898] Updated weights for policy 1, policy_version 160 (0.0008) +[2023-10-08 11:46:55,989][102897] Updated weights for policy 0, policy_version 160 (0.0007) +[2023-10-08 11:46:56,875][101941] Fps is (10 sec: 19660.4, 60 sec: 11806.8, 300 sec: 11806.8). Total num frames: 327680. Throughput: 0: 1528.0, 1: 1521.8. Samples: 84642. Policy #0 lag: (min: 31.0, avg: 31.1, max: 36.0) +[2023-10-08 11:46:56,876][101941] Avg episode reward: [(0, '4.050'), (1, '3.530')] +[2023-10-08 11:46:56,877][102634] Saving new best policy, reward=4.050! +[2023-10-08 11:46:56,878][102760] Saving new best policy, reward=3.530! +[2023-10-08 11:46:59,637][102898] Updated weights for policy 1, policy_version 170 (0.0007) +[2023-10-08 11:46:59,878][102897] Updated weights for policy 0, policy_version 170 (0.0007) +[2023-10-08 11:46:59,989][102898] Updated weights for policy 1, policy_version 180 (0.0009) +[2023-10-08 11:47:00,241][102897] Updated weights for policy 0, policy_version 180 (0.0007) +[2023-10-08 11:47:00,354][102898] Updated weights for policy 1, policy_version 190 (0.0009) +[2023-10-08 11:47:00,605][102897] Updated weights for policy 0, policy_version 190 (0.0010) +[2023-10-08 11:47:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 12005.4, 300 sec: 12005.4). Total num frames: 393216. Throughput: 0: 1616.4, 1: 1613.8. Samples: 105800. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:47:01,875][101941] Avg episode reward: [(0, '4.080'), (1, '3.680')] +[2023-10-08 11:47:01,880][102634] Saving new best policy, reward=4.080! +[2023-10-08 11:47:01,880][102760] Saving new best policy, reward=3.680! +[2023-10-08 11:47:04,213][102898] Updated weights for policy 1, policy_version 200 (0.0008) +[2023-10-08 11:47:04,531][102897] Updated weights for policy 0, policy_version 200 (0.0007) +[2023-10-08 11:47:04,584][102898] Updated weights for policy 1, policy_version 210 (0.0008) +[2023-10-08 11:47:04,903][102897] Updated weights for policy 0, policy_version 210 (0.0008) +[2023-10-08 11:47:04,954][102898] Updated weights for policy 1, policy_version 220 (0.0008) +[2023-10-08 11:47:05,279][102897] Updated weights for policy 0, policy_version 220 (0.0008) +[2023-10-08 11:47:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 12151.3, 300 sec: 12151.3). Total num frames: 458752. Throughput: 0: 1562.8, 1: 1546.9. Samples: 117404. Policy #0 lag: (min: 31.0, avg: 39.9, max: 63.0) +[2023-10-08 11:47:06,876][101941] Avg episode reward: [(0, '4.200'), (1, '3.710')] +[2023-10-08 11:47:06,877][102760] Saving new best policy, reward=3.710! +[2023-10-08 11:47:06,877][102634] Saving new best policy, reward=4.200! +[2023-10-08 11:47:08,741][102898] Updated weights for policy 1, policy_version 230 (0.0008) +[2023-10-08 11:47:09,081][102897] Updated weights for policy 0, policy_version 230 (0.0008) +[2023-10-08 11:47:09,118][102898] Updated weights for policy 1, policy_version 240 (0.0008) +[2023-10-08 11:47:09,446][102897] Updated weights for policy 0, policy_version 240 (0.0007) +[2023-10-08 11:47:09,480][102898] Updated weights for policy 1, policy_version 250 (0.0008) +[2023-10-08 11:47:09,808][102897] Updated weights for policy 0, policy_version 250 (0.0008) +[2023-10-08 11:47:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 12263.0, 300 sec: 12263.0). Total num frames: 524288. Throughput: 0: 1610.4, 1: 1613.8. Samples: 137846. Policy #0 lag: (min: 4.0, avg: 20.0, max: 36.0) +[2023-10-08 11:47:11,876][101941] Avg episode reward: [(0, '4.540'), (1, '4.540')] +[2023-10-08 11:47:11,877][102634] Saving new best policy, reward=4.540! +[2023-10-08 11:47:11,878][102760] Saving new best policy, reward=4.540! +[2023-10-08 11:47:13,209][102898] Updated weights for policy 1, policy_version 260 (0.0008) +[2023-10-08 11:47:13,415][102897] Updated weights for policy 0, policy_version 260 (0.0009) +[2023-10-08 11:47:13,570][102898] Updated weights for policy 1, policy_version 270 (0.0007) +[2023-10-08 11:47:13,781][102897] Updated weights for policy 0, policy_version 270 (0.0007) +[2023-10-08 11:47:13,938][102898] Updated weights for policy 1, policy_version 280 (0.0007) +[2023-10-08 11:47:14,155][102897] Updated weights for policy 0, policy_version 280 (0.0007) +[2023-10-08 11:47:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 12351.5, 300 sec: 12351.5). Total num frames: 589824. Throughput: 0: 1743.9, 1: 1746.1. Samples: 160422. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:47:16,875][101941] Avg episode reward: [(0, '4.670'), (1, '5.100')] +[2023-10-08 11:47:16,881][102634] Saving new best policy, reward=4.670! +[2023-10-08 11:47:16,882][102760] Saving new best policy, reward=5.100! +[2023-10-08 11:47:17,668][102898] Updated weights for policy 1, policy_version 290 (0.0008) +[2023-10-08 11:47:17,973][102897] Updated weights for policy 0, policy_version 290 (0.0009) +[2023-10-08 11:47:18,030][102898] Updated weights for policy 1, policy_version 300 (0.0009) +[2023-10-08 11:47:18,378][102897] Updated weights for policy 0, policy_version 300 (0.0007) +[2023-10-08 11:47:18,390][102898] Updated weights for policy 1, policy_version 310 (0.0008) +[2023-10-08 11:47:18,746][102897] Updated weights for policy 0, policy_version 310 (0.0008) +[2023-10-08 11:47:18,754][102898] Updated weights for policy 1, policy_version 320 (0.0007) +[2023-10-08 11:47:19,119][102897] Updated weights for policy 0, policy_version 320 (0.0009) +[2023-10-08 11:47:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 12423.1, 300 sec: 12423.1). Total num frames: 655360. Throughput: 0: 1710.1, 1: 1716.1. Samples: 170026. Policy #0 lag: (min: 31.0, avg: 39.9, max: 63.0) +[2023-10-08 11:47:21,875][101941] Avg episode reward: [(0, '4.750'), (1, '5.340')] +[2023-10-08 11:47:21,876][102634] Saving new best policy, reward=4.750! +[2023-10-08 11:47:21,876][102760] Saving new best policy, reward=5.340! +[2023-10-08 11:47:22,667][102898] Updated weights for policy 1, policy_version 330 (0.0007) +[2023-10-08 11:47:22,852][102897] Updated weights for policy 0, policy_version 330 (0.0007) +[2023-10-08 11:47:23,030][102898] Updated weights for policy 1, policy_version 340 (0.0007) +[2023-10-08 11:47:23,216][102897] Updated weights for policy 0, policy_version 340 (0.0009) +[2023-10-08 11:47:23,405][102898] Updated weights for policy 1, policy_version 350 (0.0007) +[2023-10-08 11:47:23,597][102897] Updated weights for policy 0, policy_version 350 (0.0008) +[2023-10-08 11:47:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 12482.3, 300 sec: 12482.3). Total num frames: 720896. Throughput: 0: 1755.2, 1: 1767.6. Samples: 191704. Policy #0 lag: (min: 26.0, avg: 33.9, max: 58.0) +[2023-10-08 11:47:26,876][101941] Avg episode reward: [(0, '5.070'), (1, '4.520')] +[2023-10-08 11:47:26,877][102634] Saving new best policy, reward=5.070! +[2023-10-08 11:47:27,351][102898] Updated weights for policy 1, policy_version 360 (0.0007) +[2023-10-08 11:47:27,521][102897] Updated weights for policy 0, policy_version 360 (0.0007) +[2023-10-08 11:47:27,727][102898] Updated weights for policy 1, policy_version 370 (0.0008) +[2023-10-08 11:47:27,896][102897] Updated weights for policy 0, policy_version 370 (0.0008) +[2023-10-08 11:47:28,092][102898] Updated weights for policy 1, policy_version 380 (0.0007) +[2023-10-08 11:47:28,266][102897] Updated weights for policy 0, policy_version 380 (0.0008) +[2023-10-08 11:47:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 12532.1). Total num frames: 786432. Throughput: 0: 1775.1, 1: 1782.2. Samples: 213640. Policy #0 lag: (min: 31.0, avg: 35.0, max: 63.0) +[2023-10-08 11:47:31,876][101941] Avg episode reward: [(0, '4.730'), (1, '3.950')] +[2023-10-08 11:47:31,923][102898] Updated weights for policy 1, policy_version 390 (0.0008) +[2023-10-08 11:47:32,020][102897] Updated weights for policy 0, policy_version 390 (0.0009) +[2023-10-08 11:47:32,285][102898] Updated weights for policy 1, policy_version 400 (0.0007) +[2023-10-08 11:47:32,382][102897] Updated weights for policy 0, policy_version 400 (0.0008) +[2023-10-08 11:47:32,654][102898] Updated weights for policy 1, policy_version 410 (0.0009) +[2023-10-08 11:47:32,747][102897] Updated weights for policy 0, policy_version 410 (0.0007) +[2023-10-08 11:47:36,474][102898] Updated weights for policy 1, policy_version 420 (0.0007) +[2023-10-08 11:47:36,541][102897] Updated weights for policy 0, policy_version 420 (0.0007) +[2023-10-08 11:47:36,833][102898] Updated weights for policy 1, policy_version 430 (0.0007) +[2023-10-08 11:47:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 12574.5). Total num frames: 851968. Throughput: 0: 1767.5, 1: 1768.8. Samples: 223448. Policy #0 lag: (min: 22.0, avg: 22.1, max: 28.0) +[2023-10-08 11:47:36,876][101941] Avg episode reward: [(0, '4.030'), (1, '3.780')] +[2023-10-08 11:47:36,912][102897] Updated weights for policy 0, policy_version 430 (0.0008) +[2023-10-08 11:47:37,199][102898] Updated weights for policy 1, policy_version 440 (0.0008) +[2023-10-08 11:47:37,277][102897] Updated weights for policy 0, policy_version 440 (0.0008) +[2023-10-08 11:47:40,860][102898] Updated weights for policy 1, policy_version 450 (0.0010) +[2023-10-08 11:47:41,160][102897] Updated weights for policy 0, policy_version 450 (0.0007) +[2023-10-08 11:47:41,238][102898] Updated weights for policy 1, policy_version 460 (0.0009) +[2023-10-08 11:47:41,533][102897] Updated weights for policy 0, policy_version 460 (0.0008) +[2023-10-08 11:47:41,597][102898] Updated weights for policy 1, policy_version 470 (0.0008) +[2023-10-08 11:47:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 12611.1). Total num frames: 917504. Throughput: 0: 1783.0, 1: 1794.7. Samples: 245636. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 11:47:41,876][101941] Avg episode reward: [(0, '4.050'), (1, '4.130')] +[2023-10-08 11:47:41,910][102897] Updated weights for policy 0, policy_version 470 (0.0008) +[2023-10-08 11:47:41,959][102898] Updated weights for policy 1, policy_version 480 (0.0007) +[2023-10-08 11:47:42,270][102897] Updated weights for policy 0, policy_version 480 (0.0008) +[2023-10-08 11:47:45,825][102898] Updated weights for policy 1, policy_version 490 (0.0008) +[2023-10-08 11:47:45,947][102897] Updated weights for policy 0, policy_version 490 (0.0008) +[2023-10-08 11:47:46,188][102898] Updated weights for policy 1, policy_version 500 (0.0007) +[2023-10-08 11:47:46,313][102897] Updated weights for policy 0, policy_version 500 (0.0008) +[2023-10-08 11:47:46,558][102898] Updated weights for policy 1, policy_version 510 (0.0008) +[2023-10-08 11:47:46,679][102897] Updated weights for policy 0, policy_version 510 (0.0008) +[2023-10-08 11:47:46,875][101941] Fps is (10 sec: 19661.2, 60 sec: 15291.7, 300 sec: 13485.9). Total num frames: 1048576. Throughput: 0: 1778.6, 1: 1781.7. Samples: 266012. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 11:47:46,875][101941] Avg episode reward: [(0, '4.220'), (1, '4.430')] +[2023-10-08 11:47:50,291][102898] Updated weights for policy 1, policy_version 520 (0.0008) +[2023-10-08 11:47:50,396][102897] Updated weights for policy 0, policy_version 520 (0.0007) +[2023-10-08 11:47:50,655][102898] Updated weights for policy 1, policy_version 530 (0.0007) +[2023-10-08 11:47:50,761][102897] Updated weights for policy 0, policy_version 530 (0.0009) +[2023-10-08 11:47:51,019][102898] Updated weights for policy 1, policy_version 540 (0.0007) +[2023-10-08 11:47:51,121][102897] Updated weights for policy 0, policy_version 540 (0.0007) +[2023-10-08 11:47:51,875][101941] Fps is (10 sec: 19661.3, 60 sec: 14199.5, 300 sec: 13463.1). Total num frames: 1114112. Throughput: 0: 1776.6, 1: 1791.9. Samples: 277984. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:47:51,876][101941] Avg episode reward: [(0, '4.460'), (1, '4.950')] +[2023-10-08 11:47:54,848][102898] Updated weights for policy 1, policy_version 550 (0.0008) +[2023-10-08 11:47:54,967][102897] Updated weights for policy 0, policy_version 550 (0.0007) +[2023-10-08 11:47:55,218][102898] Updated weights for policy 1, policy_version 560 (0.0007) +[2023-10-08 11:47:55,333][102897] Updated weights for policy 0, policy_version 560 (0.0007) +[2023-10-08 11:47:55,582][102898] Updated weights for policy 1, policy_version 570 (0.0009) +[2023-10-08 11:47:55,697][102897] Updated weights for policy 0, policy_version 570 (0.0008) +[2023-10-08 11:47:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13442.8). Total num frames: 1179648. Throughput: 0: 1787.3, 1: 1784.4. Samples: 298570. Policy #0 lag: (min: 31.0, avg: 32.9, max: 60.0) +[2023-10-08 11:47:56,876][101941] Avg episode reward: [(0, '4.490'), (1, '4.230')] +[2023-10-08 11:47:59,469][102897] Updated weights for policy 0, policy_version 580 (0.0009) +[2023-10-08 11:47:59,480][102898] Updated weights for policy 1, policy_version 580 (0.0007) +[2023-10-08 11:47:59,833][102897] Updated weights for policy 0, policy_version 590 (0.0008) +[2023-10-08 11:47:59,846][102898] Updated weights for policy 1, policy_version 590 (0.0007) +[2023-10-08 11:48:00,207][102897] Updated weights for policy 0, policy_version 600 (0.0010) +[2023-10-08 11:48:00,220][102898] Updated weights for policy 1, policy_version 600 (0.0009) +[2023-10-08 11:48:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13424.7). Total num frames: 1245184. Throughput: 0: 1770.2, 1: 1765.9. Samples: 319546. Policy #0 lag: (min: 17.0, avg: 22.9, max: 49.0) +[2023-10-08 11:48:01,875][101941] Avg episode reward: [(0, '4.470'), (1, '4.460')] +[2023-10-08 11:48:04,003][102897] Updated weights for policy 0, policy_version 610 (0.0008) +[2023-10-08 11:48:04,022][102898] Updated weights for policy 1, policy_version 610 (0.0008) +[2023-10-08 11:48:04,395][102898] Updated weights for policy 1, policy_version 620 (0.0007) +[2023-10-08 11:48:04,399][102897] Updated weights for policy 0, policy_version 620 (0.0008) +[2023-10-08 11:48:04,766][102897] Updated weights for policy 0, policy_version 630 (0.0008) +[2023-10-08 11:48:04,767][102898] Updated weights for policy 1, policy_version 630 (0.0009) +[2023-10-08 11:48:05,129][102898] Updated weights for policy 1, policy_version 640 (0.0007) +[2023-10-08 11:48:05,143][102897] Updated weights for policy 0, policy_version 640 (0.0008) +[2023-10-08 11:48:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13408.4). Total num frames: 1310720. Throughput: 0: 1795.7, 1: 1784.2. Samples: 331122. Policy #0 lag: (min: 28.0, avg: 29.6, max: 55.0) +[2023-10-08 11:48:06,876][101941] Avg episode reward: [(0, '4.450'), (1, '4.330')] +[2023-10-08 11:48:08,611][102897] Updated weights for policy 0, policy_version 650 (0.0008) +[2023-10-08 11:48:08,885][102898] Updated weights for policy 1, policy_version 650 (0.0007) +[2023-10-08 11:48:08,986][102897] Updated weights for policy 0, policy_version 660 (0.0008) +[2023-10-08 11:48:09,245][102898] Updated weights for policy 1, policy_version 660 (0.0007) +[2023-10-08 11:48:09,367][102897] Updated weights for policy 0, policy_version 670 (0.0007) +[2023-10-08 11:48:09,608][102898] Updated weights for policy 1, policy_version 670 (0.0009) +[2023-10-08 11:48:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13393.8). Total num frames: 1376256. Throughput: 0: 1791.4, 1: 1768.1. Samples: 351884. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:48:11,875][101941] Avg episode reward: [(0, '4.140'), (1, '4.260')] +[2023-10-08 11:48:13,242][102897] Updated weights for policy 0, policy_version 680 (0.0010) +[2023-10-08 11:48:13,410][102898] Updated weights for policy 1, policy_version 680 (0.0008) +[2023-10-08 11:48:13,605][102897] Updated weights for policy 0, policy_version 690 (0.0007) +[2023-10-08 11:48:13,784][102898] Updated weights for policy 1, policy_version 690 (0.0008) +[2023-10-08 11:48:13,981][102897] Updated weights for policy 0, policy_version 700 (0.0008) +[2023-10-08 11:48:14,158][102898] Updated weights for policy 1, policy_version 700 (0.0008) +[2023-10-08 11:48:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13380.5). Total num frames: 1441792. Throughput: 0: 1792.3, 1: 1776.4. Samples: 374234. Policy #0 lag: (min: 15.0, avg: 25.1, max: 47.0) +[2023-10-08 11:48:16,876][101941] Avg episode reward: [(0, '4.050'), (1, '4.620')] +[2023-10-08 11:48:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000000704_720896.pth... +[2023-10-08 11:48:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000000704_720896.pth... +[2023-10-08 11:48:17,730][102897] Updated weights for policy 0, policy_version 710 (0.0007) +[2023-10-08 11:48:17,962][102898] Updated weights for policy 1, policy_version 710 (0.0007) +[2023-10-08 11:48:18,094][102897] Updated weights for policy 0, policy_version 720 (0.0007) +[2023-10-08 11:48:18,326][102898] Updated weights for policy 1, policy_version 720 (0.0007) +[2023-10-08 11:48:18,464][102897] Updated weights for policy 0, policy_version 730 (0.0007) +[2023-10-08 11:48:18,694][102898] Updated weights for policy 1, policy_version 730 (0.0007) +[2023-10-08 11:48:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13368.4). Total num frames: 1507328. Throughput: 0: 1789.4, 1: 1775.0. Samples: 383848. Policy #0 lag: (min: 4.0, avg: 11.5, max: 36.0) +[2023-10-08 11:48:21,876][101941] Avg episode reward: [(0, '4.350'), (1, '4.110')] +[2023-10-08 11:48:22,216][102897] Updated weights for policy 0, policy_version 740 (0.0008) +[2023-10-08 11:48:22,591][102897] Updated weights for policy 0, policy_version 750 (0.0009) +[2023-10-08 11:48:22,592][102898] Updated weights for policy 1, policy_version 740 (0.0008) +[2023-10-08 11:48:22,950][102898] Updated weights for policy 1, policy_version 750 (0.0007) +[2023-10-08 11:48:22,954][102897] Updated weights for policy 0, policy_version 760 (0.0007) +[2023-10-08 11:48:23,325][102898] Updated weights for policy 1, policy_version 760 (0.0007) +[2023-10-08 11:48:26,689][102897] Updated weights for policy 0, policy_version 770 (0.0008) +[2023-10-08 11:48:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 13357.3). Total num frames: 1572864. Throughput: 0: 1788.5, 1: 1772.2. Samples: 405868. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:48:26,876][101941] Avg episode reward: [(0, '4.110'), (1, '4.090')] +[2023-10-08 11:48:26,999][102898] Updated weights for policy 1, policy_version 770 (0.0008) +[2023-10-08 11:48:27,061][102897] Updated weights for policy 0, policy_version 780 (0.0009) +[2023-10-08 11:48:27,362][102898] Updated weights for policy 1, policy_version 780 (0.0008) +[2023-10-08 11:48:27,440][102897] Updated weights for policy 0, policy_version 790 (0.0007) +[2023-10-08 11:48:27,730][102898] Updated weights for policy 1, policy_version 790 (0.0008) +[2023-10-08 11:48:27,806][102897] Updated weights for policy 0, policy_version 800 (0.0007) +[2023-10-08 11:48:28,096][102898] Updated weights for policy 1, policy_version 800 (0.0008) +[2023-10-08 11:48:31,643][102897] Updated weights for policy 0, policy_version 810 (0.0009) +[2023-10-08 11:48:31,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13347.1). Total num frames: 1638400. Throughput: 0: 1801.5, 1: 1797.3. Samples: 427962. Policy #0 lag: (min: 15.0, avg: 21.3, max: 47.0) +[2023-10-08 11:48:31,876][101941] Avg episode reward: [(0, '4.110'), (1, '4.190')] +[2023-10-08 11:48:31,939][102898] Updated weights for policy 1, policy_version 810 (0.0009) +[2023-10-08 11:48:32,019][102897] Updated weights for policy 0, policy_version 820 (0.0007) +[2023-10-08 11:48:32,299][102898] Updated weights for policy 1, policy_version 820 (0.0007) +[2023-10-08 11:48:32,381][102897] Updated weights for policy 0, policy_version 830 (0.0007) +[2023-10-08 11:48:32,671][102898] Updated weights for policy 1, policy_version 830 (0.0007) +[2023-10-08 11:48:36,268][102897] Updated weights for policy 0, policy_version 840 (0.0008) +[2023-10-08 11:48:36,487][102898] Updated weights for policy 1, policy_version 840 (0.0008) +[2023-10-08 11:48:36,639][102897] Updated weights for policy 0, policy_version 850 (0.0007) +[2023-10-08 11:48:36,858][102898] Updated weights for policy 1, policy_version 850 (0.0007) +[2023-10-08 11:48:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13337.7). Total num frames: 1703936. Throughput: 0: 1776.5, 1: 1771.3. Samples: 437636. Policy #0 lag: (min: 12.0, avg: 20.9, max: 44.0) +[2023-10-08 11:48:36,876][101941] Avg episode reward: [(0, '3.910'), (1, '4.540')] +[2023-10-08 11:48:36,993][102897] Updated weights for policy 0, policy_version 860 (0.0008) +[2023-10-08 11:48:37,222][102898] Updated weights for policy 1, policy_version 860 (0.0007) +[2023-10-08 11:48:40,720][102897] Updated weights for policy 0, policy_version 870 (0.0007) +[2023-10-08 11:48:41,094][102897] Updated weights for policy 0, policy_version 880 (0.0008) +[2023-10-08 11:48:41,098][102898] Updated weights for policy 1, policy_version 870 (0.0007) +[2023-10-08 11:48:41,457][102897] Updated weights for policy 0, policy_version 890 (0.0009) +[2023-10-08 11:48:41,465][102898] Updated weights for policy 1, policy_version 880 (0.0007) +[2023-10-08 11:48:41,836][102898] Updated weights for policy 1, policy_version 890 (0.0007) +[2023-10-08 11:48:41,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 13575.9). Total num frames: 1802240. Throughput: 0: 1795.6, 1: 1784.3. Samples: 459662. Policy #0 lag: (min: 16.0, avg: 38.5, max: 48.0) +[2023-10-08 11:48:41,876][101941] Avg episode reward: [(0, '4.280'), (1, '4.870')] +[2023-10-08 11:48:45,345][102897] Updated weights for policy 0, policy_version 900 (0.0009) +[2023-10-08 11:48:45,641][102898] Updated weights for policy 1, policy_version 900 (0.0008) +[2023-10-08 11:48:45,716][102897] Updated weights for policy 0, policy_version 910 (0.0007) +[2023-10-08 11:48:46,004][102898] Updated weights for policy 1, policy_version 910 (0.0008) +[2023-10-08 11:48:46,075][102897] Updated weights for policy 0, policy_version 920 (0.0009) +[2023-10-08 11:48:46,367][102898] Updated weights for policy 1, policy_version 920 (0.0009) +[2023-10-08 11:48:46,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14199.4, 300 sec: 13796.7). Total num frames: 1900544. Throughput: 0: 1779.3, 1: 1773.3. Samples: 479414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:48:46,876][101941] Avg episode reward: [(0, '4.550'), (1, '5.470')] +[2023-10-08 11:48:46,884][102760] Saving new best policy, reward=5.470! +[2023-10-08 11:48:49,902][102897] Updated weights for policy 0, policy_version 930 (0.0008) +[2023-10-08 11:48:50,147][102898] Updated weights for policy 1, policy_version 930 (0.0010) +[2023-10-08 11:48:50,297][102897] Updated weights for policy 0, policy_version 940 (0.0008) +[2023-10-08 11:48:50,516][102898] Updated weights for policy 1, policy_version 940 (0.0008) +[2023-10-08 11:48:50,657][102897] Updated weights for policy 0, policy_version 950 (0.0011) +[2023-10-08 11:48:50,876][102898] Updated weights for policy 1, policy_version 950 (0.0009) +[2023-10-08 11:48:51,029][102897] Updated weights for policy 0, policy_version 960 (0.0009) +[2023-10-08 11:48:51,248][102898] Updated weights for policy 1, policy_version 960 (0.0010) +[2023-10-08 11:48:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 13772.6). Total num frames: 1966080. Throughput: 0: 1784.6, 1: 1778.7. Samples: 491470. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 11:48:51,876][101941] Avg episode reward: [(0, '4.890'), (1, '5.710')] +[2023-10-08 11:48:51,877][102760] Saving new best policy, reward=5.710! +[2023-10-08 11:48:54,748][102897] Updated weights for policy 0, policy_version 970 (0.0009) +[2023-10-08 11:48:54,910][102898] Updated weights for policy 1, policy_version 970 (0.0008) +[2023-10-08 11:48:55,119][102897] Updated weights for policy 0, policy_version 980 (0.0008) +[2023-10-08 11:48:55,274][102898] Updated weights for policy 1, policy_version 980 (0.0008) +[2023-10-08 11:48:55,496][102897] Updated weights for policy 0, policy_version 990 (0.0009) +[2023-10-08 11:48:55,638][102898] Updated weights for policy 1, policy_version 990 (0.0008) +[2023-10-08 11:48:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13750.0). Total num frames: 2031616. Throughput: 0: 1772.6, 1: 1779.9. Samples: 511746. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 11:48:56,876][101941] Avg episode reward: [(0, '4.860'), (1, '5.080')] +[2023-10-08 11:48:59,332][102897] Updated weights for policy 0, policy_version 1000 (0.0010) +[2023-10-08 11:48:59,344][102898] Updated weights for policy 1, policy_version 1000 (0.0007) +[2023-10-08 11:48:59,705][102897] Updated weights for policy 0, policy_version 1010 (0.0009) +[2023-10-08 11:48:59,713][102898] Updated weights for policy 1, policy_version 1010 (0.0009) +[2023-10-08 11:49:00,070][102897] Updated weights for policy 0, policy_version 1020 (0.0008) +[2023-10-08 11:49:00,076][102898] Updated weights for policy 1, policy_version 1020 (0.0009) +[2023-10-08 11:49:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 13729.0). Total num frames: 2097152. Throughput: 0: 1762.1, 1: 1775.3. Samples: 533416. Policy #0 lag: (min: 13.0, avg: 13.8, max: 32.0) +[2023-10-08 11:49:01,876][101941] Avg episode reward: [(0, '4.700'), (1, '4.800')] +[2023-10-08 11:49:03,735][102897] Updated weights for policy 0, policy_version 1030 (0.0007) +[2023-10-08 11:49:03,807][102898] Updated weights for policy 1, policy_version 1030 (0.0009) +[2023-10-08 11:49:04,099][102897] Updated weights for policy 0, policy_version 1040 (0.0008) +[2023-10-08 11:49:04,174][102898] Updated weights for policy 1, policy_version 1040 (0.0010) +[2023-10-08 11:49:04,471][102897] Updated weights for policy 0, policy_version 1050 (0.0008) +[2023-10-08 11:49:04,543][102898] Updated weights for policy 1, policy_version 1050 (0.0007) +[2023-10-08 11:49:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13709.3). Total num frames: 2162688. Throughput: 0: 1778.7, 1: 1785.5. Samples: 544236. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 11:49:06,876][101941] Avg episode reward: [(0, '4.720'), (1, '5.150')] +[2023-10-08 11:49:08,166][102897] Updated weights for policy 0, policy_version 1060 (0.0008) +[2023-10-08 11:49:08,380][102898] Updated weights for policy 1, policy_version 1060 (0.0009) +[2023-10-08 11:49:08,540][102897] Updated weights for policy 0, policy_version 1070 (0.0008) +[2023-10-08 11:49:08,752][102898] Updated weights for policy 1, policy_version 1070 (0.0009) +[2023-10-08 11:49:08,901][102897] Updated weights for policy 0, policy_version 1080 (0.0009) +[2023-10-08 11:49:09,115][102898] Updated weights for policy 1, policy_version 1080 (0.0007) +[2023-10-08 11:49:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 13690.8). Total num frames: 2228224. Throughput: 0: 1773.7, 1: 1775.9. Samples: 565598. Policy #0 lag: (min: 31.0, avg: 38.9, max: 63.0) +[2023-10-08 11:49:11,876][101941] Avg episode reward: [(0, '4.500'), (1, '5.340')] +[2023-10-08 11:49:12,939][102897] Updated weights for policy 0, policy_version 1090 (0.0008) +[2023-10-08 11:49:13,020][102898] Updated weights for policy 1, policy_version 1090 (0.0007) +[2023-10-08 11:49:13,303][102897] Updated weights for policy 0, policy_version 1100 (0.0007) +[2023-10-08 11:49:13,386][102898] Updated weights for policy 1, policy_version 1100 (0.0007) +[2023-10-08 11:49:13,676][102897] Updated weights for policy 0, policy_version 1110 (0.0007) +[2023-10-08 11:49:13,747][102898] Updated weights for policy 1, policy_version 1110 (0.0008) +[2023-10-08 11:49:14,038][102897] Updated weights for policy 0, policy_version 1120 (0.0008) +[2023-10-08 11:49:14,107][102898] Updated weights for policy 1, policy_version 1120 (0.0009) +[2023-10-08 11:49:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13673.4). Total num frames: 2293760. Throughput: 0: 1777.5, 1: 1772.5. Samples: 587710. Policy #0 lag: (min: 6.0, avg: 13.8, max: 38.0) +[2023-10-08 11:49:16,875][101941] Avg episode reward: [(0, '4.550'), (1, '5.070')] +[2023-10-08 11:49:17,862][102897] Updated weights for policy 0, policy_version 1130 (0.0009) +[2023-10-08 11:49:17,907][102898] Updated weights for policy 1, policy_version 1130 (0.0007) +[2023-10-08 11:49:18,235][102897] Updated weights for policy 0, policy_version 1140 (0.0008) +[2023-10-08 11:49:18,273][102898] Updated weights for policy 1, policy_version 1140 (0.0008) +[2023-10-08 11:49:18,615][102897] Updated weights for policy 0, policy_version 1150 (0.0007) +[2023-10-08 11:49:18,649][102898] Updated weights for policy 1, policy_version 1150 (0.0007) +[2023-10-08 11:49:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 13657.0). Total num frames: 2359296. Throughput: 0: 1776.4, 1: 1776.2. Samples: 597504. Policy #0 lag: (min: 31.0, avg: 32.5, max: 57.0) +[2023-10-08 11:49:21,876][101941] Avg episode reward: [(0, '4.450'), (1, '4.970')] +[2023-10-08 11:49:22,255][102897] Updated weights for policy 0, policy_version 1160 (0.0007) +[2023-10-08 11:49:22,402][102898] Updated weights for policy 1, policy_version 1160 (0.0007) +[2023-10-08 11:49:22,622][102897] Updated weights for policy 0, policy_version 1170 (0.0009) +[2023-10-08 11:49:22,758][102898] Updated weights for policy 1, policy_version 1170 (0.0007) +[2023-10-08 11:49:22,992][102897] Updated weights for policy 0, policy_version 1180 (0.0010) +[2023-10-08 11:49:23,129][102898] Updated weights for policy 1, policy_version 1180 (0.0008) +[2023-10-08 11:49:26,690][102897] Updated weights for policy 0, policy_version 1190 (0.0009) +[2023-10-08 11:49:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13641.6). Total num frames: 2424832. Throughput: 0: 1774.9, 1: 1778.9. Samples: 619584. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:49:26,876][101941] Avg episode reward: [(0, '4.580'), (1, '5.270')] +[2023-10-08 11:49:27,045][102898] Updated weights for policy 1, policy_version 1190 (0.0009) +[2023-10-08 11:49:27,065][102897] Updated weights for policy 0, policy_version 1200 (0.0008) +[2023-10-08 11:49:27,395][102898] Updated weights for policy 1, policy_version 1200 (0.0007) +[2023-10-08 11:49:27,434][102897] Updated weights for policy 0, policy_version 1210 (0.0008) +[2023-10-08 11:49:27,764][102898] Updated weights for policy 1, policy_version 1210 (0.0008) +[2023-10-08 11:49:31,219][102897] Updated weights for policy 0, policy_version 1220 (0.0007) +[2023-10-08 11:49:31,422][102898] Updated weights for policy 1, policy_version 1220 (0.0009) +[2023-10-08 11:49:31,579][102897] Updated weights for policy 0, policy_version 1230 (0.0008) +[2023-10-08 11:49:31,788][102898] Updated weights for policy 1, policy_version 1230 (0.0008) +[2023-10-08 11:49:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13626.9). Total num frames: 2490368. Throughput: 0: 1797.6, 1: 1801.3. Samples: 641368. Policy #0 lag: (min: 31.0, avg: 32.5, max: 50.0) +[2023-10-08 11:49:31,876][101941] Avg episode reward: [(0, '4.970'), (1, '5.170')] +[2023-10-08 11:49:31,956][102897] Updated weights for policy 0, policy_version 1240 (0.0007) +[2023-10-08 11:49:32,161][102898] Updated weights for policy 1, policy_version 1240 (0.0007) +[2023-10-08 11:49:35,736][102897] Updated weights for policy 0, policy_version 1250 (0.0008) +[2023-10-08 11:49:35,959][102898] Updated weights for policy 1, policy_version 1250 (0.0007) +[2023-10-08 11:49:36,139][102897] Updated weights for policy 0, policy_version 1260 (0.0007) +[2023-10-08 11:49:36,323][102898] Updated weights for policy 1, policy_version 1260 (0.0007) +[2023-10-08 11:49:36,512][102897] Updated weights for policy 0, policy_version 1270 (0.0007) +[2023-10-08 11:49:36,692][102898] Updated weights for policy 1, policy_version 1270 (0.0007) +[2023-10-08 11:49:36,874][102897] Updated weights for policy 0, policy_version 1280 (0.0008) +[2023-10-08 11:49:36,877][101941] Fps is (10 sec: 16381.2, 60 sec: 14745.2, 300 sec: 13787.5). Total num frames: 2588672. Throughput: 0: 1783.1, 1: 1782.2. Samples: 651914. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:49:36,877][101941] Avg episode reward: [(0, '4.730'), (1, '5.380')] +[2023-10-08 11:49:37,055][102898] Updated weights for policy 1, policy_version 1280 (0.0008) +[2023-10-08 11:49:40,675][102897] Updated weights for policy 0, policy_version 1290 (0.0008) +[2023-10-08 11:49:40,842][102898] Updated weights for policy 1, policy_version 1290 (0.0007) +[2023-10-08 11:49:41,049][102897] Updated weights for policy 0, policy_version 1300 (0.0009) +[2023-10-08 11:49:41,208][102898] Updated weights for policy 1, policy_version 1300 (0.0007) +[2023-10-08 11:49:41,420][102897] Updated weights for policy 0, policy_version 1310 (0.0009) +[2023-10-08 11:49:41,580][102898] Updated weights for policy 1, policy_version 1310 (0.0007) +[2023-10-08 11:49:41,875][101941] Fps is (10 sec: 19661.1, 60 sec: 14745.6, 300 sec: 13940.0). Total num frames: 2686976. Throughput: 0: 1802.2, 1: 1802.7. Samples: 673966. Policy #0 lag: (min: 26.0, avg: 32.2, max: 58.0) +[2023-10-08 11:49:41,876][101941] Avg episode reward: [(0, '5.280'), (1, '5.350')] +[2023-10-08 11:49:41,877][102634] Saving new best policy, reward=5.280! +[2023-10-08 11:49:45,394][102897] Updated weights for policy 0, policy_version 1320 (0.0007) +[2023-10-08 11:49:45,479][102898] Updated weights for policy 1, policy_version 1320 (0.0008) +[2023-10-08 11:49:45,760][102897] Updated weights for policy 0, policy_version 1330 (0.0007) +[2023-10-08 11:49:45,859][102898] Updated weights for policy 1, policy_version 1330 (0.0010) +[2023-10-08 11:49:46,136][102897] Updated weights for policy 0, policy_version 1340 (0.0008) +[2023-10-08 11:49:46,226][102898] Updated weights for policy 1, policy_version 1340 (0.0007) +[2023-10-08 11:49:46,875][101941] Fps is (10 sec: 16386.5, 60 sec: 14199.4, 300 sec: 13918.9). Total num frames: 2752512. Throughput: 0: 1783.8, 1: 1769.1. Samples: 693294. Policy #0 lag: (min: 28.0, avg: 41.3, max: 60.0) +[2023-10-08 11:49:46,876][101941] Avg episode reward: [(0, '5.340'), (1, '5.240')] +[2023-10-08 11:49:46,887][102634] Saving new best policy, reward=5.340! +[2023-10-08 11:49:49,824][102897] Updated weights for policy 0, policy_version 1350 (0.0007) +[2023-10-08 11:49:50,052][102898] Updated weights for policy 1, policy_version 1350 (0.0009) +[2023-10-08 11:49:50,197][102897] Updated weights for policy 0, policy_version 1360 (0.0007) +[2023-10-08 11:49:50,416][102898] Updated weights for policy 1, policy_version 1360 (0.0007) +[2023-10-08 11:49:50,571][102897] Updated weights for policy 0, policy_version 1370 (0.0007) +[2023-10-08 11:49:50,793][102898] Updated weights for policy 1, policy_version 1370 (0.0008) +[2023-10-08 11:49:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 13898.9). Total num frames: 2818048. Throughput: 0: 1800.3, 1: 1789.7. Samples: 705784. Policy #0 lag: (min: 10.0, avg: 13.2, max: 42.0) +[2023-10-08 11:49:51,876][101941] Avg episode reward: [(0, '5.150'), (1, '5.420')] +[2023-10-08 11:49:54,292][102897] Updated weights for policy 0, policy_version 1380 (0.0008) +[2023-10-08 11:49:54,541][102898] Updated weights for policy 1, policy_version 1380 (0.0009) +[2023-10-08 11:49:54,664][102897] Updated weights for policy 0, policy_version 1390 (0.0009) +[2023-10-08 11:49:54,914][102898] Updated weights for policy 1, policy_version 1390 (0.0008) +[2023-10-08 11:49:55,034][102897] Updated weights for policy 0, policy_version 1400 (0.0008) +[2023-10-08 11:49:55,281][102898] Updated weights for policy 1, policy_version 1400 (0.0007) +[2023-10-08 11:49:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13879.8). Total num frames: 2883584. Throughput: 0: 1777.2, 1: 1773.9. Samples: 725396. Policy #0 lag: (min: 10.0, avg: 19.9, max: 42.0) +[2023-10-08 11:49:56,876][101941] Avg episode reward: [(0, '5.390'), (1, '5.860')] +[2023-10-08 11:49:56,878][102634] Saving new best policy, reward=5.390! +[2023-10-08 11:49:56,878][102760] Saving new best policy, reward=5.860! +[2023-10-08 11:49:58,576][102897] Updated weights for policy 0, policy_version 1410 (0.0009) +[2023-10-08 11:49:58,959][102897] Updated weights for policy 0, policy_version 1420 (0.0008) +[2023-10-08 11:49:59,066][102898] Updated weights for policy 1, policy_version 1410 (0.0011) +[2023-10-08 11:49:59,323][102897] Updated weights for policy 0, policy_version 1430 (0.0008) +[2023-10-08 11:49:59,440][102898] Updated weights for policy 1, policy_version 1420 (0.0007) +[2023-10-08 11:49:59,684][102897] Updated weights for policy 0, policy_version 1440 (0.0008) +[2023-10-08 11:49:59,816][102898] Updated weights for policy 1, policy_version 1430 (0.0008) +[2023-10-08 11:50:00,184][102898] Updated weights for policy 1, policy_version 1440 (0.0008) +[2023-10-08 11:50:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 13861.7). Total num frames: 2949120. Throughput: 0: 1778.7, 1: 1772.0. Samples: 747492. Policy #0 lag: (min: 15.0, avg: 17.8, max: 47.0) +[2023-10-08 11:50:01,875][101941] Avg episode reward: [(0, '5.180'), (1, '6.390')] +[2023-10-08 11:50:01,884][102760] Saving new best policy, reward=6.390! +[2023-10-08 11:50:03,468][102897] Updated weights for policy 0, policy_version 1450 (0.0010) +[2023-10-08 11:50:03,834][102897] Updated weights for policy 0, policy_version 1460 (0.0009) +[2023-10-08 11:50:03,928][102898] Updated weights for policy 1, policy_version 1450 (0.0007) +[2023-10-08 11:50:04,210][102897] Updated weights for policy 0, policy_version 1470 (0.0008) +[2023-10-08 11:50:04,301][102898] Updated weights for policy 1, policy_version 1460 (0.0008) +[2023-10-08 11:50:04,668][102898] Updated weights for policy 1, policy_version 1470 (0.0008) +[2023-10-08 11:50:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13844.4). Total num frames: 3014656. Throughput: 0: 1780.4, 1: 1778.0. Samples: 757632. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:50:06,876][101941] Avg episode reward: [(0, '4.510'), (1, '5.760')] +[2023-10-08 11:50:08,046][102897] Updated weights for policy 0, policy_version 1480 (0.0009) +[2023-10-08 11:50:08,425][102897] Updated weights for policy 0, policy_version 1490 (0.0008) +[2023-10-08 11:50:08,561][102898] Updated weights for policy 1, policy_version 1480 (0.0008) +[2023-10-08 11:50:08,787][102897] Updated weights for policy 0, policy_version 1500 (0.0008) +[2023-10-08 11:50:08,923][102898] Updated weights for policy 1, policy_version 1490 (0.0008) +[2023-10-08 11:50:09,302][102898] Updated weights for policy 1, policy_version 1500 (0.0009) +[2023-10-08 11:50:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13827.8). Total num frames: 3080192. Throughput: 0: 1780.1, 1: 1771.4. Samples: 779402. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 11:50:11,875][101941] Avg episode reward: [(0, '4.400'), (1, '5.100')] +[2023-10-08 11:50:12,646][102897] Updated weights for policy 0, policy_version 1510 (0.0007) +[2023-10-08 11:50:13,002][102898] Updated weights for policy 1, policy_version 1510 (0.0007) +[2023-10-08 11:50:13,018][102897] Updated weights for policy 0, policy_version 1520 (0.0007) +[2023-10-08 11:50:13,378][102898] Updated weights for policy 1, policy_version 1520 (0.0007) +[2023-10-08 11:50:13,394][102897] Updated weights for policy 0, policy_version 1530 (0.0007) +[2023-10-08 11:50:13,740][102898] Updated weights for policy 1, policy_version 1530 (0.0007) +[2023-10-08 11:50:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13812.0). Total num frames: 3145728. Throughput: 0: 1783.3, 1: 1777.9. Samples: 801622. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 11:50:16,875][101941] Avg episode reward: [(0, '4.580'), (1, '5.300')] +[2023-10-08 11:50:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000001536_1572864.pth... +[2023-10-08 11:50:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000001536_1572864.pth... +[2023-10-08 11:50:17,220][102897] Updated weights for policy 0, policy_version 1540 (0.0009) +[2023-10-08 11:50:17,406][102898] Updated weights for policy 1, policy_version 1540 (0.0008) +[2023-10-08 11:50:17,586][102897] Updated weights for policy 0, policy_version 1550 (0.0008) +[2023-10-08 11:50:17,782][102898] Updated weights for policy 1, policy_version 1550 (0.0007) +[2023-10-08 11:50:17,965][102897] Updated weights for policy 0, policy_version 1560 (0.0009) +[2023-10-08 11:50:18,151][102898] Updated weights for policy 1, policy_version 1560 (0.0009) +[2023-10-08 11:50:21,749][102897] Updated weights for policy 0, policy_version 1570 (0.0009) +[2023-10-08 11:50:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13796.9). Total num frames: 3211264. Throughput: 0: 1771.7, 1: 1773.1. Samples: 811424. Policy #0 lag: (min: 17.0, avg: 22.9, max: 49.0) +[2023-10-08 11:50:21,876][101941] Avg episode reward: [(0, '4.930'), (1, '5.990')] +[2023-10-08 11:50:21,918][102898] Updated weights for policy 1, policy_version 1570 (0.0009) +[2023-10-08 11:50:22,129][102897] Updated weights for policy 0, policy_version 1580 (0.0007) +[2023-10-08 11:50:22,276][102898] Updated weights for policy 1, policy_version 1580 (0.0008) +[2023-10-08 11:50:22,498][102897] Updated weights for policy 0, policy_version 1590 (0.0007) +[2023-10-08 11:50:22,647][102898] Updated weights for policy 1, policy_version 1590 (0.0007) +[2023-10-08 11:50:22,871][102897] Updated weights for policy 0, policy_version 1600 (0.0008) +[2023-10-08 11:50:23,028][102898] Updated weights for policy 1, policy_version 1600 (0.0007) +[2023-10-08 11:50:26,783][102898] Updated weights for policy 1, policy_version 1610 (0.0008) +[2023-10-08 11:50:26,828][102897] Updated weights for policy 0, policy_version 1610 (0.0007) +[2023-10-08 11:50:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13782.4). Total num frames: 3276800. Throughput: 0: 1775.0, 1: 1771.5. Samples: 833558. Policy #0 lag: (min: 30.0, avg: 30.8, max: 49.0) +[2023-10-08 11:50:26,876][101941] Avg episode reward: [(0, '5.430'), (1, '6.260')] +[2023-10-08 11:50:27,157][102898] Updated weights for policy 1, policy_version 1620 (0.0007) +[2023-10-08 11:50:27,204][102897] Updated weights for policy 0, policy_version 1620 (0.0009) +[2023-10-08 11:50:27,523][102898] Updated weights for policy 1, policy_version 1630 (0.0007) +[2023-10-08 11:50:27,575][102897] Updated weights for policy 0, policy_version 1630 (0.0007) +[2023-10-08 11:50:27,647][102634] Saving new best policy, reward=5.430! +[2023-10-08 11:50:31,337][102897] Updated weights for policy 0, policy_version 1640 (0.0007) +[2023-10-08 11:50:31,372][102898] Updated weights for policy 1, policy_version 1640 (0.0008) +[2023-10-08 11:50:31,718][102897] Updated weights for policy 0, policy_version 1650 (0.0008) +[2023-10-08 11:50:31,747][102898] Updated weights for policy 1, policy_version 1650 (0.0009) +[2023-10-08 11:50:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 13768.4). Total num frames: 3342336. Throughput: 0: 1793.1, 1: 1796.0. Samples: 854802. Policy #0 lag: (min: 13.0, avg: 17.5, max: 45.0) +[2023-10-08 11:50:31,876][101941] Avg episode reward: [(0, '5.230'), (1, '5.560')] +[2023-10-08 11:50:32,087][102897] Updated weights for policy 0, policy_version 1660 (0.0009) +[2023-10-08 11:50:32,117][102898] Updated weights for policy 1, policy_version 1660 (0.0008) +[2023-10-08 11:50:35,792][102897] Updated weights for policy 0, policy_version 1670 (0.0008) +[2023-10-08 11:50:35,985][102898] Updated weights for policy 1, policy_version 1670 (0.0008) +[2023-10-08 11:50:36,162][102897] Updated weights for policy 0, policy_version 1680 (0.0009) +[2023-10-08 11:50:36,351][102898] Updated weights for policy 1, policy_version 1680 (0.0007) +[2023-10-08 11:50:36,538][102897] Updated weights for policy 0, policy_version 1690 (0.0007) +[2023-10-08 11:50:36,718][102898] Updated weights for policy 1, policy_version 1690 (0.0008) +[2023-10-08 11:50:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.9, 300 sec: 13887.4). Total num frames: 3440640. Throughput: 0: 1769.4, 1: 1772.3. Samples: 865162. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 11:50:36,875][101941] Avg episode reward: [(0, '5.020'), (1, '5.230')] +[2023-10-08 11:50:40,412][102897] Updated weights for policy 0, policy_version 1700 (0.0008) +[2023-10-08 11:50:40,617][102898] Updated weights for policy 1, policy_version 1700 (0.0007) +[2023-10-08 11:50:40,787][102897] Updated weights for policy 0, policy_version 1710 (0.0009) +[2023-10-08 11:50:40,990][102898] Updated weights for policy 1, policy_version 1710 (0.0007) +[2023-10-08 11:50:41,146][102897] Updated weights for policy 0, policy_version 1720 (0.0010) +[2023-10-08 11:50:41,353][102898] Updated weights for policy 1, policy_version 1720 (0.0008) +[2023-10-08 11:50:41,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14199.5, 300 sec: 14001.6). Total num frames: 3538944. Throughput: 0: 1794.4, 1: 1797.7. Samples: 887042. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 11:50:41,876][101941] Avg episode reward: [(0, '4.950'), (1, '4.880')] +[2023-10-08 11:50:44,912][102897] Updated weights for policy 0, policy_version 1730 (0.0008) +[2023-10-08 11:50:45,152][102898] Updated weights for policy 1, policy_version 1730 (0.0008) +[2023-10-08 11:50:45,283][102897] Updated weights for policy 0, policy_version 1740 (0.0008) +[2023-10-08 11:50:45,518][102898] Updated weights for policy 1, policy_version 1740 (0.0007) +[2023-10-08 11:50:45,648][102897] Updated weights for policy 0, policy_version 1750 (0.0008) +[2023-10-08 11:50:45,882][102898] Updated weights for policy 1, policy_version 1750 (0.0008) +[2023-10-08 11:50:46,011][102897] Updated weights for policy 0, policy_version 1760 (0.0009) +[2023-10-08 11:50:46,247][102898] Updated weights for policy 1, policy_version 1760 (0.0008) +[2023-10-08 11:50:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 13984.2). Total num frames: 3604480. Throughput: 0: 1766.4, 1: 1770.7. Samples: 906662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:50:46,876][101941] Avg episode reward: [(0, '5.100'), (1, '5.240')] +[2023-10-08 11:50:49,799][102897] Updated weights for policy 0, policy_version 1770 (0.0010) +[2023-10-08 11:50:50,021][102898] Updated weights for policy 1, policy_version 1770 (0.0008) +[2023-10-08 11:50:50,169][102897] Updated weights for policy 0, policy_version 1780 (0.0008) +[2023-10-08 11:50:50,384][102898] Updated weights for policy 1, policy_version 1780 (0.0008) +[2023-10-08 11:50:50,545][102897] Updated weights for policy 0, policy_version 1790 (0.0007) +[2023-10-08 11:50:50,753][102898] Updated weights for policy 1, policy_version 1790 (0.0009) +[2023-10-08 11:50:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 13967.5). Total num frames: 3670016. Throughput: 0: 1796.1, 1: 1792.0. Samples: 919096. Policy #0 lag: (min: 8.0, avg: 35.0, max: 40.0) +[2023-10-08 11:50:51,876][101941] Avg episode reward: [(0, '5.030'), (1, '6.040')] +[2023-10-08 11:50:54,273][102897] Updated weights for policy 0, policy_version 1800 (0.0007) +[2023-10-08 11:50:54,642][102897] Updated weights for policy 0, policy_version 1810 (0.0008) +[2023-10-08 11:50:54,707][102898] Updated weights for policy 1, policy_version 1800 (0.0008) +[2023-10-08 11:50:55,009][102897] Updated weights for policy 0, policy_version 1820 (0.0007) +[2023-10-08 11:50:55,074][102898] Updated weights for policy 1, policy_version 1810 (0.0007) +[2023-10-08 11:50:55,441][102898] Updated weights for policy 1, policy_version 1820 (0.0009) +[2023-10-08 11:50:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13951.5). Total num frames: 3735552. Throughput: 0: 1762.5, 1: 1776.5. Samples: 938658. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:50:56,876][101941] Avg episode reward: [(0, '5.160'), (1, '5.940')] +[2023-10-08 11:50:58,746][102897] Updated weights for policy 0, policy_version 1830 (0.0010) +[2023-10-08 11:50:59,114][102897] Updated weights for policy 0, policy_version 1840 (0.0009) +[2023-10-08 11:50:59,222][102898] Updated weights for policy 1, policy_version 1830 (0.0007) +[2023-10-08 11:50:59,486][102897] Updated weights for policy 0, policy_version 1850 (0.0008) +[2023-10-08 11:50:59,597][102898] Updated weights for policy 1, policy_version 1840 (0.0007) +[2023-10-08 11:50:59,964][102898] Updated weights for policy 1, policy_version 1850 (0.0007) +[2023-10-08 11:51:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13936.0). Total num frames: 3801088. Throughput: 0: 1772.7, 1: 1764.7. Samples: 960806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:51:01,876][101941] Avg episode reward: [(0, '5.610'), (1, '5.600')] +[2023-10-08 11:51:01,887][102634] Saving new best policy, reward=5.610! +[2023-10-08 11:51:03,272][102897] Updated weights for policy 0, policy_version 1860 (0.0007) +[2023-10-08 11:51:03,644][102897] Updated weights for policy 0, policy_version 1870 (0.0007) +[2023-10-08 11:51:03,719][102898] Updated weights for policy 1, policy_version 1860 (0.0008) +[2023-10-08 11:51:04,015][102897] Updated weights for policy 0, policy_version 1880 (0.0008) +[2023-10-08 11:51:04,084][102898] Updated weights for policy 1, policy_version 1870 (0.0008) +[2023-10-08 11:51:04,448][102898] Updated weights for policy 1, policy_version 1880 (0.0008) +[2023-10-08 11:51:06,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 13921.1). Total num frames: 3866624. Throughput: 0: 1769.5, 1: 1771.5. Samples: 970772. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 11:51:06,876][101941] Avg episode reward: [(0, '5.690'), (1, '5.530')] +[2023-10-08 11:51:06,878][102634] Saving new best policy, reward=5.690! +[2023-10-08 11:51:07,759][102897] Updated weights for policy 0, policy_version 1890 (0.0008) +[2023-10-08 11:51:08,183][102897] Updated weights for policy 0, policy_version 1900 (0.0009) +[2023-10-08 11:51:08,306][102898] Updated weights for policy 1, policy_version 1890 (0.0007) +[2023-10-08 11:51:08,553][102897] Updated weights for policy 0, policy_version 1910 (0.0010) +[2023-10-08 11:51:08,684][102898] Updated weights for policy 1, policy_version 1900 (0.0008) +[2023-10-08 11:51:08,930][102897] Updated weights for policy 0, policy_version 1920 (0.0008) +[2023-10-08 11:51:09,056][102898] Updated weights for policy 1, policy_version 1910 (0.0008) +[2023-10-08 11:51:09,422][102898] Updated weights for policy 1, policy_version 1920 (0.0008) +[2023-10-08 11:51:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13906.7). Total num frames: 3932160. Throughput: 0: 1771.3, 1: 1759.0. Samples: 992424. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:51:11,875][101941] Avg episode reward: [(0, '5.760'), (1, '5.130')] +[2023-10-08 11:51:11,876][102634] Saving new best policy, reward=5.760! +[2023-10-08 11:51:12,505][102897] Updated weights for policy 0, policy_version 1930 (0.0007) +[2023-10-08 11:51:12,878][102897] Updated weights for policy 0, policy_version 1940 (0.0008) +[2023-10-08 11:51:13,255][102897] Updated weights for policy 0, policy_version 1950 (0.0007) +[2023-10-08 11:51:13,336][102898] Updated weights for policy 1, policy_version 1930 (0.0008) +[2023-10-08 11:51:13,695][102898] Updated weights for policy 1, policy_version 1940 (0.0009) +[2023-10-08 11:51:14,078][102898] Updated weights for policy 1, policy_version 1950 (0.0010) +[2023-10-08 11:51:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 13892.8). Total num frames: 3997696. Throughput: 0: 1785.3, 1: 1762.8. Samples: 1014468. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:51:16,876][101941] Avg episode reward: [(0, '5.350'), (1, '4.910')] +[2023-10-08 11:51:17,021][102897] Updated weights for policy 0, policy_version 1960 (0.0007) +[2023-10-08 11:51:17,398][102897] Updated weights for policy 0, policy_version 1970 (0.0007) +[2023-10-08 11:51:17,770][102897] Updated weights for policy 0, policy_version 1980 (0.0010) +[2023-10-08 11:51:18,095][102898] Updated weights for policy 1, policy_version 1960 (0.0007) +[2023-10-08 11:51:18,467][102898] Updated weights for policy 1, policy_version 1970 (0.0008) +[2023-10-08 11:51:18,833][102898] Updated weights for policy 1, policy_version 1980 (0.0009) +[2023-10-08 11:51:21,426][102897] Updated weights for policy 0, policy_version 1990 (0.0008) +[2023-10-08 11:51:21,807][102897] Updated weights for policy 0, policy_version 2000 (0.0008) +[2023-10-08 11:51:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 13879.4). Total num frames: 4063232. Throughput: 0: 1779.6, 1: 1755.4. Samples: 1024238. Policy #0 lag: (min: 31.0, avg: 32.2, max: 56.0) +[2023-10-08 11:51:21,876][101941] Avg episode reward: [(0, '5.160'), (1, '5.000')] +[2023-10-08 11:51:22,190][102897] Updated weights for policy 0, policy_version 2010 (0.0009) +[2023-10-08 11:51:22,538][102898] Updated weights for policy 1, policy_version 1990 (0.0008) +[2023-10-08 11:51:22,906][102898] Updated weights for policy 1, policy_version 2000 (0.0009) +[2023-10-08 11:51:23,278][102898] Updated weights for policy 1, policy_version 2010 (0.0007) +[2023-10-08 11:51:25,874][102897] Updated weights for policy 0, policy_version 2020 (0.0008) +[2023-10-08 11:51:26,244][102897] Updated weights for policy 0, policy_version 2030 (0.0007) +[2023-10-08 11:51:26,619][102897] Updated weights for policy 0, policy_version 2040 (0.0007) +[2023-10-08 11:51:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 4128768. Throughput: 0: 1790.6, 1: 1758.1. Samples: 1046734. Policy #0 lag: (min: 1.0, avg: 5.1, max: 33.0) +[2023-10-08 11:51:26,876][101941] Avg episode reward: [(0, '5.480'), (1, '4.930')] +[2023-10-08 11:51:26,978][102898] Updated weights for policy 1, policy_version 2020 (0.0008) +[2023-10-08 11:51:27,344][102898] Updated weights for policy 1, policy_version 2030 (0.0007) +[2023-10-08 11:51:27,713][102898] Updated weights for policy 1, policy_version 2040 (0.0009) +[2023-10-08 11:51:30,530][102897] Updated weights for policy 0, policy_version 2050 (0.0007) +[2023-10-08 11:51:30,907][102897] Updated weights for policy 0, policy_version 2060 (0.0011) +[2023-10-08 11:51:31,282][102897] Updated weights for policy 0, policy_version 2070 (0.0009) +[2023-10-08 11:51:31,513][102898] Updated weights for policy 1, policy_version 2050 (0.0008) +[2023-10-08 11:51:31,652][102897] Updated weights for policy 0, policy_version 2080 (0.0007) +[2023-10-08 11:51:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 4227072. Throughput: 0: 1790.8, 1: 1786.5. Samples: 1067642. Policy #0 lag: (min: 31.0, avg: 35.3, max: 63.0) +[2023-10-08 11:51:31,876][101941] Avg episode reward: [(0, '5.250'), (1, '5.140')] +[2023-10-08 11:51:31,881][102898] Updated weights for policy 1, policy_version 2060 (0.0010) +[2023-10-08 11:51:32,254][102898] Updated weights for policy 1, policy_version 2070 (0.0007) +[2023-10-08 11:51:32,625][102898] Updated weights for policy 1, policy_version 2080 (0.0008) +[2023-10-08 11:51:35,431][102897] Updated weights for policy 0, policy_version 2090 (0.0007) +[2023-10-08 11:51:35,802][102897] Updated weights for policy 0, policy_version 2100 (0.0008) +[2023-10-08 11:51:36,169][102897] Updated weights for policy 0, policy_version 2110 (0.0007) +[2023-10-08 11:51:36,387][102898] Updated weights for policy 1, policy_version 2090 (0.0008) +[2023-10-08 11:51:36,758][102898] Updated weights for policy 1, policy_version 2100 (0.0007) +[2023-10-08 11:51:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 4292608. Throughput: 0: 1784.9, 1: 1753.7. Samples: 1078334. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 11:51:36,875][101941] Avg episode reward: [(0, '5.550'), (1, '5.450')] +[2023-10-08 11:51:37,125][102898] Updated weights for policy 1, policy_version 2110 (0.0007) +[2023-10-08 11:51:39,912][102897] Updated weights for policy 0, policy_version 2120 (0.0010) +[2023-10-08 11:51:40,292][102897] Updated weights for policy 0, policy_version 2130 (0.0010) +[2023-10-08 11:51:40,662][102897] Updated weights for policy 0, policy_version 2140 (0.0009) +[2023-10-08 11:51:40,902][102898] Updated weights for policy 1, policy_version 2120 (0.0008) +[2023-10-08 11:51:41,262][102898] Updated weights for policy 1, policy_version 2130 (0.0008) +[2023-10-08 11:51:41,641][102898] Updated weights for policy 1, policy_version 2140 (0.0008) +[2023-10-08 11:51:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 4390912. Throughput: 0: 1804.9, 1: 1782.4. Samples: 1100086. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 11:51:41,876][101941] Avg episode reward: [(0, '6.220'), (1, '5.190')] +[2023-10-08 11:51:41,877][102634] Saving new best policy, reward=6.220! +[2023-10-08 11:51:44,347][102897] Updated weights for policy 0, policy_version 2150 (0.0008) +[2023-10-08 11:51:44,720][102897] Updated weights for policy 0, policy_version 2160 (0.0007) +[2023-10-08 11:51:45,091][102897] Updated weights for policy 0, policy_version 2170 (0.0008) +[2023-10-08 11:51:45,481][102898] Updated weights for policy 1, policy_version 2150 (0.0010) +[2023-10-08 11:51:45,859][102898] Updated weights for policy 1, policy_version 2160 (0.0008) +[2023-10-08 11:51:46,241][102898] Updated weights for policy 1, policy_version 2170 (0.0010) +[2023-10-08 11:51:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 4456448. Throughput: 0: 1793.3, 1: 1761.8. Samples: 1120786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:51:46,875][101941] Avg episode reward: [(0, '5.880'), (1, '5.360')] +[2023-10-08 11:51:48,863][102897] Updated weights for policy 0, policy_version 2180 (0.0008) +[2023-10-08 11:51:49,229][102897] Updated weights for policy 0, policy_version 2190 (0.0009) +[2023-10-08 11:51:49,604][102897] Updated weights for policy 0, policy_version 2200 (0.0010) +[2023-10-08 11:51:49,973][102898] Updated weights for policy 1, policy_version 2180 (0.0009) +[2023-10-08 11:51:50,337][102898] Updated weights for policy 1, policy_version 2190 (0.0008) +[2023-10-08 11:51:50,702][102898] Updated weights for policy 1, policy_version 2200 (0.0008) +[2023-10-08 11:51:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 4521984. Throughput: 0: 1807.9, 1: 1784.8. Samples: 1132446. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:51:51,876][101941] Avg episode reward: [(0, '5.700'), (1, '6.670')] +[2023-10-08 11:51:51,879][102760] Saving new best policy, reward=6.670! +[2023-10-08 11:51:53,370][102897] Updated weights for policy 0, policy_version 2210 (0.0008) +[2023-10-08 11:51:53,734][102897] Updated weights for policy 0, policy_version 2220 (0.0007) +[2023-10-08 11:51:54,099][102897] Updated weights for policy 0, policy_version 2230 (0.0007) +[2023-10-08 11:51:54,450][102898] Updated weights for policy 1, policy_version 2210 (0.0009) +[2023-10-08 11:51:54,472][102897] Updated weights for policy 0, policy_version 2240 (0.0008) +[2023-10-08 11:51:54,828][102898] Updated weights for policy 1, policy_version 2220 (0.0008) +[2023-10-08 11:51:55,202][102898] Updated weights for policy 1, policy_version 2230 (0.0009) +[2023-10-08 11:51:55,568][102898] Updated weights for policy 1, policy_version 2240 (0.0009) +[2023-10-08 11:51:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 4587520. Throughput: 0: 1797.2, 1: 1770.0. Samples: 1152950. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:51:56,875][101941] Avg episode reward: [(0, '5.350'), (1, '6.170')] +[2023-10-08 11:51:58,325][102897] Updated weights for policy 0, policy_version 2250 (0.0008) +[2023-10-08 11:51:58,698][102897] Updated weights for policy 0, policy_version 2260 (0.0007) +[2023-10-08 11:51:59,071][102897] Updated weights for policy 0, policy_version 2270 (0.0008) +[2023-10-08 11:51:59,212][102898] Updated weights for policy 1, policy_version 2250 (0.0010) +[2023-10-08 11:51:59,579][102898] Updated weights for policy 1, policy_version 2260 (0.0007) +[2023-10-08 11:51:59,949][102898] Updated weights for policy 1, policy_version 2270 (0.0007) +[2023-10-08 11:52:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 4653056. Throughput: 0: 1793.5, 1: 1776.8. Samples: 1175128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:52:01,875][101941] Avg episode reward: [(0, '5.320'), (1, '5.440')] +[2023-10-08 11:52:02,877][102897] Updated weights for policy 0, policy_version 2280 (0.0008) +[2023-10-08 11:52:03,256][102897] Updated weights for policy 0, policy_version 2290 (0.0009) +[2023-10-08 11:52:03,620][102897] Updated weights for policy 0, policy_version 2300 (0.0008) +[2023-10-08 11:52:03,804][102898] Updated weights for policy 1, policy_version 2280 (0.0008) +[2023-10-08 11:52:04,181][102898] Updated weights for policy 1, policy_version 2290 (0.0009) +[2023-10-08 11:52:04,545][102898] Updated weights for policy 1, policy_version 2300 (0.0007) +[2023-10-08 11:52:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 4718592. Throughput: 0: 1791.4, 1: 1784.4. Samples: 1185148. Policy #0 lag: (min: 9.0, avg: 25.4, max: 41.0) +[2023-10-08 11:52:06,875][101941] Avg episode reward: [(0, '5.910'), (1, '5.010')] +[2023-10-08 11:52:07,341][102897] Updated weights for policy 0, policy_version 2310 (0.0008) +[2023-10-08 11:52:07,720][102897] Updated weights for policy 0, policy_version 2320 (0.0010) +[2023-10-08 11:52:08,082][102897] Updated weights for policy 0, policy_version 2330 (0.0010) +[2023-10-08 11:52:08,405][102898] Updated weights for policy 1, policy_version 2310 (0.0008) +[2023-10-08 11:52:08,773][102898] Updated weights for policy 1, policy_version 2320 (0.0009) +[2023-10-08 11:52:09,149][102898] Updated weights for policy 1, policy_version 2330 (0.0008) +[2023-10-08 11:52:11,671][102897] Updated weights for policy 0, policy_version 2340 (0.0009) +[2023-10-08 11:52:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 4784128. Throughput: 0: 1788.6, 1: 1771.5. Samples: 1206940. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 11:52:11,875][101941] Avg episode reward: [(0, '6.100'), (1, '4.440')] +[2023-10-08 11:52:12,050][102897] Updated weights for policy 0, policy_version 2350 (0.0009) +[2023-10-08 11:52:12,413][102897] Updated weights for policy 0, policy_version 2360 (0.0010) +[2023-10-08 11:52:12,837][102898] Updated weights for policy 1, policy_version 2340 (0.0008) +[2023-10-08 11:52:13,208][102898] Updated weights for policy 1, policy_version 2350 (0.0011) +[2023-10-08 11:52:13,577][102898] Updated weights for policy 1, policy_version 2360 (0.0010) +[2023-10-08 11:52:16,231][102897] Updated weights for policy 0, policy_version 2370 (0.0008) +[2023-10-08 11:52:16,608][102897] Updated weights for policy 0, policy_version 2380 (0.0009) +[2023-10-08 11:52:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 4849664. Throughput: 0: 1809.4, 1: 1777.2. Samples: 1229038. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 11:52:16,876][101941] Avg episode reward: [(0, '5.580'), (1, '5.010')] +[2023-10-08 11:52:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000002368_2424832.pth... +[2023-10-08 11:52:16,912][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000000704_720896.pth +[2023-10-08 11:52:16,978][102897] Updated weights for policy 0, policy_version 2390 (0.0008) +[2023-10-08 11:52:17,353][102897] Updated weights for policy 0, policy_version 2400 (0.0008) +[2023-10-08 11:52:17,354][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000002400_2457600.pth... +[2023-10-08 11:52:17,377][102898] Updated weights for policy 1, policy_version 2370 (0.0007) +[2023-10-08 11:52:17,382][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000000704_720896.pth +[2023-10-08 11:52:17,740][102898] Updated weights for policy 1, policy_version 2380 (0.0007) +[2023-10-08 11:52:18,111][102898] Updated weights for policy 1, policy_version 2390 (0.0007) +[2023-10-08 11:52:18,479][102898] Updated weights for policy 1, policy_version 2400 (0.0007) +[2023-10-08 11:52:20,969][102897] Updated weights for policy 0, policy_version 2410 (0.0008) +[2023-10-08 11:52:21,348][102897] Updated weights for policy 0, policy_version 2420 (0.0008) +[2023-10-08 11:52:21,719][102897] Updated weights for policy 0, policy_version 2430 (0.0007) +[2023-10-08 11:52:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 4947968. Throughput: 0: 1790.9, 1: 1781.4. Samples: 1239090. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:52:21,876][101941] Avg episode reward: [(0, '5.610'), (1, '5.320')] +[2023-10-08 11:52:22,206][102898] Updated weights for policy 1, policy_version 2410 (0.0008) +[2023-10-08 11:52:22,581][102898] Updated weights for policy 1, policy_version 2420 (0.0008) +[2023-10-08 11:52:22,941][102898] Updated weights for policy 1, policy_version 2430 (0.0007) +[2023-10-08 11:52:25,477][102897] Updated weights for policy 0, policy_version 2440 (0.0009) +[2023-10-08 11:52:25,849][102897] Updated weights for policy 0, policy_version 2450 (0.0008) +[2023-10-08 11:52:26,233][102897] Updated weights for policy 0, policy_version 2460 (0.0009) +[2023-10-08 11:52:26,738][102898] Updated weights for policy 1, policy_version 2440 (0.0009) +[2023-10-08 11:52:26,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 5013504. Throughput: 0: 1799.8, 1: 1781.0. Samples: 1261222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:52:26,876][101941] Avg episode reward: [(0, '5.960'), (1, '5.160')] +[2023-10-08 11:52:27,106][102898] Updated weights for policy 1, policy_version 2450 (0.0007) +[2023-10-08 11:52:27,470][102898] Updated weights for policy 1, policy_version 2460 (0.0007) +[2023-10-08 11:52:30,026][102897] Updated weights for policy 0, policy_version 2470 (0.0008) +[2023-10-08 11:52:30,401][102897] Updated weights for policy 0, policy_version 2480 (0.0007) +[2023-10-08 11:52:30,772][102897] Updated weights for policy 0, policy_version 2490 (0.0008) +[2023-10-08 11:52:31,149][102898] Updated weights for policy 1, policy_version 2470 (0.0007) +[2023-10-08 11:52:31,517][102898] Updated weights for policy 1, policy_version 2480 (0.0008) +[2023-10-08 11:52:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 5079040. Throughput: 0: 1776.4, 1: 1798.7. Samples: 1281666. Policy #0 lag: (min: 21.0, avg: 21.6, max: 38.0) +[2023-10-08 11:52:31,876][101941] Avg episode reward: [(0, '5.550'), (1, '4.520')] +[2023-10-08 11:52:31,891][102898] Updated weights for policy 1, policy_version 2490 (0.0008) +[2023-10-08 11:52:34,548][102897] Updated weights for policy 0, policy_version 2500 (0.0007) +[2023-10-08 11:52:34,924][102897] Updated weights for policy 0, policy_version 2510 (0.0007) +[2023-10-08 11:52:35,289][102897] Updated weights for policy 0, policy_version 2520 (0.0008) +[2023-10-08 11:52:35,545][102898] Updated weights for policy 1, policy_version 2500 (0.0010) +[2023-10-08 11:52:35,909][102898] Updated weights for policy 1, policy_version 2510 (0.0008) +[2023-10-08 11:52:36,274][102898] Updated weights for policy 1, policy_version 2520 (0.0007) +[2023-10-08 11:52:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 5177344. Throughput: 0: 1800.3, 1: 1785.4. Samples: 1293802. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 11:52:36,876][101941] Avg episode reward: [(0, '5.370'), (1, '5.070')] +[2023-10-08 11:52:38,970][102897] Updated weights for policy 0, policy_version 2530 (0.0008) +[2023-10-08 11:52:39,329][102897] Updated weights for policy 0, policy_version 2540 (0.0007) +[2023-10-08 11:52:39,714][102897] Updated weights for policy 0, policy_version 2550 (0.0009) +[2023-10-08 11:52:40,051][102898] Updated weights for policy 1, policy_version 2530 (0.0007) +[2023-10-08 11:52:40,085][102897] Updated weights for policy 0, policy_version 2560 (0.0009) +[2023-10-08 11:52:40,419][102898] Updated weights for policy 1, policy_version 2540 (0.0010) +[2023-10-08 11:52:40,786][102898] Updated weights for policy 1, policy_version 2550 (0.0011) +[2023-10-08 11:52:41,153][102898] Updated weights for policy 1, policy_version 2560 (0.0008) +[2023-10-08 11:52:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 5242880. Throughput: 0: 1784.5, 1: 1804.3. Samples: 1314446. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:52:41,876][101941] Avg episode reward: [(0, '5.220'), (1, '5.470')] +[2023-10-08 11:52:43,860][102897] Updated weights for policy 0, policy_version 2570 (0.0009) +[2023-10-08 11:52:44,245][102897] Updated weights for policy 0, policy_version 2580 (0.0009) +[2023-10-08 11:52:44,620][102897] Updated weights for policy 0, policy_version 2590 (0.0009) +[2023-10-08 11:52:44,919][102898] Updated weights for policy 1, policy_version 2570 (0.0009) +[2023-10-08 11:52:45,288][102898] Updated weights for policy 1, policy_version 2580 (0.0009) +[2023-10-08 11:52:45,656][102898] Updated weights for policy 1, policy_version 2590 (0.0008) +[2023-10-08 11:52:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 5308416. Throughput: 0: 1781.6, 1: 1787.1. Samples: 1335720. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:52:46,876][101941] Avg episode reward: [(0, '4.590'), (1, '5.470')] +[2023-10-08 11:52:48,437][102897] Updated weights for policy 0, policy_version 2600 (0.0008) +[2023-10-08 11:52:48,821][102897] Updated weights for policy 0, policy_version 2610 (0.0010) +[2023-10-08 11:52:49,182][102897] Updated weights for policy 0, policy_version 2620 (0.0007) +[2023-10-08 11:52:49,389][102898] Updated weights for policy 1, policy_version 2600 (0.0008) +[2023-10-08 11:52:49,765][102898] Updated weights for policy 1, policy_version 2610 (0.0008) +[2023-10-08 11:52:50,128][102898] Updated weights for policy 1, policy_version 2620 (0.0008) +[2023-10-08 11:52:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 5373952. Throughput: 0: 1779.1, 1: 1803.9. Samples: 1346382. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 11:52:51,876][101941] Avg episode reward: [(0, '4.910'), (1, '5.820')] +[2023-10-08 11:52:52,997][102897] Updated weights for policy 0, policy_version 2630 (0.0009) +[2023-10-08 11:52:53,375][102897] Updated weights for policy 0, policy_version 2640 (0.0009) +[2023-10-08 11:52:53,749][102897] Updated weights for policy 0, policy_version 2650 (0.0009) +[2023-10-08 11:52:53,943][102898] Updated weights for policy 1, policy_version 2630 (0.0008) +[2023-10-08 11:52:54,314][102898] Updated weights for policy 1, policy_version 2640 (0.0011) +[2023-10-08 11:52:54,698][102898] Updated weights for policy 1, policy_version 2650 (0.0011) +[2023-10-08 11:52:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 5439488. Throughput: 0: 1782.5, 1: 1794.8. Samples: 1367918. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 11:52:56,875][101941] Avg episode reward: [(0, '6.000'), (1, '5.310')] +[2023-10-08 11:52:57,549][102897] Updated weights for policy 0, policy_version 2660 (0.0008) +[2023-10-08 11:52:57,923][102897] Updated weights for policy 0, policy_version 2670 (0.0008) +[2023-10-08 11:52:58,301][102897] Updated weights for policy 0, policy_version 2680 (0.0008) +[2023-10-08 11:52:58,426][102898] Updated weights for policy 1, policy_version 2660 (0.0008) +[2023-10-08 11:52:58,806][102898] Updated weights for policy 1, policy_version 2670 (0.0009) +[2023-10-08 11:52:59,171][102898] Updated weights for policy 1, policy_version 2680 (0.0010) +[2023-10-08 11:53:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 5505024. Throughput: 0: 1789.3, 1: 1796.9. Samples: 1390414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:53:01,875][101941] Avg episode reward: [(0, '5.880'), (1, '4.950')] +[2023-10-08 11:53:02,111][102897] Updated weights for policy 0, policy_version 2690 (0.0008) +[2023-10-08 11:53:02,469][102897] Updated weights for policy 0, policy_version 2700 (0.0011) +[2023-10-08 11:53:02,843][102897] Updated weights for policy 0, policy_version 2710 (0.0007) +[2023-10-08 11:53:02,917][102898] Updated weights for policy 1, policy_version 2690 (0.0009) +[2023-10-08 11:53:03,207][102897] Updated weights for policy 0, policy_version 2720 (0.0008) +[2023-10-08 11:53:03,289][102898] Updated weights for policy 1, policy_version 2700 (0.0008) +[2023-10-08 11:53:03,652][102898] Updated weights for policy 1, policy_version 2710 (0.0010) +[2023-10-08 11:53:04,025][102898] Updated weights for policy 1, policy_version 2720 (0.0010) +[2023-10-08 11:53:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 5570560. Throughput: 0: 1780.7, 1: 1791.9. Samples: 1399858. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:53:06,876][101941] Avg episode reward: [(0, '4.800'), (1, '4.850')] +[2023-10-08 11:53:07,096][102897] Updated weights for policy 0, policy_version 2730 (0.0010) +[2023-10-08 11:53:07,474][102897] Updated weights for policy 0, policy_version 2740 (0.0008) +[2023-10-08 11:53:07,853][102897] Updated weights for policy 0, policy_version 2750 (0.0008) +[2023-10-08 11:53:07,938][102898] Updated weights for policy 1, policy_version 2730 (0.0008) +[2023-10-08 11:53:08,298][102898] Updated weights for policy 1, policy_version 2740 (0.0008) +[2023-10-08 11:53:08,670][102898] Updated weights for policy 1, policy_version 2750 (0.0007) +[2023-10-08 11:53:11,688][102897] Updated weights for policy 0, policy_version 2760 (0.0009) +[2023-10-08 11:53:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 5636096. Throughput: 0: 1785.5, 1: 1788.3. Samples: 1422046. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 11:53:11,876][101941] Avg episode reward: [(0, '5.090'), (1, '5.000')] +[2023-10-08 11:53:12,049][102897] Updated weights for policy 0, policy_version 2770 (0.0009) +[2023-10-08 11:53:12,424][102898] Updated weights for policy 1, policy_version 2760 (0.0009) +[2023-10-08 11:53:12,435][102897] Updated weights for policy 0, policy_version 2780 (0.0009) +[2023-10-08 11:53:12,792][102898] Updated weights for policy 1, policy_version 2770 (0.0009) +[2023-10-08 11:53:13,166][102898] Updated weights for policy 1, policy_version 2780 (0.0010) +[2023-10-08 11:53:16,105][102897] Updated weights for policy 0, policy_version 2790 (0.0008) +[2023-10-08 11:53:16,474][102897] Updated weights for policy 0, policy_version 2800 (0.0008) +[2023-10-08 11:53:16,835][102898] Updated weights for policy 1, policy_version 2790 (0.0008) +[2023-10-08 11:53:16,848][102897] Updated weights for policy 0, policy_version 2810 (0.0009) +[2023-10-08 11:53:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 5701632. Throughput: 0: 1804.3, 1: 1801.4. Samples: 1443924. Policy #0 lag: (min: 25.0, avg: 42.5, max: 57.0) +[2023-10-08 11:53:16,876][101941] Avg episode reward: [(0, '5.500'), (1, '5.220')] +[2023-10-08 11:53:17,205][102898] Updated weights for policy 1, policy_version 2800 (0.0007) +[2023-10-08 11:53:17,566][102898] Updated weights for policy 1, policy_version 2810 (0.0007) +[2023-10-08 11:53:20,491][102897] Updated weights for policy 0, policy_version 2820 (0.0007) +[2023-10-08 11:53:20,860][102897] Updated weights for policy 0, policy_version 2830 (0.0007) +[2023-10-08 11:53:21,234][102897] Updated weights for policy 0, policy_version 2840 (0.0010) +[2023-10-08 11:53:21,463][102898] Updated weights for policy 1, policy_version 2820 (0.0008) +[2023-10-08 11:53:21,829][102898] Updated weights for policy 1, policy_version 2830 (0.0009) +[2023-10-08 11:53:21,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 5799936. Throughput: 0: 1782.6, 1: 1783.6. Samples: 1454280. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:53:21,876][101941] Avg episode reward: [(0, '5.530'), (1, '4.960')] +[2023-10-08 11:53:22,200][102898] Updated weights for policy 1, policy_version 2840 (0.0009) +[2023-10-08 11:53:24,972][102897] Updated weights for policy 0, policy_version 2850 (0.0008) +[2023-10-08 11:53:25,340][102897] Updated weights for policy 0, policy_version 2860 (0.0009) +[2023-10-08 11:53:25,723][102897] Updated weights for policy 0, policy_version 2870 (0.0008) +[2023-10-08 11:53:26,014][102898] Updated weights for policy 1, policy_version 2850 (0.0009) +[2023-10-08 11:53:26,090][102897] Updated weights for policy 0, policy_version 2880 (0.0008) +[2023-10-08 11:53:26,387][102898] Updated weights for policy 1, policy_version 2860 (0.0009) +[2023-10-08 11:53:26,757][102898] Updated weights for policy 1, policy_version 2870 (0.0009) +[2023-10-08 11:53:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 5865472. Throughput: 0: 1798.4, 1: 1794.4. Samples: 1476126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:53:26,876][101941] Avg episode reward: [(0, '5.570'), (1, '5.070')] +[2023-10-08 11:53:27,112][102898] Updated weights for policy 1, policy_version 2880 (0.0010) +[2023-10-08 11:53:29,934][102897] Updated weights for policy 0, policy_version 2890 (0.0008) +[2023-10-08 11:53:30,307][102897] Updated weights for policy 0, policy_version 2900 (0.0007) +[2023-10-08 11:53:30,675][102897] Updated weights for policy 0, policy_version 2910 (0.0010) +[2023-10-08 11:53:30,940][102898] Updated weights for policy 1, policy_version 2890 (0.0009) +[2023-10-08 11:53:31,305][102898] Updated weights for policy 1, policy_version 2900 (0.0008) +[2023-10-08 11:53:31,679][102898] Updated weights for policy 1, policy_version 2910 (0.0008) +[2023-10-08 11:53:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 5963776. Throughput: 0: 1779.6, 1: 1788.3. Samples: 1496274. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 11:53:31,875][101941] Avg episode reward: [(0, '5.840'), (1, '5.660')] +[2023-10-08 11:53:34,463][102897] Updated weights for policy 0, policy_version 2920 (0.0009) +[2023-10-08 11:53:34,830][102897] Updated weights for policy 0, policy_version 2930 (0.0008) +[2023-10-08 11:53:35,196][102897] Updated weights for policy 0, policy_version 2940 (0.0007) +[2023-10-08 11:53:35,622][102898] Updated weights for policy 1, policy_version 2920 (0.0009) +[2023-10-08 11:53:35,992][102898] Updated weights for policy 1, policy_version 2930 (0.0009) +[2023-10-08 11:53:36,352][102898] Updated weights for policy 1, policy_version 2940 (0.0008) +[2023-10-08 11:53:36,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 6029312. Throughput: 0: 1808.0, 1: 1785.5. Samples: 1508088. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 11:53:36,876][101941] Avg episode reward: [(0, '5.680'), (1, '5.760')] +[2023-10-08 11:53:38,993][102897] Updated weights for policy 0, policy_version 2950 (0.0010) +[2023-10-08 11:53:39,357][102897] Updated weights for policy 0, policy_version 2960 (0.0009) +[2023-10-08 11:53:39,730][102897] Updated weights for policy 0, policy_version 2970 (0.0007) +[2023-10-08 11:53:40,142][102898] Updated weights for policy 1, policy_version 2950 (0.0010) +[2023-10-08 11:53:40,515][102898] Updated weights for policy 1, policy_version 2960 (0.0009) +[2023-10-08 11:53:40,884][102898] Updated weights for policy 1, policy_version 2970 (0.0009) +[2023-10-08 11:53:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 6094848. Throughput: 0: 1774.7, 1: 1792.5. Samples: 1528440. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 11:53:41,876][101941] Avg episode reward: [(0, '5.110'), (1, '5.820')] +[2023-10-08 11:53:43,422][102897] Updated weights for policy 0, policy_version 2980 (0.0008) +[2023-10-08 11:53:43,794][102897] Updated weights for policy 0, policy_version 2990 (0.0007) +[2023-10-08 11:53:44,173][102897] Updated weights for policy 0, policy_version 3000 (0.0008) +[2023-10-08 11:53:44,582][102898] Updated weights for policy 1, policy_version 2980 (0.0008) +[2023-10-08 11:53:44,944][102898] Updated weights for policy 1, policy_version 2990 (0.0007) +[2023-10-08 11:53:45,317][102898] Updated weights for policy 1, policy_version 3000 (0.0008) +[2023-10-08 11:53:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 6160384. Throughput: 0: 1778.9, 1: 1771.6. Samples: 1550186. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 11:53:46,876][101941] Avg episode reward: [(0, '5.100'), (1, '5.770')] +[2023-10-08 11:53:47,991][102897] Updated weights for policy 0, policy_version 3010 (0.0008) +[2023-10-08 11:53:48,375][102897] Updated weights for policy 0, policy_version 3020 (0.0010) +[2023-10-08 11:53:48,757][102897] Updated weights for policy 0, policy_version 3030 (0.0010) +[2023-10-08 11:53:49,125][102897] Updated weights for policy 0, policy_version 3040 (0.0007) +[2023-10-08 11:53:49,146][102898] Updated weights for policy 1, policy_version 3010 (0.0009) +[2023-10-08 11:53:49,509][102898] Updated weights for policy 1, policy_version 3020 (0.0009) +[2023-10-08 11:53:49,887][102898] Updated weights for policy 1, policy_version 3030 (0.0009) +[2023-10-08 11:53:50,260][102898] Updated weights for policy 1, policy_version 3040 (0.0007) +[2023-10-08 11:53:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 6225920. Throughput: 0: 1781.6, 1: 1795.9. Samples: 1560844. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 11:53:51,876][101941] Avg episode reward: [(0, '5.300'), (1, '5.680')] +[2023-10-08 11:53:52,870][102897] Updated weights for policy 0, policy_version 3050 (0.0009) +[2023-10-08 11:53:53,254][102897] Updated weights for policy 0, policy_version 3060 (0.0007) +[2023-10-08 11:53:53,626][102897] Updated weights for policy 0, policy_version 3070 (0.0007) +[2023-10-08 11:53:54,211][102898] Updated weights for policy 1, policy_version 3050 (0.0008) +[2023-10-08 11:53:54,586][102898] Updated weights for policy 1, policy_version 3060 (0.0009) +[2023-10-08 11:53:54,953][102898] Updated weights for policy 1, policy_version 3070 (0.0008) +[2023-10-08 11:53:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 6291456. Throughput: 0: 1784.4, 1: 1771.7. Samples: 1582068. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 11:53:56,876][101941] Avg episode reward: [(0, '5.740'), (1, '4.990')] +[2023-10-08 11:53:57,353][102897] Updated weights for policy 0, policy_version 3080 (0.0008) +[2023-10-08 11:53:57,733][102897] Updated weights for policy 0, policy_version 3090 (0.0007) +[2023-10-08 11:53:58,115][102897] Updated weights for policy 0, policy_version 3100 (0.0008) +[2023-10-08 11:53:58,706][102898] Updated weights for policy 1, policy_version 3080 (0.0007) +[2023-10-08 11:53:59,068][102898] Updated weights for policy 1, policy_version 3090 (0.0007) +[2023-10-08 11:53:59,438][102898] Updated weights for policy 1, policy_version 3100 (0.0008) +[2023-10-08 11:54:01,830][102897] Updated weights for policy 0, policy_version 3110 (0.0009) +[2023-10-08 11:54:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 6356992. Throughput: 0: 1797.6, 1: 1768.3. Samples: 1604394. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 11:54:01,876][101941] Avg episode reward: [(0, '6.270'), (1, '5.060')] +[2023-10-08 11:54:02,205][102897] Updated weights for policy 0, policy_version 3120 (0.0008) +[2023-10-08 11:54:02,577][102897] Updated weights for policy 0, policy_version 3130 (0.0007) +[2023-10-08 11:54:02,802][102634] Saving new best policy, reward=6.270! +[2023-10-08 11:54:03,217][102898] Updated weights for policy 1, policy_version 3110 (0.0009) +[2023-10-08 11:54:03,583][102898] Updated weights for policy 1, policy_version 3120 (0.0009) +[2023-10-08 11:54:03,959][102898] Updated weights for policy 1, policy_version 3130 (0.0010) +[2023-10-08 11:54:06,319][102897] Updated weights for policy 0, policy_version 3140 (0.0007) +[2023-10-08 11:54:06,684][102897] Updated weights for policy 0, policy_version 3150 (0.0008) +[2023-10-08 11:54:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 6422528. Throughput: 0: 1782.1, 1: 1770.4. Samples: 1614142. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:06,876][101941] Avg episode reward: [(0, '6.180'), (1, '5.640')] +[2023-10-08 11:54:07,048][102897] Updated weights for policy 0, policy_version 3160 (0.0008) +[2023-10-08 11:54:07,654][102898] Updated weights for policy 1, policy_version 3140 (0.0010) +[2023-10-08 11:54:08,015][102898] Updated weights for policy 1, policy_version 3150 (0.0011) +[2023-10-08 11:54:08,397][102898] Updated weights for policy 1, policy_version 3160 (0.0008) +[2023-10-08 11:54:10,881][102897] Updated weights for policy 0, policy_version 3170 (0.0008) +[2023-10-08 11:54:11,251][102897] Updated weights for policy 0, policy_version 3180 (0.0007) +[2023-10-08 11:54:11,621][102897] Updated weights for policy 0, policy_version 3190 (0.0009) +[2023-10-08 11:54:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 6488064. Throughput: 0: 1787.4, 1: 1773.2. Samples: 1636352. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:11,875][101941] Avg episode reward: [(0, '6.320'), (1, '5.290')] +[2023-10-08 11:54:11,985][102634] Saving new best policy, reward=6.320! +[2023-10-08 11:54:11,985][102897] Updated weights for policy 0, policy_version 3200 (0.0009) +[2023-10-08 11:54:12,229][102898] Updated weights for policy 1, policy_version 3170 (0.0009) +[2023-10-08 11:54:12,593][102898] Updated weights for policy 1, policy_version 3180 (0.0009) +[2023-10-08 11:54:12,955][102898] Updated weights for policy 1, policy_version 3190 (0.0008) +[2023-10-08 11:54:13,321][102898] Updated weights for policy 1, policy_version 3200 (0.0008) +[2023-10-08 11:54:15,684][102897] Updated weights for policy 0, policy_version 3210 (0.0008) +[2023-10-08 11:54:16,061][102897] Updated weights for policy 0, policy_version 3220 (0.0007) +[2023-10-08 11:54:16,438][102897] Updated weights for policy 0, policy_version 3230 (0.0007) +[2023-10-08 11:54:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 6586368. Throughput: 0: 1784.7, 1: 1799.0. Samples: 1657542. Policy #0 lag: (min: 29.0, avg: 29.5, max: 45.0) +[2023-10-08 11:54:16,876][101941] Avg episode reward: [(0, '6.410'), (1, '4.840')] +[2023-10-08 11:54:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000003232_3309568.pth... +[2023-10-08 11:54:16,920][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000001536_1572864.pth +[2023-10-08 11:54:16,924][102634] Saving new best policy, reward=6.410! +[2023-10-08 11:54:16,973][102898] Updated weights for policy 1, policy_version 3210 (0.0007) +[2023-10-08 11:54:17,343][102898] Updated weights for policy 1, policy_version 3220 (0.0007) +[2023-10-08 11:54:17,715][102898] Updated weights for policy 1, policy_version 3230 (0.0008) +[2023-10-08 11:54:17,790][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000003232_3309568.pth... +[2023-10-08 11:54:17,829][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000001536_1572864.pth +[2023-10-08 11:54:20,217][102897] Updated weights for policy 0, policy_version 3240 (0.0008) +[2023-10-08 11:54:20,587][102897] Updated weights for policy 0, policy_version 3250 (0.0007) +[2023-10-08 11:54:20,964][102897] Updated weights for policy 0, policy_version 3260 (0.0010) +[2023-10-08 11:54:21,552][102898] Updated weights for policy 1, policy_version 3240 (0.0008) +[2023-10-08 11:54:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 6651904. Throughput: 0: 1788.7, 1: 1774.4. Samples: 1668426. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 11:54:21,876][101941] Avg episode reward: [(0, '5.860'), (1, '4.680')] +[2023-10-08 11:54:21,932][102898] Updated weights for policy 1, policy_version 3250 (0.0008) +[2023-10-08 11:54:22,294][102898] Updated weights for policy 1, policy_version 3260 (0.0007) +[2023-10-08 11:54:24,567][102897] Updated weights for policy 0, policy_version 3270 (0.0008) +[2023-10-08 11:54:24,940][102897] Updated weights for policy 0, policy_version 3280 (0.0007) +[2023-10-08 11:54:25,314][102897] Updated weights for policy 0, policy_version 3290 (0.0007) +[2023-10-08 11:54:26,095][102898] Updated weights for policy 1, policy_version 3270 (0.0010) +[2023-10-08 11:54:26,462][102898] Updated weights for policy 1, policy_version 3280 (0.0007) +[2023-10-08 11:54:26,823][102898] Updated weights for policy 1, policy_version 3290 (0.0007) +[2023-10-08 11:54:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 6717440. Throughput: 0: 1793.1, 1: 1786.4. Samples: 1689518. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 11:54:26,876][101941] Avg episode reward: [(0, '5.550'), (1, '5.090')] +[2023-10-08 11:54:29,186][102897] Updated weights for policy 0, policy_version 3300 (0.0008) +[2023-10-08 11:54:29,561][102897] Updated weights for policy 0, policy_version 3310 (0.0007) +[2023-10-08 11:54:29,926][102897] Updated weights for policy 0, policy_version 3320 (0.0007) +[2023-10-08 11:54:30,641][102898] Updated weights for policy 1, policy_version 3300 (0.0007) +[2023-10-08 11:54:31,009][102898] Updated weights for policy 1, policy_version 3310 (0.0010) +[2023-10-08 11:54:31,384][102898] Updated weights for policy 1, policy_version 3320 (0.0009) +[2023-10-08 11:54:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 6815744. Throughput: 0: 1782.7, 1: 1780.5. Samples: 1710532. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:31,876][101941] Avg episode reward: [(0, '5.700'), (1, '5.340')] +[2023-10-08 11:54:33,606][102897] Updated weights for policy 0, policy_version 3330 (0.0007) +[2023-10-08 11:54:33,974][102897] Updated weights for policy 0, policy_version 3340 (0.0007) +[2023-10-08 11:54:34,359][102897] Updated weights for policy 0, policy_version 3350 (0.0010) +[2023-10-08 11:54:34,733][102897] Updated weights for policy 0, policy_version 3360 (0.0008) +[2023-10-08 11:54:35,058][102898] Updated weights for policy 1, policy_version 3330 (0.0010) +[2023-10-08 11:54:35,427][102898] Updated weights for policy 1, policy_version 3340 (0.0009) +[2023-10-08 11:54:35,794][102898] Updated weights for policy 1, policy_version 3350 (0.0009) +[2023-10-08 11:54:36,164][102898] Updated weights for policy 1, policy_version 3360 (0.0008) +[2023-10-08 11:54:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 6881280. Throughput: 0: 1791.4, 1: 1783.9. Samples: 1721732. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:36,876][101941] Avg episode reward: [(0, '5.750'), (1, '5.130')] +[2023-10-08 11:54:38,400][102897] Updated weights for policy 0, policy_version 3370 (0.0009) +[2023-10-08 11:54:38,771][102897] Updated weights for policy 0, policy_version 3380 (0.0009) +[2023-10-08 11:54:39,142][102897] Updated weights for policy 0, policy_version 3390 (0.0007) +[2023-10-08 11:54:39,937][102898] Updated weights for policy 1, policy_version 3370 (0.0008) +[2023-10-08 11:54:40,310][102898] Updated weights for policy 1, policy_version 3380 (0.0008) +[2023-10-08 11:54:40,670][102898] Updated weights for policy 1, policy_version 3390 (0.0009) +[2023-10-08 11:54:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 6946816. Throughput: 0: 1786.6, 1: 1788.4. Samples: 1742942. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:41,876][101941] Avg episode reward: [(0, '5.640'), (1, '4.950')] +[2023-10-08 11:54:42,974][102897] Updated weights for policy 0, policy_version 3400 (0.0007) +[2023-10-08 11:54:43,352][102897] Updated weights for policy 0, policy_version 3410 (0.0007) +[2023-10-08 11:54:43,729][102897] Updated weights for policy 0, policy_version 3420 (0.0007) +[2023-10-08 11:54:44,368][102898] Updated weights for policy 1, policy_version 3400 (0.0008) +[2023-10-08 11:54:44,731][102898] Updated weights for policy 1, policy_version 3410 (0.0008) +[2023-10-08 11:54:45,105][102898] Updated weights for policy 1, policy_version 3420 (0.0007) +[2023-10-08 11:54:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 7012352. Throughput: 0: 1783.2, 1: 1778.7. Samples: 1764676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:46,876][101941] Avg episode reward: [(0, '5.180'), (1, '5.200')] +[2023-10-08 11:54:47,382][102897] Updated weights for policy 0, policy_version 3430 (0.0008) +[2023-10-08 11:54:47,753][102897] Updated weights for policy 0, policy_version 3440 (0.0009) +[2023-10-08 11:54:48,129][102897] Updated weights for policy 0, policy_version 3450 (0.0009) +[2023-10-08 11:54:48,966][102898] Updated weights for policy 1, policy_version 3430 (0.0010) +[2023-10-08 11:54:49,342][102898] Updated weights for policy 1, policy_version 3440 (0.0009) +[2023-10-08 11:54:49,712][102898] Updated weights for policy 1, policy_version 3450 (0.0010) +[2023-10-08 11:54:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7077888. Throughput: 0: 1783.9, 1: 1794.0. Samples: 1775146. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:51,875][101941] Avg episode reward: [(0, '5.220'), (1, '5.470')] +[2023-10-08 11:54:52,011][102897] Updated weights for policy 0, policy_version 3460 (0.0009) +[2023-10-08 11:54:52,392][102897] Updated weights for policy 0, policy_version 3470 (0.0009) +[2023-10-08 11:54:52,770][102897] Updated weights for policy 0, policy_version 3480 (0.0008) +[2023-10-08 11:54:53,450][102898] Updated weights for policy 1, policy_version 3460 (0.0011) +[2023-10-08 11:54:53,819][102898] Updated weights for policy 1, policy_version 3470 (0.0010) +[2023-10-08 11:54:54,176][102898] Updated weights for policy 1, policy_version 3480 (0.0008) +[2023-10-08 11:54:56,549][102897] Updated weights for policy 0, policy_version 3490 (0.0009) +[2023-10-08 11:54:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7143424. Throughput: 0: 1792.8, 1: 1778.0. Samples: 1797040. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:54:56,876][101941] Avg episode reward: [(0, '5.550'), (1, '5.850')] +[2023-10-08 11:54:56,919][102897] Updated weights for policy 0, policy_version 3500 (0.0009) +[2023-10-08 11:54:57,284][102897] Updated weights for policy 0, policy_version 3510 (0.0009) +[2023-10-08 11:54:57,656][102897] Updated weights for policy 0, policy_version 3520 (0.0008) +[2023-10-08 11:54:57,978][102898] Updated weights for policy 1, policy_version 3490 (0.0008) +[2023-10-08 11:54:58,341][102898] Updated weights for policy 1, policy_version 3500 (0.0007) +[2023-10-08 11:54:58,705][102898] Updated weights for policy 1, policy_version 3510 (0.0007) +[2023-10-08 11:54:59,068][102898] Updated weights for policy 1, policy_version 3520 (0.0007) +[2023-10-08 11:55:01,475][102897] Updated weights for policy 0, policy_version 3530 (0.0011) +[2023-10-08 11:55:01,849][102897] Updated weights for policy 0, policy_version 3540 (0.0008) +[2023-10-08 11:55:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7208960. Throughput: 0: 1806.1, 1: 1776.8. Samples: 1818770. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:55:01,876][101941] Avg episode reward: [(0, '5.600'), (1, '5.760')] +[2023-10-08 11:55:02,220][102897] Updated weights for policy 0, policy_version 3550 (0.0007) +[2023-10-08 11:55:02,758][102898] Updated weights for policy 1, policy_version 3530 (0.0011) +[2023-10-08 11:55:03,126][102898] Updated weights for policy 1, policy_version 3540 (0.0008) +[2023-10-08 11:55:03,500][102898] Updated weights for policy 1, policy_version 3550 (0.0008) +[2023-10-08 11:55:06,094][102897] Updated weights for policy 0, policy_version 3560 (0.0010) +[2023-10-08 11:55:06,462][102897] Updated weights for policy 0, policy_version 3570 (0.0008) +[2023-10-08 11:55:06,838][102897] Updated weights for policy 0, policy_version 3580 (0.0007) +[2023-10-08 11:55:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7274496. Throughput: 0: 1779.8, 1: 1782.4. Samples: 1828728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:55:06,876][101941] Avg episode reward: [(0, '5.790'), (1, '5.320')] +[2023-10-08 11:55:07,225][102898] Updated weights for policy 1, policy_version 3560 (0.0007) +[2023-10-08 11:55:07,597][102898] Updated weights for policy 1, policy_version 3570 (0.0008) +[2023-10-08 11:55:07,968][102898] Updated weights for policy 1, policy_version 3580 (0.0008) +[2023-10-08 11:55:10,748][102897] Updated weights for policy 0, policy_version 3590 (0.0009) +[2023-10-08 11:55:11,128][102897] Updated weights for policy 0, policy_version 3600 (0.0010) +[2023-10-08 11:55:11,510][102897] Updated weights for policy 0, policy_version 3610 (0.0008) +[2023-10-08 11:55:11,845][102898] Updated weights for policy 1, policy_version 3590 (0.0008) +[2023-10-08 11:55:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 7372800. Throughput: 0: 1801.0, 1: 1781.7. Samples: 1850742. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 11:55:11,875][101941] Avg episode reward: [(0, '5.350'), (1, '5.120')] +[2023-10-08 11:55:12,211][102898] Updated weights for policy 1, policy_version 3600 (0.0007) +[2023-10-08 11:55:12,579][102898] Updated weights for policy 1, policy_version 3610 (0.0007) +[2023-10-08 11:55:15,238][102897] Updated weights for policy 0, policy_version 3620 (0.0007) +[2023-10-08 11:55:15,618][102897] Updated weights for policy 0, policy_version 3630 (0.0009) +[2023-10-08 11:55:15,988][102897] Updated weights for policy 0, policy_version 3640 (0.0010) +[2023-10-08 11:55:16,335][102898] Updated weights for policy 1, policy_version 3620 (0.0007) +[2023-10-08 11:55:16,713][102898] Updated weights for policy 1, policy_version 3630 (0.0007) +[2023-10-08 11:55:16,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 7438336. Throughput: 0: 1774.0, 1: 1796.9. Samples: 1871222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:55:16,876][101941] Avg episode reward: [(0, '4.820'), (1, '5.300')] +[2023-10-08 11:55:17,087][102898] Updated weights for policy 1, policy_version 3640 (0.0007) +[2023-10-08 11:55:19,799][102897] Updated weights for policy 0, policy_version 3650 (0.0007) +[2023-10-08 11:55:20,179][102897] Updated weights for policy 0, policy_version 3660 (0.0011) +[2023-10-08 11:55:20,561][102897] Updated weights for policy 0, policy_version 3670 (0.0010) +[2023-10-08 11:55:20,794][102898] Updated weights for policy 1, policy_version 3650 (0.0007) +[2023-10-08 11:55:20,924][102897] Updated weights for policy 0, policy_version 3680 (0.0008) +[2023-10-08 11:55:21,164][102898] Updated weights for policy 1, policy_version 3660 (0.0007) +[2023-10-08 11:55:21,528][102898] Updated weights for policy 1, policy_version 3670 (0.0010) +[2023-10-08 11:55:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 7503872. Throughput: 0: 1797.3, 1: 1779.9. Samples: 1882706. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:55:21,876][101941] Avg episode reward: [(0, '5.370'), (1, '5.480')] +[2023-10-08 11:55:21,900][102898] Updated weights for policy 1, policy_version 3680 (0.0007) +[2023-10-08 11:55:24,672][102897] Updated weights for policy 0, policy_version 3690 (0.0008) +[2023-10-08 11:55:25,046][102897] Updated weights for policy 0, policy_version 3700 (0.0007) +[2023-10-08 11:55:25,415][102897] Updated weights for policy 0, policy_version 3710 (0.0010) +[2023-10-08 11:55:25,686][102898] Updated weights for policy 1, policy_version 3690 (0.0008) +[2023-10-08 11:55:26,059][102898] Updated weights for policy 1, policy_version 3700 (0.0007) +[2023-10-08 11:55:26,416][102898] Updated weights for policy 1, policy_version 3710 (0.0007) +[2023-10-08 11:55:26,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 7602176. Throughput: 0: 1766.3, 1: 1798.5. Samples: 1903354. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:55:26,876][101941] Avg episode reward: [(0, '5.830'), (1, '5.670')] +[2023-10-08 11:55:29,261][102897] Updated weights for policy 0, policy_version 3720 (0.0009) +[2023-10-08 11:55:29,637][102897] Updated weights for policy 0, policy_version 3730 (0.0008) +[2023-10-08 11:55:30,012][102897] Updated weights for policy 0, policy_version 3740 (0.0008) +[2023-10-08 11:55:30,322][102898] Updated weights for policy 1, policy_version 3720 (0.0009) +[2023-10-08 11:55:30,686][102898] Updated weights for policy 1, policy_version 3730 (0.0007) +[2023-10-08 11:55:31,053][102898] Updated weights for policy 1, policy_version 3740 (0.0009) +[2023-10-08 11:55:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 7667712. Throughput: 0: 1763.2, 1: 1781.8. Samples: 1924198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:55:31,876][101941] Avg episode reward: [(0, '5.500'), (1, '5.200')] +[2023-10-08 11:55:33,816][102897] Updated weights for policy 0, policy_version 3750 (0.0007) +[2023-10-08 11:55:34,197][102897] Updated weights for policy 0, policy_version 3760 (0.0009) +[2023-10-08 11:55:34,569][102897] Updated weights for policy 0, policy_version 3770 (0.0007) +[2023-10-08 11:55:34,772][102898] Updated weights for policy 1, policy_version 3750 (0.0008) +[2023-10-08 11:55:35,148][102898] Updated weights for policy 1, policy_version 3760 (0.0010) +[2023-10-08 11:55:35,510][102898] Updated weights for policy 1, policy_version 3770 (0.0011) +[2023-10-08 11:55:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7733248. Throughput: 0: 1771.2, 1: 1799.7. Samples: 1935834. Policy #0 lag: (min: 25.0, avg: 46.3, max: 48.0) +[2023-10-08 11:55:36,876][101941] Avg episode reward: [(0, '5.630'), (1, '5.160')] +[2023-10-08 11:55:38,235][102897] Updated weights for policy 0, policy_version 3780 (0.0008) +[2023-10-08 11:55:38,612][102897] Updated weights for policy 0, policy_version 3790 (0.0007) +[2023-10-08 11:55:38,979][102897] Updated weights for policy 0, policy_version 3800 (0.0009) +[2023-10-08 11:55:39,326][102898] Updated weights for policy 1, policy_version 3780 (0.0009) +[2023-10-08 11:55:39,691][102898] Updated weights for policy 1, policy_version 3790 (0.0007) +[2023-10-08 11:55:40,052][102898] Updated weights for policy 1, policy_version 3800 (0.0009) +[2023-10-08 11:55:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7798784. Throughput: 0: 1760.7, 1: 1774.1. Samples: 1956108. Policy #0 lag: (min: 25.0, avg: 46.3, max: 48.0) +[2023-10-08 11:55:41,876][101941] Avg episode reward: [(0, '5.770'), (1, '4.900')] +[2023-10-08 11:55:42,768][102897] Updated weights for policy 0, policy_version 3810 (0.0008) +[2023-10-08 11:55:43,139][102897] Updated weights for policy 0, policy_version 3820 (0.0009) +[2023-10-08 11:55:43,518][102897] Updated weights for policy 0, policy_version 3830 (0.0007) +[2023-10-08 11:55:43,793][102898] Updated weights for policy 1, policy_version 3810 (0.0010) +[2023-10-08 11:55:43,898][102897] Updated weights for policy 0, policy_version 3840 (0.0008) +[2023-10-08 11:55:44,153][102898] Updated weights for policy 1, policy_version 3820 (0.0009) +[2023-10-08 11:55:44,517][102898] Updated weights for policy 1, policy_version 3830 (0.0011) +[2023-10-08 11:55:44,878][102898] Updated weights for policy 1, policy_version 3840 (0.0009) +[2023-10-08 11:55:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 7864320. Throughput: 0: 1766.0, 1: 1776.5. Samples: 1978182. Policy #0 lag: (min: 29.0, avg: 39.4, max: 61.0) +[2023-10-08 11:55:46,877][101941] Avg episode reward: [(0, '5.880'), (1, '5.090')] +[2023-10-08 11:55:47,916][102897] Updated weights for policy 0, policy_version 3850 (0.0008) +[2023-10-08 11:55:48,297][102897] Updated weights for policy 0, policy_version 3860 (0.0008) +[2023-10-08 11:55:48,628][102898] Updated weights for policy 1, policy_version 3850 (0.0009) +[2023-10-08 11:55:48,676][102897] Updated weights for policy 0, policy_version 3870 (0.0007) +[2023-10-08 11:55:49,004][102898] Updated weights for policy 1, policy_version 3860 (0.0007) +[2023-10-08 11:55:49,365][102898] Updated weights for policy 1, policy_version 3870 (0.0008) +[2023-10-08 11:55:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7929856. Throughput: 0: 1760.0, 1: 1774.6. Samples: 1987784. Policy #0 lag: (min: 29.0, avg: 39.4, max: 61.0) +[2023-10-08 11:55:51,876][101941] Avg episode reward: [(0, '6.220'), (1, '5.320')] +[2023-10-08 11:55:52,438][102897] Updated weights for policy 0, policy_version 3880 (0.0008) +[2023-10-08 11:55:52,821][102897] Updated weights for policy 0, policy_version 3890 (0.0009) +[2023-10-08 11:55:52,975][102898] Updated weights for policy 1, policy_version 3880 (0.0007) +[2023-10-08 11:55:53,193][102897] Updated weights for policy 0, policy_version 3900 (0.0007) +[2023-10-08 11:55:53,341][102898] Updated weights for policy 1, policy_version 3890 (0.0008) +[2023-10-08 11:55:53,712][102898] Updated weights for policy 1, policy_version 3900 (0.0008) +[2023-10-08 11:55:56,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 7995392. Throughput: 0: 1764.4, 1: 1781.2. Samples: 2010298. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 11:55:56,875][101941] Avg episode reward: [(0, '6.040'), (1, '4.820')] +[2023-10-08 11:55:57,077][102897] Updated weights for policy 0, policy_version 3910 (0.0008) +[2023-10-08 11:55:57,453][102897] Updated weights for policy 0, policy_version 3920 (0.0008) +[2023-10-08 11:55:57,526][102898] Updated weights for policy 1, policy_version 3910 (0.0008) +[2023-10-08 11:55:57,824][102897] Updated weights for policy 0, policy_version 3930 (0.0009) +[2023-10-08 11:55:57,902][102898] Updated weights for policy 1, policy_version 3920 (0.0007) +[2023-10-08 11:55:58,273][102898] Updated weights for policy 1, policy_version 3930 (0.0009) +[2023-10-08 11:56:01,613][102897] Updated weights for policy 0, policy_version 3940 (0.0009) +[2023-10-08 11:56:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 8060928. Throughput: 0: 1795.3, 1: 1784.7. Samples: 2032322. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 11:56:01,876][101941] Avg episode reward: [(0, '5.630'), (1, '5.060')] +[2023-10-08 11:56:01,977][102897] Updated weights for policy 0, policy_version 3950 (0.0008) +[2023-10-08 11:56:02,298][102898] Updated weights for policy 1, policy_version 3940 (0.0007) +[2023-10-08 11:56:02,354][102897] Updated weights for policy 0, policy_version 3960 (0.0008) +[2023-10-08 11:56:02,671][102898] Updated weights for policy 1, policy_version 3950 (0.0009) +[2023-10-08 11:56:03,045][102898] Updated weights for policy 1, policy_version 3960 (0.0008) +[2023-10-08 11:56:06,183][102897] Updated weights for policy 0, policy_version 3970 (0.0007) +[2023-10-08 11:56:06,563][102897] Updated weights for policy 0, policy_version 3980 (0.0008) +[2023-10-08 11:56:06,843][102898] Updated weights for policy 1, policy_version 3970 (0.0007) +[2023-10-08 11:56:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 8126464. Throughput: 0: 1762.1, 1: 1775.5. Samples: 2041900. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 11:56:06,875][101941] Avg episode reward: [(0, '5.470'), (1, '5.590')] +[2023-10-08 11:56:06,935][102897] Updated weights for policy 0, policy_version 3990 (0.0008) +[2023-10-08 11:56:07,220][102898] Updated weights for policy 1, policy_version 3980 (0.0008) +[2023-10-08 11:56:07,305][102897] Updated weights for policy 0, policy_version 4000 (0.0009) +[2023-10-08 11:56:07,577][102898] Updated weights for policy 1, policy_version 3990 (0.0007) +[2023-10-08 11:56:07,944][102898] Updated weights for policy 1, policy_version 4000 (0.0008) +[2023-10-08 11:56:11,097][102897] Updated weights for policy 0, policy_version 4010 (0.0007) +[2023-10-08 11:56:11,468][102897] Updated weights for policy 0, policy_version 4020 (0.0007) +[2023-10-08 11:56:11,807][102898] Updated weights for policy 1, policy_version 4010 (0.0008) +[2023-10-08 11:56:11,836][102897] Updated weights for policy 0, policy_version 4030 (0.0007) +[2023-10-08 11:56:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 8192000. Throughput: 0: 1792.6, 1: 1775.1. Samples: 2063902. Policy #0 lag: (min: 31.0, avg: 38.1, max: 63.0) +[2023-10-08 11:56:11,875][101941] Avg episode reward: [(0, '5.250'), (1, '5.470')] +[2023-10-08 11:56:12,168][102898] Updated weights for policy 1, policy_version 4020 (0.0009) +[2023-10-08 11:56:12,535][102898] Updated weights for policy 1, policy_version 4030 (0.0009) +[2023-10-08 11:56:15,412][102897] Updated weights for policy 0, policy_version 4040 (0.0007) +[2023-10-08 11:56:15,778][102897] Updated weights for policy 0, policy_version 4050 (0.0008) +[2023-10-08 11:56:16,148][102897] Updated weights for policy 0, policy_version 4060 (0.0007) +[2023-10-08 11:56:16,275][102898] Updated weights for policy 1, policy_version 4040 (0.0007) +[2023-10-08 11:56:16,643][102898] Updated weights for policy 1, policy_version 4050 (0.0007) +[2023-10-08 11:56:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 8290304. Throughput: 0: 1770.4, 1: 1792.1. Samples: 2084510. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:56:16,875][101941] Avg episode reward: [(0, '4.930'), (1, '5.440')] +[2023-10-08 11:56:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000004064_4161536.pth... +[2023-10-08 11:56:16,923][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000002400_2457600.pth +[2023-10-08 11:56:17,019][102898] Updated weights for policy 1, policy_version 4060 (0.0007) +[2023-10-08 11:56:17,163][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000004064_4161536.pth... +[2023-10-08 11:56:17,192][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000002368_2424832.pth +[2023-10-08 11:56:20,003][102897] Updated weights for policy 0, policy_version 4070 (0.0008) +[2023-10-08 11:56:20,367][102897] Updated weights for policy 0, policy_version 4080 (0.0007) +[2023-10-08 11:56:20,740][102897] Updated weights for policy 0, policy_version 4090 (0.0007) +[2023-10-08 11:56:20,900][102898] Updated weights for policy 1, policy_version 4070 (0.0008) +[2023-10-08 11:56:21,258][102898] Updated weights for policy 1, policy_version 4080 (0.0009) +[2023-10-08 11:56:21,621][102898] Updated weights for policy 1, policy_version 4090 (0.0007) +[2023-10-08 11:56:21,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 8388608. Throughput: 0: 1793.3, 1: 1768.3. Samples: 2096106. Policy #0 lag: (min: 2.0, avg: 3.5, max: 28.0) +[2023-10-08 11:56:21,875][101941] Avg episode reward: [(0, '5.420'), (1, '5.200')] +[2023-10-08 11:56:24,492][102897] Updated weights for policy 0, policy_version 4100 (0.0008) +[2023-10-08 11:56:24,859][102897] Updated weights for policy 0, policy_version 4110 (0.0007) +[2023-10-08 11:56:25,229][102897] Updated weights for policy 0, policy_version 4120 (0.0007) +[2023-10-08 11:56:25,324][102898] Updated weights for policy 1, policy_version 4100 (0.0009) +[2023-10-08 11:56:25,694][102898] Updated weights for policy 1, policy_version 4110 (0.0008) +[2023-10-08 11:56:26,060][102898] Updated weights for policy 1, policy_version 4120 (0.0009) +[2023-10-08 11:56:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 8454144. Throughput: 0: 1776.9, 1: 1799.2. Samples: 2117032. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 11:56:26,875][101941] Avg episode reward: [(0, '5.700'), (1, '5.230')] +[2023-10-08 11:56:28,949][102897] Updated weights for policy 0, policy_version 4130 (0.0008) +[2023-10-08 11:56:29,315][102897] Updated weights for policy 0, policy_version 4140 (0.0007) +[2023-10-08 11:56:29,690][102897] Updated weights for policy 0, policy_version 4150 (0.0007) +[2023-10-08 11:56:29,861][102898] Updated weights for policy 1, policy_version 4130 (0.0007) +[2023-10-08 11:56:30,062][102897] Updated weights for policy 0, policy_version 4160 (0.0008) +[2023-10-08 11:56:30,228][102898] Updated weights for policy 1, policy_version 4140 (0.0007) +[2023-10-08 11:56:30,603][102898] Updated weights for policy 1, policy_version 4150 (0.0008) +[2023-10-08 11:56:30,968][102898] Updated weights for policy 1, policy_version 4160 (0.0007) +[2023-10-08 11:56:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 8519680. Throughput: 0: 1779.8, 1: 1775.4. Samples: 2138168. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 11:56:31,876][101941] Avg episode reward: [(0, '5.650'), (1, '5.740')] +[2023-10-08 11:56:33,786][102897] Updated weights for policy 0, policy_version 4170 (0.0009) +[2023-10-08 11:56:34,154][102897] Updated weights for policy 0, policy_version 4180 (0.0008) +[2023-10-08 11:56:34,527][102897] Updated weights for policy 0, policy_version 4190 (0.0007) +[2023-10-08 11:56:34,722][102898] Updated weights for policy 1, policy_version 4170 (0.0008) +[2023-10-08 11:56:35,092][102898] Updated weights for policy 1, policy_version 4180 (0.0008) +[2023-10-08 11:56:35,464][102898] Updated weights for policy 1, policy_version 4190 (0.0009) +[2023-10-08 11:56:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 8585216. Throughput: 0: 1791.2, 1: 1807.3. Samples: 2149720. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 11:56:36,876][101941] Avg episode reward: [(0, '6.280'), (1, '6.020')] +[2023-10-08 11:56:38,212][102897] Updated weights for policy 0, policy_version 4200 (0.0010) +[2023-10-08 11:56:38,588][102897] Updated weights for policy 0, policy_version 4210 (0.0011) +[2023-10-08 11:56:38,960][102897] Updated weights for policy 0, policy_version 4220 (0.0009) +[2023-10-08 11:56:39,303][102898] Updated weights for policy 1, policy_version 4200 (0.0008) +[2023-10-08 11:56:39,669][102898] Updated weights for policy 1, policy_version 4210 (0.0007) +[2023-10-08 11:56:40,049][102898] Updated weights for policy 1, policy_version 4220 (0.0007) +[2023-10-08 11:56:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 8650752. Throughput: 0: 1785.3, 1: 1772.3. Samples: 2170392. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 11:56:41,876][101941] Avg episode reward: [(0, '6.310'), (1, '6.190')] +[2023-10-08 11:56:42,737][102897] Updated weights for policy 0, policy_version 4230 (0.0007) +[2023-10-08 11:56:43,115][102897] Updated weights for policy 0, policy_version 4240 (0.0009) +[2023-10-08 11:56:43,478][102897] Updated weights for policy 0, policy_version 4250 (0.0008) +[2023-10-08 11:56:43,729][102898] Updated weights for policy 1, policy_version 4230 (0.0007) +[2023-10-08 11:56:44,097][102898] Updated weights for policy 1, policy_version 4240 (0.0010) +[2023-10-08 11:56:44,464][102898] Updated weights for policy 1, policy_version 4250 (0.0011) +[2023-10-08 11:56:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.6, 300 sec: 14218.0). Total num frames: 8716288. Throughput: 0: 1790.0, 1: 1780.2. Samples: 2192984. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:56:46,875][101941] Avg episode reward: [(0, '5.560'), (1, '6.200')] +[2023-10-08 11:56:47,099][102897] Updated weights for policy 0, policy_version 4260 (0.0008) +[2023-10-08 11:56:47,482][102897] Updated weights for policy 0, policy_version 4270 (0.0009) +[2023-10-08 11:56:47,844][102897] Updated weights for policy 0, policy_version 4280 (0.0009) +[2023-10-08 11:56:48,176][102898] Updated weights for policy 1, policy_version 4260 (0.0010) +[2023-10-08 11:56:48,550][102898] Updated weights for policy 1, policy_version 4270 (0.0010) +[2023-10-08 11:56:48,925][102898] Updated weights for policy 1, policy_version 4280 (0.0009) +[2023-10-08 11:56:51,620][102897] Updated weights for policy 0, policy_version 4290 (0.0007) +[2023-10-08 11:56:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 8781824. Throughput: 0: 1791.0, 1: 1783.8. Samples: 2202766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:56:51,876][101941] Avg episode reward: [(0, '5.550'), (1, '5.710')] +[2023-10-08 11:56:51,990][102897] Updated weights for policy 0, policy_version 4300 (0.0009) +[2023-10-08 11:56:52,358][102897] Updated weights for policy 0, policy_version 4310 (0.0007) +[2023-10-08 11:56:52,731][102897] Updated weights for policy 0, policy_version 4320 (0.0008) +[2023-10-08 11:56:52,769][102898] Updated weights for policy 1, policy_version 4290 (0.0010) +[2023-10-08 11:56:53,136][102898] Updated weights for policy 1, policy_version 4300 (0.0009) +[2023-10-08 11:56:53,504][102898] Updated weights for policy 1, policy_version 4310 (0.0010) +[2023-10-08 11:56:53,872][102898] Updated weights for policy 1, policy_version 4320 (0.0010) +[2023-10-08 11:56:56,440][102897] Updated weights for policy 0, policy_version 4330 (0.0007) +[2023-10-08 11:56:56,814][102897] Updated weights for policy 0, policy_version 4340 (0.0010) +[2023-10-08 11:56:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 8847360. Throughput: 0: 1799.5, 1: 1788.1. Samples: 2225344. Policy #0 lag: (min: 0.0, avg: 27.9, max: 32.0) +[2023-10-08 11:56:56,876][101941] Avg episode reward: [(0, '5.560'), (1, '5.330')] +[2023-10-08 11:56:57,186][102897] Updated weights for policy 0, policy_version 4350 (0.0010) +[2023-10-08 11:56:57,676][102898] Updated weights for policy 1, policy_version 4330 (0.0009) +[2023-10-08 11:56:58,048][102898] Updated weights for policy 1, policy_version 4340 (0.0009) +[2023-10-08 11:56:58,428][102898] Updated weights for policy 1, policy_version 4350 (0.0009) +[2023-10-08 11:57:00,885][102897] Updated weights for policy 0, policy_version 4360 (0.0008) +[2023-10-08 11:57:01,269][102897] Updated weights for policy 0, policy_version 4370 (0.0009) +[2023-10-08 11:57:01,639][102897] Updated weights for policy 0, policy_version 4380 (0.0010) +[2023-10-08 11:57:01,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 8945664. Throughput: 0: 1807.5, 1: 1798.2. Samples: 2246768. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:57:01,875][101941] Avg episode reward: [(0, '5.660'), (1, '5.350')] +[2023-10-08 11:57:02,134][102898] Updated weights for policy 1, policy_version 4360 (0.0010) +[2023-10-08 11:57:02,505][102898] Updated weights for policy 1, policy_version 4370 (0.0007) +[2023-10-08 11:57:02,866][102898] Updated weights for policy 1, policy_version 4380 (0.0008) +[2023-10-08 11:57:05,401][102897] Updated weights for policy 0, policy_version 4390 (0.0007) +[2023-10-08 11:57:05,776][102897] Updated weights for policy 0, policy_version 4400 (0.0009) +[2023-10-08 11:57:06,154][102897] Updated weights for policy 0, policy_version 4410 (0.0007) +[2023-10-08 11:57:06,623][102898] Updated weights for policy 1, policy_version 4390 (0.0008) +[2023-10-08 11:57:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 9011200. Throughput: 0: 1801.5, 1: 1791.4. Samples: 2257786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:57:06,875][101941] Avg episode reward: [(0, '6.170'), (1, '4.880')] +[2023-10-08 11:57:06,991][102898] Updated weights for policy 1, policy_version 4400 (0.0007) +[2023-10-08 11:57:07,359][102898] Updated weights for policy 1, policy_version 4410 (0.0007) +[2023-10-08 11:57:09,758][102897] Updated weights for policy 0, policy_version 4420 (0.0007) +[2023-10-08 11:57:10,125][102897] Updated weights for policy 0, policy_version 4430 (0.0007) +[2023-10-08 11:57:10,504][102897] Updated weights for policy 0, policy_version 4440 (0.0009) +[2023-10-08 11:57:11,175][102898] Updated weights for policy 1, policy_version 4420 (0.0009) +[2023-10-08 11:57:11,538][102898] Updated weights for policy 1, policy_version 4430 (0.0010) +[2023-10-08 11:57:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 9076736. Throughput: 0: 1805.4, 1: 1794.0. Samples: 2279008. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:57:11,875][101941] Avg episode reward: [(0, '6.360'), (1, '4.510')] +[2023-10-08 11:57:11,920][102898] Updated weights for policy 1, policy_version 4440 (0.0009) +[2023-10-08 11:57:14,284][102897] Updated weights for policy 0, policy_version 4450 (0.0009) +[2023-10-08 11:57:14,654][102897] Updated weights for policy 0, policy_version 4460 (0.0010) +[2023-10-08 11:57:15,030][102897] Updated weights for policy 0, policy_version 4470 (0.0011) +[2023-10-08 11:57:15,408][102897] Updated weights for policy 0, policy_version 4480 (0.0010) +[2023-10-08 11:57:15,643][102898] Updated weights for policy 1, policy_version 4450 (0.0010) +[2023-10-08 11:57:16,026][102898] Updated weights for policy 1, policy_version 4460 (0.0008) +[2023-10-08 11:57:16,396][102898] Updated weights for policy 1, policy_version 4470 (0.0008) +[2023-10-08 11:57:16,772][102898] Updated weights for policy 1, policy_version 4480 (0.0008) +[2023-10-08 11:57:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 9175040. Throughput: 0: 1799.3, 1: 1793.0. Samples: 2299824. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:57:16,876][101941] Avg episode reward: [(0, '5.970'), (1, '5.010')] +[2023-10-08 11:57:19,242][102897] Updated weights for policy 0, policy_version 4490 (0.0010) +[2023-10-08 11:57:19,615][102897] Updated weights for policy 0, policy_version 4500 (0.0009) +[2023-10-08 11:57:19,982][102897] Updated weights for policy 0, policy_version 4510 (0.0008) +[2023-10-08 11:57:20,539][102898] Updated weights for policy 1, policy_version 4490 (0.0008) +[2023-10-08 11:57:20,907][102898] Updated weights for policy 1, policy_version 4500 (0.0010) +[2023-10-08 11:57:21,283][102898] Updated weights for policy 1, policy_version 4510 (0.0009) +[2023-10-08 11:57:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 9240576. Throughput: 0: 1805.2, 1: 1780.8. Samples: 2311090. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:57:21,875][101941] Avg episode reward: [(0, '5.520'), (1, '4.830')] +[2023-10-08 11:57:23,828][102897] Updated weights for policy 0, policy_version 4520 (0.0007) +[2023-10-08 11:57:24,194][102897] Updated weights for policy 0, policy_version 4530 (0.0008) +[2023-10-08 11:57:24,571][102897] Updated weights for policy 0, policy_version 4540 (0.0007) +[2023-10-08 11:57:24,941][102898] Updated weights for policy 1, policy_version 4520 (0.0008) +[2023-10-08 11:57:25,303][102898] Updated weights for policy 1, policy_version 4530 (0.0010) +[2023-10-08 11:57:25,678][102898] Updated weights for policy 1, policy_version 4540 (0.0010) +[2023-10-08 11:57:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 9306112. Throughput: 0: 1788.1, 1: 1798.4. Samples: 2331788. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 11:57:26,876][101941] Avg episode reward: [(0, '5.600'), (1, '4.600')] +[2023-10-08 11:57:28,337][102897] Updated weights for policy 0, policy_version 4550 (0.0009) +[2023-10-08 11:57:28,711][102897] Updated weights for policy 0, policy_version 4560 (0.0007) +[2023-10-08 11:57:29,093][102897] Updated weights for policy 0, policy_version 4570 (0.0007) +[2023-10-08 11:57:29,534][102898] Updated weights for policy 1, policy_version 4550 (0.0010) +[2023-10-08 11:57:29,912][102898] Updated weights for policy 1, policy_version 4560 (0.0009) +[2023-10-08 11:57:30,272][102898] Updated weights for policy 1, policy_version 4570 (0.0007) +[2023-10-08 11:57:31,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 9371648. Throughput: 0: 1787.0, 1: 1783.4. Samples: 2353650. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 11:57:31,876][101941] Avg episode reward: [(0, '5.530'), (1, '4.900')] +[2023-10-08 11:57:32,889][102897] Updated weights for policy 0, policy_version 4580 (0.0009) +[2023-10-08 11:57:33,260][102897] Updated weights for policy 0, policy_version 4590 (0.0007) +[2023-10-08 11:57:33,631][102897] Updated weights for policy 0, policy_version 4600 (0.0007) +[2023-10-08 11:57:33,950][102898] Updated weights for policy 1, policy_version 4580 (0.0007) +[2023-10-08 11:57:34,323][102898] Updated weights for policy 1, policy_version 4590 (0.0009) +[2023-10-08 11:57:34,691][102898] Updated weights for policy 1, policy_version 4600 (0.0007) +[2023-10-08 11:57:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 9437184. Throughput: 0: 1784.7, 1: 1798.0. Samples: 2363986. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 11:57:36,876][101941] Avg episode reward: [(0, '6.100'), (1, '5.240')] +[2023-10-08 11:57:37,407][102897] Updated weights for policy 0, policy_version 4610 (0.0008) +[2023-10-08 11:57:37,779][102897] Updated weights for policy 0, policy_version 4620 (0.0008) +[2023-10-08 11:57:38,162][102897] Updated weights for policy 0, policy_version 4630 (0.0009) +[2023-10-08 11:57:38,411][102898] Updated weights for policy 1, policy_version 4610 (0.0007) +[2023-10-08 11:57:38,531][102897] Updated weights for policy 0, policy_version 4640 (0.0008) +[2023-10-08 11:57:38,778][102898] Updated weights for policy 1, policy_version 4620 (0.0009) +[2023-10-08 11:57:39,145][102898] Updated weights for policy 1, policy_version 4630 (0.0008) +[2023-10-08 11:57:39,518][102898] Updated weights for policy 1, policy_version 4640 (0.0007) +[2023-10-08 11:57:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 9502720. Throughput: 0: 1776.8, 1: 1779.2. Samples: 2385364. Policy #0 lag: (min: 10.0, avg: 10.0, max: 10.0) +[2023-10-08 11:57:41,876][101941] Avg episode reward: [(0, '6.400'), (1, '5.480')] +[2023-10-08 11:57:42,391][102897] Updated weights for policy 0, policy_version 4650 (0.0008) +[2023-10-08 11:57:42,762][102897] Updated weights for policy 0, policy_version 4660 (0.0007) +[2023-10-08 11:57:43,130][102897] Updated weights for policy 0, policy_version 4670 (0.0007) +[2023-10-08 11:57:43,315][102898] Updated weights for policy 1, policy_version 4650 (0.0009) +[2023-10-08 11:57:43,684][102898] Updated weights for policy 1, policy_version 4660 (0.0008) +[2023-10-08 11:57:44,047][102898] Updated weights for policy 1, policy_version 4670 (0.0008) +[2023-10-08 11:57:46,823][102897] Updated weights for policy 0, policy_version 4680 (0.0007) +[2023-10-08 11:57:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 9568256. Throughput: 0: 1799.2, 1: 1777.9. Samples: 2407738. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 11:57:46,876][101941] Avg episode reward: [(0, '6.370'), (1, '5.550')] +[2023-10-08 11:57:47,202][102897] Updated weights for policy 0, policy_version 4690 (0.0007) +[2023-10-08 11:57:47,581][102897] Updated weights for policy 0, policy_version 4700 (0.0007) +[2023-10-08 11:57:47,974][102898] Updated weights for policy 1, policy_version 4680 (0.0009) +[2023-10-08 11:57:48,345][102898] Updated weights for policy 1, policy_version 4690 (0.0010) +[2023-10-08 11:57:48,710][102898] Updated weights for policy 1, policy_version 4700 (0.0007) +[2023-10-08 11:57:51,254][102897] Updated weights for policy 0, policy_version 4710 (0.0010) +[2023-10-08 11:57:51,629][102897] Updated weights for policy 0, policy_version 4720 (0.0009) +[2023-10-08 11:57:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 9633792. Throughput: 0: 1774.5, 1: 1775.6. Samples: 2417540. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 11:57:51,876][101941] Avg episode reward: [(0, '6.480'), (1, '5.040')] +[2023-10-08 11:57:51,998][102897] Updated weights for policy 0, policy_version 4730 (0.0007) +[2023-10-08 11:57:52,221][102634] Saving new best policy, reward=6.480! +[2023-10-08 11:57:52,353][102898] Updated weights for policy 1, policy_version 4710 (0.0008) +[2023-10-08 11:57:52,720][102898] Updated weights for policy 1, policy_version 4720 (0.0008) +[2023-10-08 11:57:53,089][102898] Updated weights for policy 1, policy_version 4730 (0.0009) +[2023-10-08 11:57:55,704][102897] Updated weights for policy 0, policy_version 4740 (0.0008) +[2023-10-08 11:57:56,077][102897] Updated weights for policy 0, policy_version 4750 (0.0009) +[2023-10-08 11:57:56,443][102897] Updated weights for policy 0, policy_version 4760 (0.0008) +[2023-10-08 11:57:56,819][102898] Updated weights for policy 1, policy_version 4740 (0.0008) +[2023-10-08 11:57:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 9732096. Throughput: 0: 1801.5, 1: 1776.8. Samples: 2440032. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:57:56,876][101941] Avg episode reward: [(0, '6.150'), (1, '5.390')] +[2023-10-08 11:57:57,178][102898] Updated weights for policy 1, policy_version 4750 (0.0008) +[2023-10-08 11:57:57,547][102898] Updated weights for policy 1, policy_version 4760 (0.0009) +[2023-10-08 11:58:00,117][102897] Updated weights for policy 0, policy_version 4770 (0.0009) +[2023-10-08 11:58:00,483][102897] Updated weights for policy 0, policy_version 4780 (0.0010) +[2023-10-08 11:58:00,861][102897] Updated weights for policy 0, policy_version 4790 (0.0007) +[2023-10-08 11:58:01,133][102898] Updated weights for policy 1, policy_version 4770 (0.0008) +[2023-10-08 11:58:01,233][102897] Updated weights for policy 0, policy_version 4800 (0.0008) +[2023-10-08 11:58:01,491][102898] Updated weights for policy 1, policy_version 4780 (0.0009) +[2023-10-08 11:58:01,861][102898] Updated weights for policy 1, policy_version 4790 (0.0009) +[2023-10-08 11:58:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 9797632. Throughput: 0: 1778.0, 1: 1798.8. Samples: 2460784. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 11:58:01,875][101941] Avg episode reward: [(0, '5.360'), (1, '5.850')] +[2023-10-08 11:58:02,229][102898] Updated weights for policy 1, policy_version 4800 (0.0007) +[2023-10-08 11:58:05,073][102897] Updated weights for policy 0, policy_version 4810 (0.0007) +[2023-10-08 11:58:05,450][102897] Updated weights for policy 0, policy_version 4820 (0.0008) +[2023-10-08 11:58:05,824][102897] Updated weights for policy 0, policy_version 4830 (0.0009) +[2023-10-08 11:58:06,206][102898] Updated weights for policy 1, policy_version 4810 (0.0007) +[2023-10-08 11:58:06,570][102898] Updated weights for policy 1, policy_version 4820 (0.0008) +[2023-10-08 11:58:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 9863168. Throughput: 0: 1794.6, 1: 1786.8. Samples: 2472252. Policy #0 lag: (min: 7.0, avg: 7.0, max: 7.0) +[2023-10-08 11:58:06,876][101941] Avg episode reward: [(0, '5.520'), (1, '5.200')] +[2023-10-08 11:58:06,938][102898] Updated weights for policy 1, policy_version 4830 (0.0008) +[2023-10-08 11:58:09,412][102897] Updated weights for policy 0, policy_version 4840 (0.0008) +[2023-10-08 11:58:09,786][102897] Updated weights for policy 0, policy_version 4850 (0.0008) +[2023-10-08 11:58:10,170][102897] Updated weights for policy 0, policy_version 4860 (0.0010) +[2023-10-08 11:58:10,685][102898] Updated weights for policy 1, policy_version 4840 (0.0007) +[2023-10-08 11:58:11,059][102898] Updated weights for policy 1, policy_version 4850 (0.0010) +[2023-10-08 11:58:11,426][102898] Updated weights for policy 1, policy_version 4860 (0.0010) +[2023-10-08 11:58:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 9961472. Throughput: 0: 1787.5, 1: 1794.9. Samples: 2492996. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 11:58:11,876][101941] Avg episode reward: [(0, '5.600'), (1, '5.060')] +[2023-10-08 11:58:13,938][102897] Updated weights for policy 0, policy_version 4870 (0.0009) +[2023-10-08 11:58:14,307][102897] Updated weights for policy 0, policy_version 4880 (0.0011) +[2023-10-08 11:58:14,675][102897] Updated weights for policy 0, policy_version 4890 (0.0010) +[2023-10-08 11:58:15,294][102898] Updated weights for policy 1, policy_version 4870 (0.0008) +[2023-10-08 11:58:15,674][102898] Updated weights for policy 1, policy_version 4880 (0.0007) +[2023-10-08 11:58:16,046][102898] Updated weights for policy 1, policy_version 4890 (0.0007) +[2023-10-08 11:58:16,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 10027008. Throughput: 0: 1786.4, 1: 1779.9. Samples: 2514132. Policy #0 lag: (min: 12.0, avg: 12.0, max: 12.0) +[2023-10-08 11:58:16,876][101941] Avg episode reward: [(0, '5.770'), (1, '5.870')] +[2023-10-08 11:58:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000004896_5013504.pth... +[2023-10-08 11:58:16,888][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000004896_5013504.pth... +[2023-10-08 11:58:16,930][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000003232_3309568.pth +[2023-10-08 11:58:16,930][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000003232_3309568.pth +[2023-10-08 11:58:18,437][102897] Updated weights for policy 0, policy_version 4900 (0.0010) +[2023-10-08 11:58:18,803][102897] Updated weights for policy 0, policy_version 4910 (0.0010) +[2023-10-08 11:58:19,189][102897] Updated weights for policy 0, policy_version 4920 (0.0008) +[2023-10-08 11:58:19,857][102898] Updated weights for policy 1, policy_version 4900 (0.0009) +[2023-10-08 11:58:20,226][102898] Updated weights for policy 1, policy_version 4910 (0.0009) +[2023-10-08 11:58:20,600][102898] Updated weights for policy 1, policy_version 4920 (0.0009) +[2023-10-08 11:58:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 10092544. Throughput: 0: 1794.7, 1: 1793.8. Samples: 2525470. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 11:58:21,876][101941] Avg episode reward: [(0, '5.740'), (1, '5.190')] +[2023-10-08 11:58:23,100][102897] Updated weights for policy 0, policy_version 4930 (0.0007) +[2023-10-08 11:58:23,474][102897] Updated weights for policy 0, policy_version 4940 (0.0007) +[2023-10-08 11:58:23,847][102897] Updated weights for policy 0, policy_version 4950 (0.0007) +[2023-10-08 11:58:24,218][102897] Updated weights for policy 0, policy_version 4960 (0.0007) +[2023-10-08 11:58:24,486][102898] Updated weights for policy 1, policy_version 4930 (0.0008) +[2023-10-08 11:58:24,856][102898] Updated weights for policy 1, policy_version 4940 (0.0007) +[2023-10-08 11:58:25,221][102898] Updated weights for policy 1, policy_version 4950 (0.0007) +[2023-10-08 11:58:25,589][102898] Updated weights for policy 1, policy_version 4960 (0.0009) +[2023-10-08 11:58:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 10158080. Throughput: 0: 1793.1, 1: 1782.4. Samples: 2546258. Policy #0 lag: (min: 31.0, avg: 34.4, max: 63.0) +[2023-10-08 11:58:26,876][101941] Avg episode reward: [(0, '5.540'), (1, '4.710')] +[2023-10-08 11:58:27,975][102897] Updated weights for policy 0, policy_version 4970 (0.0009) +[2023-10-08 11:58:28,347][102897] Updated weights for policy 0, policy_version 4980 (0.0009) +[2023-10-08 11:58:28,726][102897] Updated weights for policy 0, policy_version 4990 (0.0010) +[2023-10-08 11:58:29,269][102898] Updated weights for policy 1, policy_version 4970 (0.0008) +[2023-10-08 11:58:29,637][102898] Updated weights for policy 1, policy_version 4980 (0.0007) +[2023-10-08 11:58:30,004][102898] Updated weights for policy 1, policy_version 4990 (0.0007) +[2023-10-08 11:58:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 10223616. Throughput: 0: 1792.0, 1: 1778.7. Samples: 2568420. Policy #0 lag: (min: 8.0, avg: 30.6, max: 40.0) +[2023-10-08 11:58:31,876][101941] Avg episode reward: [(0, '5.560'), (1, '5.350')] +[2023-10-08 11:58:32,544][102897] Updated weights for policy 0, policy_version 5000 (0.0010) +[2023-10-08 11:58:32,915][102897] Updated weights for policy 0, policy_version 5010 (0.0010) +[2023-10-08 11:58:33,293][102897] Updated weights for policy 0, policy_version 5020 (0.0008) +[2023-10-08 11:58:33,692][102898] Updated weights for policy 1, policy_version 5000 (0.0007) +[2023-10-08 11:58:34,075][102898] Updated weights for policy 1, policy_version 5010 (0.0010) +[2023-10-08 11:58:34,440][102898] Updated weights for policy 1, policy_version 5020 (0.0007) +[2023-10-08 11:58:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 10289152. Throughput: 0: 1792.2, 1: 1783.4. Samples: 2578440. Policy #0 lag: (min: 8.0, avg: 30.6, max: 40.0) +[2023-10-08 11:58:36,876][101941] Avg episode reward: [(0, '5.610'), (1, '5.320')] +[2023-10-08 11:58:36,927][102897] Updated weights for policy 0, policy_version 5030 (0.0009) +[2023-10-08 11:58:37,307][102897] Updated weights for policy 0, policy_version 5040 (0.0007) +[2023-10-08 11:58:37,680][102897] Updated weights for policy 0, policy_version 5050 (0.0007) +[2023-10-08 11:58:38,268][102898] Updated weights for policy 1, policy_version 5030 (0.0007) +[2023-10-08 11:58:38,649][102898] Updated weights for policy 1, policy_version 5040 (0.0008) +[2023-10-08 11:58:39,011][102898] Updated weights for policy 1, policy_version 5050 (0.0007) +[2023-10-08 11:58:41,491][102897] Updated weights for policy 0, policy_version 5060 (0.0008) +[2023-10-08 11:58:41,864][102897] Updated weights for policy 0, policy_version 5070 (0.0009) +[2023-10-08 11:58:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 10354688. Throughput: 0: 1787.0, 1: 1775.6. Samples: 2600348. Policy #0 lag: (min: 27.0, avg: 31.6, max: 59.0) +[2023-10-08 11:58:41,876][101941] Avg episode reward: [(0, '5.560'), (1, '4.900')] +[2023-10-08 11:58:42,244][102897] Updated weights for policy 0, policy_version 5080 (0.0010) +[2023-10-08 11:58:42,878][102898] Updated weights for policy 1, policy_version 5060 (0.0009) +[2023-10-08 11:58:43,247][102898] Updated weights for policy 1, policy_version 5070 (0.0008) +[2023-10-08 11:58:43,619][102898] Updated weights for policy 1, policy_version 5080 (0.0007) +[2023-10-08 11:58:45,946][102897] Updated weights for policy 0, policy_version 5090 (0.0010) +[2023-10-08 11:58:46,308][102897] Updated weights for policy 0, policy_version 5100 (0.0009) +[2023-10-08 11:58:46,686][102897] Updated weights for policy 0, policy_version 5110 (0.0009) +[2023-10-08 11:58:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 10420224. Throughput: 0: 1806.0, 1: 1778.0. Samples: 2622066. Policy #0 lag: (min: 27.0, avg: 31.6, max: 59.0) +[2023-10-08 11:58:46,875][101941] Avg episode reward: [(0, '6.100'), (1, '5.140')] +[2023-10-08 11:58:47,062][102897] Updated weights for policy 0, policy_version 5120 (0.0009) +[2023-10-08 11:58:47,433][102898] Updated weights for policy 1, policy_version 5090 (0.0008) +[2023-10-08 11:58:47,791][102898] Updated weights for policy 1, policy_version 5100 (0.0009) +[2023-10-08 11:58:48,165][102898] Updated weights for policy 1, policy_version 5110 (0.0008) +[2023-10-08 11:58:48,533][102898] Updated weights for policy 1, policy_version 5120 (0.0008) +[2023-10-08 11:58:50,885][102897] Updated weights for policy 0, policy_version 5130 (0.0009) +[2023-10-08 11:58:51,249][102897] Updated weights for policy 0, policy_version 5140 (0.0007) +[2023-10-08 11:58:51,620][102897] Updated weights for policy 0, policy_version 5150 (0.0008) +[2023-10-08 11:58:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 10518528. Throughput: 0: 1787.0, 1: 1769.6. Samples: 2632300. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 11:58:51,875][101941] Avg episode reward: [(0, '6.480'), (1, '5.430')] +[2023-10-08 11:58:52,273][102898] Updated weights for policy 1, policy_version 5130 (0.0007) +[2023-10-08 11:58:52,640][102898] Updated weights for policy 1, policy_version 5140 (0.0008) +[2023-10-08 11:58:53,012][102898] Updated weights for policy 1, policy_version 5150 (0.0008) +[2023-10-08 11:58:55,161][102897] Updated weights for policy 0, policy_version 5160 (0.0012) +[2023-10-08 11:58:55,538][102897] Updated weights for policy 0, policy_version 5170 (0.0011) +[2023-10-08 11:58:55,910][102897] Updated weights for policy 0, policy_version 5180 (0.0009) +[2023-10-08 11:58:56,821][102898] Updated weights for policy 1, policy_version 5160 (0.0010) +[2023-10-08 11:58:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 10584064. Throughput: 0: 1807.0, 1: 1774.4. Samples: 2654160. Policy #0 lag: (min: 26.0, avg: 29.3, max: 58.0) +[2023-10-08 11:58:56,875][101941] Avg episode reward: [(0, '6.610'), (1, '5.300')] +[2023-10-08 11:58:56,876][102634] Saving new best policy, reward=6.610! +[2023-10-08 11:58:57,194][102898] Updated weights for policy 1, policy_version 5170 (0.0008) +[2023-10-08 11:58:57,569][102898] Updated weights for policy 1, policy_version 5180 (0.0007) +[2023-10-08 11:58:59,878][102897] Updated weights for policy 0, policy_version 5190 (0.0007) +[2023-10-08 11:59:00,244][102897] Updated weights for policy 0, policy_version 5200 (0.0009) +[2023-10-08 11:59:00,625][102897] Updated weights for policy 0, policy_version 5210 (0.0008) +[2023-10-08 11:59:01,234][102898] Updated weights for policy 1, policy_version 5190 (0.0009) +[2023-10-08 11:59:01,605][102898] Updated weights for policy 1, policy_version 5200 (0.0007) +[2023-10-08 11:59:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 10649600. Throughput: 0: 1784.5, 1: 1792.1. Samples: 2675080. Policy #0 lag: (min: 26.0, avg: 29.3, max: 58.0) +[2023-10-08 11:59:01,876][101941] Avg episode reward: [(0, '6.200'), (1, '4.900')] +[2023-10-08 11:59:01,969][102898] Updated weights for policy 1, policy_version 5210 (0.0008) +[2023-10-08 11:59:04,239][102897] Updated weights for policy 0, policy_version 5220 (0.0011) +[2023-10-08 11:59:04,609][102897] Updated weights for policy 0, policy_version 5230 (0.0009) +[2023-10-08 11:59:04,976][102897] Updated weights for policy 0, policy_version 5240 (0.0009) +[2023-10-08 11:59:05,755][102898] Updated weights for policy 1, policy_version 5220 (0.0010) +[2023-10-08 11:59:06,122][102898] Updated weights for policy 1, policy_version 5230 (0.0009) +[2023-10-08 11:59:06,497][102898] Updated weights for policy 1, policy_version 5240 (0.0007) +[2023-10-08 11:59:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 10747904. Throughput: 0: 1804.7, 1: 1772.1. Samples: 2686426. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 11:59:06,876][101941] Avg episode reward: [(0, '5.560'), (1, '4.960')] +[2023-10-08 11:59:08,727][102897] Updated weights for policy 0, policy_version 5250 (0.0010) +[2023-10-08 11:59:09,105][102897] Updated weights for policy 0, policy_version 5260 (0.0010) +[2023-10-08 11:59:09,485][102897] Updated weights for policy 0, policy_version 5270 (0.0010) +[2023-10-08 11:59:09,848][102897] Updated weights for policy 0, policy_version 5280 (0.0011) +[2023-10-08 11:59:10,295][102898] Updated weights for policy 1, policy_version 5250 (0.0008) +[2023-10-08 11:59:10,667][102898] Updated weights for policy 1, policy_version 5260 (0.0007) +[2023-10-08 11:59:11,026][102898] Updated weights for policy 1, policy_version 5270 (0.0007) +[2023-10-08 11:59:11,397][102898] Updated weights for policy 1, policy_version 5280 (0.0008) +[2023-10-08 11:59:11,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 10813440. Throughput: 0: 1785.1, 1: 1798.4. Samples: 2707514. Policy #0 lag: (min: 1.0, avg: 14.2, max: 33.0) +[2023-10-08 11:59:11,875][101941] Avg episode reward: [(0, '6.100'), (1, '5.160')] +[2023-10-08 11:59:13,770][102897] Updated weights for policy 0, policy_version 5290 (0.0007) +[2023-10-08 11:59:14,138][102897] Updated weights for policy 0, policy_version 5300 (0.0007) +[2023-10-08 11:59:14,517][102897] Updated weights for policy 0, policy_version 5310 (0.0008) +[2023-10-08 11:59:15,258][102898] Updated weights for policy 1, policy_version 5290 (0.0007) +[2023-10-08 11:59:15,627][102898] Updated weights for policy 1, policy_version 5300 (0.0008) +[2023-10-08 11:59:15,993][102898] Updated weights for policy 1, policy_version 5310 (0.0007) +[2023-10-08 11:59:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 10878976. Throughput: 0: 1780.8, 1: 1781.0. Samples: 2728698. Policy #0 lag: (min: 31.0, avg: 32.6, max: 58.0) +[2023-10-08 11:59:16,876][101941] Avg episode reward: [(0, '6.000'), (1, '5.690')] +[2023-10-08 11:59:18,434][102897] Updated weights for policy 0, policy_version 5320 (0.0008) +[2023-10-08 11:59:18,818][102897] Updated weights for policy 0, policy_version 5330 (0.0008) +[2023-10-08 11:59:19,181][102897] Updated weights for policy 0, policy_version 5340 (0.0007) +[2023-10-08 11:59:19,723][102898] Updated weights for policy 1, policy_version 5320 (0.0007) +[2023-10-08 11:59:20,097][102898] Updated weights for policy 1, policy_version 5330 (0.0011) +[2023-10-08 11:59:20,459][102898] Updated weights for policy 1, policy_version 5340 (0.0008) +[2023-10-08 11:59:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 10944512. Throughput: 0: 1780.1, 1: 1806.2. Samples: 2739822. Policy #0 lag: (min: 31.0, avg: 32.6, max: 58.0) +[2023-10-08 11:59:21,876][101941] Avg episode reward: [(0, '6.190'), (1, '5.600')] +[2023-10-08 11:59:22,841][102897] Updated weights for policy 0, policy_version 5350 (0.0008) +[2023-10-08 11:59:23,211][102897] Updated weights for policy 0, policy_version 5360 (0.0007) +[2023-10-08 11:59:23,586][102897] Updated weights for policy 0, policy_version 5370 (0.0007) +[2023-10-08 11:59:24,259][102898] Updated weights for policy 1, policy_version 5350 (0.0008) +[2023-10-08 11:59:24,623][102898] Updated weights for policy 1, policy_version 5360 (0.0008) +[2023-10-08 11:59:25,008][102898] Updated weights for policy 1, policy_version 5370 (0.0009) +[2023-10-08 11:59:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11010048. Throughput: 0: 1782.6, 1: 1777.2. Samples: 2760536. Policy #0 lag: (min: 4.0, avg: 6.0, max: 35.0) +[2023-10-08 11:59:26,875][101941] Avg episode reward: [(0, '6.400'), (1, '5.680')] +[2023-10-08 11:59:27,246][102897] Updated weights for policy 0, policy_version 5380 (0.0009) +[2023-10-08 11:59:27,615][102897] Updated weights for policy 0, policy_version 5390 (0.0008) +[2023-10-08 11:59:27,987][102897] Updated weights for policy 0, policy_version 5400 (0.0008) +[2023-10-08 11:59:28,785][102898] Updated weights for policy 1, policy_version 5380 (0.0010) +[2023-10-08 11:59:29,154][102898] Updated weights for policy 1, policy_version 5390 (0.0008) +[2023-10-08 11:59:29,517][102898] Updated weights for policy 1, policy_version 5400 (0.0008) +[2023-10-08 11:59:31,449][102897] Updated weights for policy 0, policy_version 5410 (0.0010) +[2023-10-08 11:59:31,816][102897] Updated weights for policy 0, policy_version 5420 (0.0007) +[2023-10-08 11:59:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11075584. Throughput: 0: 1803.8, 1: 1772.8. Samples: 2783014. Policy #0 lag: (min: 4.0, avg: 6.0, max: 35.0) +[2023-10-08 11:59:31,876][101941] Avg episode reward: [(0, '6.780'), (1, '5.290')] +[2023-10-08 11:59:32,188][102897] Updated weights for policy 0, policy_version 5430 (0.0007) +[2023-10-08 11:59:32,560][102634] Saving new best policy, reward=6.780! +[2023-10-08 11:59:32,563][102897] Updated weights for policy 0, policy_version 5440 (0.0008) +[2023-10-08 11:59:33,393][102898] Updated weights for policy 1, policy_version 5410 (0.0009) +[2023-10-08 11:59:33,770][102898] Updated weights for policy 1, policy_version 5420 (0.0008) +[2023-10-08 11:59:34,142][102898] Updated weights for policy 1, policy_version 5430 (0.0009) +[2023-10-08 11:59:34,509][102898] Updated weights for policy 1, policy_version 5440 (0.0010) +[2023-10-08 11:59:36,448][102897] Updated weights for policy 0, policy_version 5450 (0.0007) +[2023-10-08 11:59:36,820][102897] Updated weights for policy 0, policy_version 5460 (0.0010) +[2023-10-08 11:59:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11141120. Throughput: 0: 1791.8, 1: 1782.0. Samples: 2793122. Policy #0 lag: (min: 2.0, avg: 4.8, max: 28.0) +[2023-10-08 11:59:36,876][101941] Avg episode reward: [(0, '6.340'), (1, '5.380')] +[2023-10-08 11:59:37,196][102897] Updated weights for policy 0, policy_version 5470 (0.0009) +[2023-10-08 11:59:38,251][102898] Updated weights for policy 1, policy_version 5450 (0.0010) +[2023-10-08 11:59:38,612][102898] Updated weights for policy 1, policy_version 5460 (0.0007) +[2023-10-08 11:59:38,975][102898] Updated weights for policy 1, policy_version 5470 (0.0009) +[2023-10-08 11:59:40,936][102897] Updated weights for policy 0, policy_version 5480 (0.0010) +[2023-10-08 11:59:41,313][102897] Updated weights for policy 0, policy_version 5490 (0.0007) +[2023-10-08 11:59:41,691][102897] Updated weights for policy 0, policy_version 5500 (0.0008) +[2023-10-08 11:59:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 11239424. Throughput: 0: 1802.8, 1: 1780.3. Samples: 2815400. Policy #0 lag: (min: 17.0, avg: 32.1, max: 49.0) +[2023-10-08 11:59:41,876][101941] Avg episode reward: [(0, '6.120'), (1, '5.060')] +[2023-10-08 11:59:42,714][102898] Updated weights for policy 1, policy_version 5480 (0.0007) +[2023-10-08 11:59:43,100][102898] Updated weights for policy 1, policy_version 5490 (0.0009) +[2023-10-08 11:59:43,469][102898] Updated weights for policy 1, policy_version 5500 (0.0009) +[2023-10-08 11:59:45,345][102897] Updated weights for policy 0, policy_version 5510 (0.0008) +[2023-10-08 11:59:45,717][102897] Updated weights for policy 0, policy_version 5520 (0.0008) +[2023-10-08 11:59:46,086][102897] Updated weights for policy 0, policy_version 5530 (0.0007) +[2023-10-08 11:59:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 11304960. Throughput: 0: 1795.8, 1: 1792.1. Samples: 2836536. Policy #0 lag: (min: 17.0, avg: 32.1, max: 49.0) +[2023-10-08 11:59:46,876][101941] Avg episode reward: [(0, '5.940'), (1, '4.680')] +[2023-10-08 11:59:47,231][102898] Updated weights for policy 1, policy_version 5510 (0.0009) +[2023-10-08 11:59:47,615][102898] Updated weights for policy 1, policy_version 5520 (0.0011) +[2023-10-08 11:59:47,986][102898] Updated weights for policy 1, policy_version 5530 (0.0010) +[2023-10-08 11:59:49,947][102897] Updated weights for policy 0, policy_version 5540 (0.0007) +[2023-10-08 11:59:50,316][102897] Updated weights for policy 0, policy_version 5550 (0.0009) +[2023-10-08 11:59:50,698][102897] Updated weights for policy 0, policy_version 5560 (0.0009) +[2023-10-08 11:59:51,819][102898] Updated weights for policy 1, policy_version 5540 (0.0008) +[2023-10-08 11:59:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 11370496. Throughput: 0: 1803.4, 1: 1781.2. Samples: 2847734. Policy #0 lag: (min: 17.0, avg: 33.3, max: 49.0) +[2023-10-08 11:59:51,875][101941] Avg episode reward: [(0, '5.820'), (1, '4.920')] +[2023-10-08 11:59:52,197][102898] Updated weights for policy 1, policy_version 5550 (0.0007) +[2023-10-08 11:59:52,577][102898] Updated weights for policy 1, policy_version 5560 (0.0009) +[2023-10-08 11:59:54,463][102897] Updated weights for policy 0, policy_version 5570 (0.0011) +[2023-10-08 11:59:54,833][102897] Updated weights for policy 0, policy_version 5580 (0.0008) +[2023-10-08 11:59:55,203][102897] Updated weights for policy 0, policy_version 5590 (0.0007) +[2023-10-08 11:59:55,576][102897] Updated weights for policy 0, policy_version 5600 (0.0008) +[2023-10-08 11:59:56,341][102898] Updated weights for policy 1, policy_version 5570 (0.0007) +[2023-10-08 11:59:56,700][102898] Updated weights for policy 1, policy_version 5580 (0.0007) +[2023-10-08 11:59:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 11436032. Throughput: 0: 1801.3, 1: 1781.7. Samples: 2868752. Policy #0 lag: (min: 17.0, avg: 33.3, max: 49.0) +[2023-10-08 11:59:56,875][101941] Avg episode reward: [(0, '5.890'), (1, '5.680')] +[2023-10-08 11:59:57,078][102898] Updated weights for policy 1, policy_version 5590 (0.0008) +[2023-10-08 11:59:57,437][102898] Updated weights for policy 1, policy_version 5600 (0.0008) +[2023-10-08 11:59:59,218][102897] Updated weights for policy 0, policy_version 5610 (0.0010) +[2023-10-08 11:59:59,595][102897] Updated weights for policy 0, policy_version 5620 (0.0007) +[2023-10-08 11:59:59,968][102897] Updated weights for policy 0, policy_version 5630 (0.0007) +[2023-10-08 12:00:01,279][102898] Updated weights for policy 1, policy_version 5610 (0.0008) +[2023-10-08 12:00:01,650][102898] Updated weights for policy 1, policy_version 5620 (0.0011) +[2023-10-08 12:00:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 11501568. Throughput: 0: 1797.3, 1: 1791.1. Samples: 2890178. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 12:00:01,876][101941] Avg episode reward: [(0, '5.450'), (1, '6.020')] +[2023-10-08 12:00:02,023][102898] Updated weights for policy 1, policy_version 5630 (0.0011) +[2023-10-08 12:00:03,813][102897] Updated weights for policy 0, policy_version 5640 (0.0008) +[2023-10-08 12:00:04,190][102897] Updated weights for policy 0, policy_version 5650 (0.0008) +[2023-10-08 12:00:04,574][102897] Updated weights for policy 0, policy_version 5660 (0.0010) +[2023-10-08 12:00:05,818][102898] Updated weights for policy 1, policy_version 5640 (0.0009) +[2023-10-08 12:00:06,193][102898] Updated weights for policy 1, policy_version 5650 (0.0008) +[2023-10-08 12:00:06,561][102898] Updated weights for policy 1, policy_version 5660 (0.0007) +[2023-10-08 12:00:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 11599872. Throughput: 0: 1804.4, 1: 1774.0. Samples: 2900848. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 12:00:06,875][101941] Avg episode reward: [(0, '5.750'), (1, '5.550')] +[2023-10-08 12:00:08,283][102897] Updated weights for policy 0, policy_version 5670 (0.0009) +[2023-10-08 12:00:08,656][102897] Updated weights for policy 0, policy_version 5680 (0.0007) +[2023-10-08 12:00:09,028][102897] Updated weights for policy 0, policy_version 5690 (0.0008) +[2023-10-08 12:00:10,104][102898] Updated weights for policy 1, policy_version 5670 (0.0007) +[2023-10-08 12:00:10,481][102898] Updated weights for policy 1, policy_version 5680 (0.0008) +[2023-10-08 12:00:10,850][102898] Updated weights for policy 1, policy_version 5690 (0.0008) +[2023-10-08 12:00:11,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 11665408. Throughput: 0: 1792.5, 1: 1802.7. Samples: 2922322. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 12:00:11,876][101941] Avg episode reward: [(0, '5.890'), (1, '5.820')] +[2023-10-08 12:00:12,840][102897] Updated weights for policy 0, policy_version 5700 (0.0008) +[2023-10-08 12:00:13,222][102897] Updated weights for policy 0, policy_version 5710 (0.0008) +[2023-10-08 12:00:13,587][102897] Updated weights for policy 0, policy_version 5720 (0.0009) +[2023-10-08 12:00:14,522][102898] Updated weights for policy 1, policy_version 5700 (0.0008) +[2023-10-08 12:00:14,890][102898] Updated weights for policy 1, policy_version 5710 (0.0008) +[2023-10-08 12:00:15,259][102898] Updated weights for policy 1, policy_version 5720 (0.0008) +[2023-10-08 12:00:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 11730944. Throughput: 0: 1784.1, 1: 1793.6. Samples: 2944010. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 12:00:16,876][101941] Avg episode reward: [(0, '5.930'), (1, '6.270')] +[2023-10-08 12:00:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000005728_5865472.pth... +[2023-10-08 12:00:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000005728_5865472.pth... +[2023-10-08 12:00:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000004064_4161536.pth +[2023-10-08 12:00:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000004064_4161536.pth +[2023-10-08 12:00:17,387][102897] Updated weights for policy 0, policy_version 5730 (0.0009) +[2023-10-08 12:00:17,763][102897] Updated weights for policy 0, policy_version 5740 (0.0010) +[2023-10-08 12:00:18,130][102897] Updated weights for policy 0, policy_version 5750 (0.0010) +[2023-10-08 12:00:18,505][102897] Updated weights for policy 0, policy_version 5760 (0.0009) +[2023-10-08 12:00:18,997][102898] Updated weights for policy 1, policy_version 5730 (0.0007) +[2023-10-08 12:00:19,364][102898] Updated weights for policy 1, policy_version 5740 (0.0008) +[2023-10-08 12:00:19,732][102898] Updated weights for policy 1, policy_version 5750 (0.0007) +[2023-10-08 12:00:20,109][102898] Updated weights for policy 1, policy_version 5760 (0.0007) +[2023-10-08 12:00:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11796480. Throughput: 0: 1784.0, 1: 1802.9. Samples: 2954530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:00:21,876][101941] Avg episode reward: [(0, '6.010'), (1, '5.560')] +[2023-10-08 12:00:22,361][102897] Updated weights for policy 0, policy_version 5770 (0.0009) +[2023-10-08 12:00:22,724][102897] Updated weights for policy 0, policy_version 5780 (0.0010) +[2023-10-08 12:00:23,116][102897] Updated weights for policy 0, policy_version 5790 (0.0010) +[2023-10-08 12:00:23,931][102898] Updated weights for policy 1, policy_version 5770 (0.0007) +[2023-10-08 12:00:24,294][102898] Updated weights for policy 1, policy_version 5780 (0.0009) +[2023-10-08 12:00:24,652][102898] Updated weights for policy 1, policy_version 5790 (0.0009) +[2023-10-08 12:00:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11862016. Throughput: 0: 1775.7, 1: 1785.9. Samples: 2975672. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:00:26,875][101941] Avg episode reward: [(0, '6.380'), (1, '5.050')] +[2023-10-08 12:00:26,903][102897] Updated weights for policy 0, policy_version 5800 (0.0008) +[2023-10-08 12:00:27,280][102897] Updated weights for policy 0, policy_version 5810 (0.0008) +[2023-10-08 12:00:27,652][102897] Updated weights for policy 0, policy_version 5820 (0.0010) +[2023-10-08 12:00:28,455][102898] Updated weights for policy 1, policy_version 5800 (0.0008) +[2023-10-08 12:00:28,823][102898] Updated weights for policy 1, policy_version 5810 (0.0007) +[2023-10-08 12:00:29,192][102898] Updated weights for policy 1, policy_version 5820 (0.0009) +[2023-10-08 12:00:31,453][102897] Updated weights for policy 0, policy_version 5830 (0.0008) +[2023-10-08 12:00:31,816][102897] Updated weights for policy 0, policy_version 5840 (0.0008) +[2023-10-08 12:00:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11927552. Throughput: 0: 1802.6, 1: 1782.6. Samples: 2997872. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:00:31,875][101941] Avg episode reward: [(0, '6.260'), (1, '5.450')] +[2023-10-08 12:00:32,192][102897] Updated weights for policy 0, policy_version 5850 (0.0009) +[2023-10-08 12:00:33,064][102898] Updated weights for policy 1, policy_version 5830 (0.0009) +[2023-10-08 12:00:33,453][102898] Updated weights for policy 1, policy_version 5840 (0.0008) +[2023-10-08 12:00:33,817][102898] Updated weights for policy 1, policy_version 5850 (0.0009) +[2023-10-08 12:00:35,944][102897] Updated weights for policy 0, policy_version 5860 (0.0008) +[2023-10-08 12:00:36,309][102897] Updated weights for policy 0, policy_version 5870 (0.0008) +[2023-10-08 12:00:36,685][102897] Updated weights for policy 0, policy_version 5880 (0.0007) +[2023-10-08 12:00:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 11993088. Throughput: 0: 1772.4, 1: 1779.0. Samples: 3007550. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:00:36,875][101941] Avg episode reward: [(0, '5.840'), (1, '5.820')] +[2023-10-08 12:00:37,541][102898] Updated weights for policy 1, policy_version 5860 (0.0012) +[2023-10-08 12:00:37,902][102898] Updated weights for policy 1, policy_version 5870 (0.0010) +[2023-10-08 12:00:38,272][102898] Updated weights for policy 1, policy_version 5880 (0.0009) +[2023-10-08 12:00:40,404][102897] Updated weights for policy 0, policy_version 5890 (0.0009) +[2023-10-08 12:00:40,768][102897] Updated weights for policy 0, policy_version 5900 (0.0008) +[2023-10-08 12:00:41,138][102897] Updated weights for policy 0, policy_version 5910 (0.0011) +[2023-10-08 12:00:41,509][102897] Updated weights for policy 0, policy_version 5920 (0.0009) +[2023-10-08 12:00:41,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 12091392. Throughput: 0: 1797.7, 1: 1781.2. Samples: 3029804. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:00:41,876][101941] Avg episode reward: [(0, '6.110'), (1, '5.580')] +[2023-10-08 12:00:42,157][102898] Updated weights for policy 1, policy_version 5890 (0.0010) +[2023-10-08 12:00:42,516][102898] Updated weights for policy 1, policy_version 5900 (0.0007) +[2023-10-08 12:00:42,878][102898] Updated weights for policy 1, policy_version 5910 (0.0007) +[2023-10-08 12:00:43,247][102898] Updated weights for policy 1, policy_version 5920 (0.0009) +[2023-10-08 12:00:45,447][102897] Updated weights for policy 0, policy_version 5930 (0.0008) +[2023-10-08 12:00:45,818][102897] Updated weights for policy 0, policy_version 5940 (0.0007) +[2023-10-08 12:00:46,202][102897] Updated weights for policy 0, policy_version 5950 (0.0008) +[2023-10-08 12:00:46,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 12156928. Throughput: 0: 1770.0, 1: 1795.2. Samples: 3050612. Policy #0 lag: (min: 17.0, avg: 21.2, max: 49.0) +[2023-10-08 12:00:46,876][101941] Avg episode reward: [(0, '5.800'), (1, '5.260')] +[2023-10-08 12:00:46,996][102898] Updated weights for policy 1, policy_version 5930 (0.0007) +[2023-10-08 12:00:47,353][102898] Updated weights for policy 1, policy_version 5940 (0.0009) +[2023-10-08 12:00:47,724][102898] Updated weights for policy 1, policy_version 5950 (0.0007) +[2023-10-08 12:00:49,799][102897] Updated weights for policy 0, policy_version 5960 (0.0009) +[2023-10-08 12:00:50,169][102897] Updated weights for policy 0, policy_version 5970 (0.0007) +[2023-10-08 12:00:50,548][102897] Updated weights for policy 0, policy_version 5980 (0.0007) +[2023-10-08 12:00:51,435][102898] Updated weights for policy 1, policy_version 5960 (0.0007) +[2023-10-08 12:00:51,805][102898] Updated weights for policy 1, policy_version 5970 (0.0008) +[2023-10-08 12:00:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 12222464. Throughput: 0: 1799.0, 1: 1782.8. Samples: 3062030. Policy #0 lag: (min: 17.0, avg: 21.2, max: 49.0) +[2023-10-08 12:00:51,876][101941] Avg episode reward: [(0, '6.500'), (1, '5.640')] +[2023-10-08 12:00:52,163][102898] Updated weights for policy 1, policy_version 5980 (0.0008) +[2023-10-08 12:00:54,199][102897] Updated weights for policy 0, policy_version 5990 (0.0008) +[2023-10-08 12:00:54,564][102897] Updated weights for policy 0, policy_version 6000 (0.0010) +[2023-10-08 12:00:54,936][102897] Updated weights for policy 0, policy_version 6010 (0.0008) +[2023-10-08 12:00:55,912][102898] Updated weights for policy 1, policy_version 5990 (0.0010) +[2023-10-08 12:00:56,288][102898] Updated weights for policy 1, policy_version 6000 (0.0009) +[2023-10-08 12:00:56,655][102898] Updated weights for policy 1, policy_version 6010 (0.0010) +[2023-10-08 12:00:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 12288000. Throughput: 0: 1777.4, 1: 1792.0. Samples: 3082942. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:00:56,876][101941] Avg episode reward: [(0, '6.730'), (1, '5.440')] +[2023-10-08 12:00:58,663][102897] Updated weights for policy 0, policy_version 6020 (0.0008) +[2023-10-08 12:00:59,047][102897] Updated weights for policy 0, policy_version 6030 (0.0008) +[2023-10-08 12:00:59,417][102897] Updated weights for policy 0, policy_version 6040 (0.0007) +[2023-10-08 12:01:00,370][102898] Updated weights for policy 1, policy_version 6020 (0.0008) +[2023-10-08 12:01:00,743][102898] Updated weights for policy 1, policy_version 6030 (0.0008) +[2023-10-08 12:01:01,098][102898] Updated weights for policy 1, policy_version 6040 (0.0008) +[2023-10-08 12:01:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 12386304. Throughput: 0: 1781.0, 1: 1773.0. Samples: 3103940. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:01:01,876][101941] Avg episode reward: [(0, '6.310'), (1, '6.000')] +[2023-10-08 12:01:03,145][102897] Updated weights for policy 0, policy_version 6050 (0.0007) +[2023-10-08 12:01:03,526][102897] Updated weights for policy 0, policy_version 6060 (0.0008) +[2023-10-08 12:01:03,898][102897] Updated weights for policy 0, policy_version 6070 (0.0009) +[2023-10-08 12:01:04,267][102897] Updated weights for policy 0, policy_version 6080 (0.0008) +[2023-10-08 12:01:04,941][102898] Updated weights for policy 1, policy_version 6050 (0.0009) +[2023-10-08 12:01:05,304][102898] Updated weights for policy 1, policy_version 6060 (0.0010) +[2023-10-08 12:01:05,677][102898] Updated weights for policy 1, policy_version 6070 (0.0009) +[2023-10-08 12:01:06,039][102898] Updated weights for policy 1, policy_version 6080 (0.0008) +[2023-10-08 12:01:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 12451840. Throughput: 0: 1779.1, 1: 1789.1. Samples: 3115100. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:01:06,876][101941] Avg episode reward: [(0, '5.830'), (1, '5.850')] +[2023-10-08 12:01:08,314][102897] Updated weights for policy 0, policy_version 6090 (0.0008) +[2023-10-08 12:01:08,691][102897] Updated weights for policy 0, policy_version 6100 (0.0009) +[2023-10-08 12:01:09,075][102897] Updated weights for policy 0, policy_version 6110 (0.0010) +[2023-10-08 12:01:09,741][102898] Updated weights for policy 1, policy_version 6090 (0.0011) +[2023-10-08 12:01:10,113][102898] Updated weights for policy 1, policy_version 6100 (0.0011) +[2023-10-08 12:01:10,474][102898] Updated weights for policy 1, policy_version 6110 (0.0008) +[2023-10-08 12:01:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 12517376. Throughput: 0: 1779.1, 1: 1786.0. Samples: 3136104. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:01:11,876][101941] Avg episode reward: [(0, '5.960'), (1, '5.710')] +[2023-10-08 12:01:12,822][102897] Updated weights for policy 0, policy_version 6120 (0.0008) +[2023-10-08 12:01:13,188][102897] Updated weights for policy 0, policy_version 6130 (0.0007) +[2023-10-08 12:01:13,568][102897] Updated weights for policy 0, policy_version 6140 (0.0007) +[2023-10-08 12:01:14,487][102898] Updated weights for policy 1, policy_version 6120 (0.0007) +[2023-10-08 12:01:14,848][102898] Updated weights for policy 1, policy_version 6130 (0.0007) +[2023-10-08 12:01:15,214][102898] Updated weights for policy 1, policy_version 6140 (0.0007) +[2023-10-08 12:01:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 12582912. Throughput: 0: 1785.0, 1: 1780.3. Samples: 3158310. Policy #0 lag: (min: 10.0, avg: 10.8, max: 28.0) +[2023-10-08 12:01:16,876][101941] Avg episode reward: [(0, '6.370'), (1, '5.730')] +[2023-10-08 12:01:17,145][102897] Updated weights for policy 0, policy_version 6150 (0.0008) +[2023-10-08 12:01:17,519][102897] Updated weights for policy 0, policy_version 6160 (0.0009) +[2023-10-08 12:01:17,884][102897] Updated weights for policy 0, policy_version 6170 (0.0008) +[2023-10-08 12:01:19,058][102898] Updated weights for policy 1, policy_version 6150 (0.0007) +[2023-10-08 12:01:19,442][102898] Updated weights for policy 1, policy_version 6160 (0.0010) +[2023-10-08 12:01:19,822][102898] Updated weights for policy 1, policy_version 6170 (0.0007) +[2023-10-08 12:01:21,803][102897] Updated weights for policy 0, policy_version 6180 (0.0008) +[2023-10-08 12:01:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 12648448. Throughput: 0: 1781.2, 1: 1797.5. Samples: 3168590. Policy #0 lag: (min: 10.0, avg: 10.8, max: 28.0) +[2023-10-08 12:01:21,876][101941] Avg episode reward: [(0, '6.270'), (1, '5.550')] +[2023-10-08 12:01:22,161][102897] Updated weights for policy 0, policy_version 6190 (0.0010) +[2023-10-08 12:01:22,533][102897] Updated weights for policy 0, policy_version 6200 (0.0009) +[2023-10-08 12:01:23,614][102898] Updated weights for policy 1, policy_version 6180 (0.0009) +[2023-10-08 12:01:23,986][102898] Updated weights for policy 1, policy_version 6190 (0.0009) +[2023-10-08 12:01:24,360][102898] Updated weights for policy 1, policy_version 6200 (0.0007) +[2023-10-08 12:01:26,231][102897] Updated weights for policy 0, policy_version 6210 (0.0007) +[2023-10-08 12:01:26,609][102897] Updated weights for policy 0, policy_version 6220 (0.0008) +[2023-10-08 12:01:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 12713984. Throughput: 0: 1780.7, 1: 1782.0. Samples: 3190124. Policy #0 lag: (min: 30.0, avg: 37.6, max: 62.0) +[2023-10-08 12:01:26,875][101941] Avg episode reward: [(0, '6.670'), (1, '5.370')] +[2023-10-08 12:01:26,984][102897] Updated weights for policy 0, policy_version 6230 (0.0010) +[2023-10-08 12:01:27,348][102897] Updated weights for policy 0, policy_version 6240 (0.0009) +[2023-10-08 12:01:27,890][102898] Updated weights for policy 1, policy_version 6210 (0.0009) +[2023-10-08 12:01:28,258][102898] Updated weights for policy 1, policy_version 6220 (0.0008) +[2023-10-08 12:01:28,617][102898] Updated weights for policy 1, policy_version 6230 (0.0007) +[2023-10-08 12:01:28,985][102898] Updated weights for policy 1, policy_version 6240 (0.0008) +[2023-10-08 12:01:31,097][102897] Updated weights for policy 0, policy_version 6250 (0.0009) +[2023-10-08 12:01:31,477][102897] Updated weights for policy 0, policy_version 6260 (0.0010) +[2023-10-08 12:01:31,856][102897] Updated weights for policy 0, policy_version 6270 (0.0009) +[2023-10-08 12:01:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 12779520. Throughput: 0: 1801.8, 1: 1788.7. Samples: 3212186. Policy #0 lag: (min: 30.0, avg: 37.6, max: 62.0) +[2023-10-08 12:01:31,876][101941] Avg episode reward: [(0, '6.250'), (1, '5.280')] +[2023-10-08 12:01:32,759][102898] Updated weights for policy 1, policy_version 6250 (0.0010) +[2023-10-08 12:01:33,127][102898] Updated weights for policy 1, policy_version 6260 (0.0010) +[2023-10-08 12:01:33,490][102898] Updated weights for policy 1, policy_version 6270 (0.0010) +[2023-10-08 12:01:35,372][102897] Updated weights for policy 0, policy_version 6280 (0.0010) +[2023-10-08 12:01:35,746][102897] Updated weights for policy 0, policy_version 6290 (0.0009) +[2023-10-08 12:01:36,112][102897] Updated weights for policy 0, policy_version 6300 (0.0008) +[2023-10-08 12:01:36,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 12877824. Throughput: 0: 1784.4, 1: 1788.2. Samples: 3222800. Policy #0 lag: (min: 31.0, avg: 32.0, max: 53.0) +[2023-10-08 12:01:36,876][101941] Avg episode reward: [(0, '6.140'), (1, '5.240')] +[2023-10-08 12:01:37,322][102898] Updated weights for policy 1, policy_version 6280 (0.0008) +[2023-10-08 12:01:37,695][102898] Updated weights for policy 1, policy_version 6290 (0.0008) +[2023-10-08 12:01:38,059][102898] Updated weights for policy 1, policy_version 6300 (0.0008) +[2023-10-08 12:01:39,751][102897] Updated weights for policy 0, policy_version 6310 (0.0007) +[2023-10-08 12:01:40,115][102897] Updated weights for policy 0, policy_version 6320 (0.0007) +[2023-10-08 12:01:40,491][102897] Updated weights for policy 0, policy_version 6330 (0.0007) +[2023-10-08 12:01:41,781][102898] Updated weights for policy 1, policy_version 6310 (0.0008) +[2023-10-08 12:01:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 12943360. Throughput: 0: 1798.3, 1: 1791.9. Samples: 3244498. Policy #0 lag: (min: 31.0, avg: 45.7, max: 63.0) +[2023-10-08 12:01:41,876][101941] Avg episode reward: [(0, '6.700'), (1, '5.530')] +[2023-10-08 12:01:42,150][102898] Updated weights for policy 1, policy_version 6320 (0.0007) +[2023-10-08 12:01:42,505][102898] Updated weights for policy 1, policy_version 6330 (0.0011) +[2023-10-08 12:01:44,299][102897] Updated weights for policy 0, policy_version 6340 (0.0009) +[2023-10-08 12:01:44,678][102897] Updated weights for policy 0, policy_version 6350 (0.0010) +[2023-10-08 12:01:45,049][102897] Updated weights for policy 0, policy_version 6360 (0.0009) +[2023-10-08 12:01:46,308][102898] Updated weights for policy 1, policy_version 6340 (0.0008) +[2023-10-08 12:01:46,685][102898] Updated weights for policy 1, policy_version 6350 (0.0008) +[2023-10-08 12:01:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 13008896. Throughput: 0: 1785.4, 1: 1815.8. Samples: 3265994. Policy #0 lag: (min: 31.0, avg: 45.7, max: 63.0) +[2023-10-08 12:01:46,876][101941] Avg episode reward: [(0, '6.410'), (1, '5.680')] +[2023-10-08 12:01:47,061][102898] Updated weights for policy 1, policy_version 6360 (0.0007) +[2023-10-08 12:01:48,848][102897] Updated weights for policy 0, policy_version 6370 (0.0008) +[2023-10-08 12:01:49,227][102897] Updated weights for policy 0, policy_version 6380 (0.0009) +[2023-10-08 12:01:49,595][102897] Updated weights for policy 0, policy_version 6390 (0.0007) +[2023-10-08 12:01:49,971][102897] Updated weights for policy 0, policy_version 6400 (0.0007) +[2023-10-08 12:01:50,774][102898] Updated weights for policy 1, policy_version 6370 (0.0008) +[2023-10-08 12:01:51,149][102898] Updated weights for policy 1, policy_version 6380 (0.0010) +[2023-10-08 12:01:51,510][102898] Updated weights for policy 1, policy_version 6390 (0.0009) +[2023-10-08 12:01:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 13074432. Throughput: 0: 1803.9, 1: 1788.4. Samples: 3276750. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:01:51,876][101941] Avg episode reward: [(0, '6.320'), (1, '5.490')] +[2023-10-08 12:01:51,878][102898] Updated weights for policy 1, policy_version 6400 (0.0009) +[2023-10-08 12:01:53,825][102897] Updated weights for policy 0, policy_version 6410 (0.0009) +[2023-10-08 12:01:54,206][102897] Updated weights for policy 0, policy_version 6420 (0.0010) +[2023-10-08 12:01:54,572][102897] Updated weights for policy 0, policy_version 6430 (0.0010) +[2023-10-08 12:01:55,727][102898] Updated weights for policy 1, policy_version 6410 (0.0011) +[2023-10-08 12:01:56,095][102898] Updated weights for policy 1, policy_version 6420 (0.0009) +[2023-10-08 12:01:56,469][102898] Updated weights for policy 1, policy_version 6430 (0.0010) +[2023-10-08 12:01:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 13172736. Throughput: 0: 1787.4, 1: 1801.9. Samples: 3297620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:01:56,876][101941] Avg episode reward: [(0, '6.100'), (1, '5.510')] +[2023-10-08 12:01:58,299][102897] Updated weights for policy 0, policy_version 6440 (0.0009) +[2023-10-08 12:01:58,688][102897] Updated weights for policy 0, policy_version 6450 (0.0007) +[2023-10-08 12:01:59,058][102897] Updated weights for policy 0, policy_version 6460 (0.0009) +[2023-10-08 12:02:00,273][102898] Updated weights for policy 1, policy_version 6440 (0.0008) +[2023-10-08 12:02:00,647][102898] Updated weights for policy 1, policy_version 6450 (0.0010) +[2023-10-08 12:02:01,012][102898] Updated weights for policy 1, policy_version 6460 (0.0010) +[2023-10-08 12:02:01,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 13238272. Throughput: 0: 1781.3, 1: 1775.3. Samples: 3318356. Policy #0 lag: (min: 31.0, avg: 37.1, max: 63.0) +[2023-10-08 12:02:01,876][101941] Avg episode reward: [(0, '5.890'), (1, '4.710')] +[2023-10-08 12:02:02,925][102897] Updated weights for policy 0, policy_version 6470 (0.0008) +[2023-10-08 12:02:03,304][102897] Updated weights for policy 0, policy_version 6480 (0.0007) +[2023-10-08 12:02:03,681][102897] Updated weights for policy 0, policy_version 6490 (0.0010) +[2023-10-08 12:02:04,955][102898] Updated weights for policy 1, policy_version 6470 (0.0008) +[2023-10-08 12:02:05,349][102898] Updated weights for policy 1, policy_version 6480 (0.0008) +[2023-10-08 12:02:05,711][102898] Updated weights for policy 1, policy_version 6490 (0.0008) +[2023-10-08 12:02:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 13303808. Throughput: 0: 1782.2, 1: 1794.5. Samples: 3329542. Policy #0 lag: (min: 31.0, avg: 37.1, max: 63.0) +[2023-10-08 12:02:06,875][101941] Avg episode reward: [(0, '6.480'), (1, '4.850')] +[2023-10-08 12:02:07,492][102897] Updated weights for policy 0, policy_version 6500 (0.0008) +[2023-10-08 12:02:07,866][102897] Updated weights for policy 0, policy_version 6510 (0.0010) +[2023-10-08 12:02:08,230][102897] Updated weights for policy 0, policy_version 6520 (0.0008) +[2023-10-08 12:02:09,308][102898] Updated weights for policy 1, policy_version 6500 (0.0008) +[2023-10-08 12:02:09,664][102898] Updated weights for policy 1, policy_version 6510 (0.0007) +[2023-10-08 12:02:10,031][102898] Updated weights for policy 1, policy_version 6520 (0.0007) +[2023-10-08 12:02:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 13369344. Throughput: 0: 1785.8, 1: 1775.0. Samples: 3350358. Policy #0 lag: (min: 0.0, avg: 27.8, max: 32.0) +[2023-10-08 12:02:11,876][101941] Avg episode reward: [(0, '6.730'), (1, '5.350')] +[2023-10-08 12:02:11,965][102897] Updated weights for policy 0, policy_version 6530 (0.0009) +[2023-10-08 12:02:12,336][102897] Updated weights for policy 0, policy_version 6540 (0.0010) +[2023-10-08 12:02:12,714][102897] Updated weights for policy 0, policy_version 6550 (0.0009) +[2023-10-08 12:02:13,082][102897] Updated weights for policy 0, policy_version 6560 (0.0008) +[2023-10-08 12:02:13,744][102898] Updated weights for policy 1, policy_version 6530 (0.0008) +[2023-10-08 12:02:14,111][102898] Updated weights for policy 1, policy_version 6540 (0.0008) +[2023-10-08 12:02:14,474][102898] Updated weights for policy 1, policy_version 6550 (0.0009) +[2023-10-08 12:02:14,841][102898] Updated weights for policy 1, policy_version 6560 (0.0009) +[2023-10-08 12:02:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 13434880. Throughput: 0: 1798.9, 1: 1765.4. Samples: 3372576. Policy #0 lag: (min: 0.0, avg: 27.8, max: 32.0) +[2023-10-08 12:02:16,875][101941] Avg episode reward: [(0, '6.640'), (1, '5.760')] +[2023-10-08 12:02:16,882][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000006560_6717440.pth... +[2023-10-08 12:02:16,919][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000004896_5013504.pth +[2023-10-08 12:02:16,921][102897] Updated weights for policy 0, policy_version 6570 (0.0008) +[2023-10-08 12:02:17,304][102897] Updated weights for policy 0, policy_version 6580 (0.0009) +[2023-10-08 12:02:17,683][102897] Updated weights for policy 0, policy_version 6590 (0.0008) +[2023-10-08 12:02:17,749][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000006592_6750208.pth... +[2023-10-08 12:02:17,787][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000004896_5013504.pth +[2023-10-08 12:02:18,507][102898] Updated weights for policy 1, policy_version 6570 (0.0010) +[2023-10-08 12:02:18,867][102898] Updated weights for policy 1, policy_version 6580 (0.0009) +[2023-10-08 12:02:19,230][102898] Updated weights for policy 1, policy_version 6590 (0.0010) +[2023-10-08 12:02:21,417][102897] Updated weights for policy 0, policy_version 6600 (0.0010) +[2023-10-08 12:02:21,786][102897] Updated weights for policy 0, policy_version 6610 (0.0009) +[2023-10-08 12:02:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 13500416. Throughput: 0: 1780.1, 1: 1768.6. Samples: 3382488. Policy #0 lag: (min: 31.0, avg: 32.3, max: 56.0) +[2023-10-08 12:02:21,876][101941] Avg episode reward: [(0, '6.700'), (1, '5.590')] +[2023-10-08 12:02:22,164][102897] Updated weights for policy 0, policy_version 6620 (0.0009) +[2023-10-08 12:02:23,282][102898] Updated weights for policy 1, policy_version 6600 (0.0009) +[2023-10-08 12:02:23,645][102898] Updated weights for policy 1, policy_version 6610 (0.0010) +[2023-10-08 12:02:24,011][102898] Updated weights for policy 1, policy_version 6620 (0.0011) +[2023-10-08 12:02:25,835][102897] Updated weights for policy 0, policy_version 6630 (0.0009) +[2023-10-08 12:02:26,213][102897] Updated weights for policy 0, policy_version 6640 (0.0008) +[2023-10-08 12:02:26,581][102897] Updated weights for policy 0, policy_version 6650 (0.0008) +[2023-10-08 12:02:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 13598720. Throughput: 0: 1799.3, 1: 1767.5. Samples: 3405004. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:02:26,875][101941] Avg episode reward: [(0, '6.120'), (1, '4.850')] +[2023-10-08 12:02:27,974][102898] Updated weights for policy 1, policy_version 6630 (0.0008) +[2023-10-08 12:02:28,349][102898] Updated weights for policy 1, policy_version 6640 (0.0007) +[2023-10-08 12:02:28,708][102898] Updated weights for policy 1, policy_version 6650 (0.0009) +[2023-10-08 12:02:30,334][102897] Updated weights for policy 0, policy_version 6660 (0.0007) +[2023-10-08 12:02:30,713][102897] Updated weights for policy 0, policy_version 6670 (0.0009) +[2023-10-08 12:02:31,085][102897] Updated weights for policy 0, policy_version 6680 (0.0008) +[2023-10-08 12:02:31,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 13664256. Throughput: 0: 1778.2, 1: 1774.6. Samples: 3425872. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:02:31,876][101941] Avg episode reward: [(0, '5.350'), (1, '5.230')] +[2023-10-08 12:02:32,507][102898] Updated weights for policy 1, policy_version 6660 (0.0008) +[2023-10-08 12:02:32,878][102898] Updated weights for policy 1, policy_version 6670 (0.0009) +[2023-10-08 12:02:33,242][102898] Updated weights for policy 1, policy_version 6680 (0.0007) +[2023-10-08 12:02:34,931][102897] Updated weights for policy 0, policy_version 6690 (0.0007) +[2023-10-08 12:02:35,305][102897] Updated weights for policy 0, policy_version 6700 (0.0008) +[2023-10-08 12:02:35,673][102897] Updated weights for policy 0, policy_version 6710 (0.0007) +[2023-10-08 12:02:36,049][102897] Updated weights for policy 0, policy_version 6720 (0.0009) +[2023-10-08 12:02:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 13729792. Throughput: 0: 1790.9, 1: 1768.9. Samples: 3436940. Policy #0 lag: (min: 31.0, avg: 31.7, max: 49.0) +[2023-10-08 12:02:36,876][101941] Avg episode reward: [(0, '5.230'), (1, '5.050')] +[2023-10-08 12:02:37,079][102898] Updated weights for policy 1, policy_version 6690 (0.0008) +[2023-10-08 12:02:37,440][102898] Updated weights for policy 1, policy_version 6700 (0.0009) +[2023-10-08 12:02:37,808][102898] Updated weights for policy 1, policy_version 6710 (0.0010) +[2023-10-08 12:02:38,180][102898] Updated weights for policy 1, policy_version 6720 (0.0010) +[2023-10-08 12:02:39,803][102897] Updated weights for policy 0, policy_version 6730 (0.0008) +[2023-10-08 12:02:40,179][102897] Updated weights for policy 0, policy_version 6740 (0.0007) +[2023-10-08 12:02:40,563][102897] Updated weights for policy 0, policy_version 6750 (0.0008) +[2023-10-08 12:02:41,872][102898] Updated weights for policy 1, policy_version 6730 (0.0009) +[2023-10-08 12:02:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 13795328. Throughput: 0: 1788.8, 1: 1775.2. Samples: 3458002. Policy #0 lag: (min: 31.0, avg: 31.7, max: 49.0) +[2023-10-08 12:02:41,876][101941] Avg episode reward: [(0, '5.820'), (1, '4.810')] +[2023-10-08 12:02:42,248][102898] Updated weights for policy 1, policy_version 6740 (0.0009) +[2023-10-08 12:02:42,611][102898] Updated weights for policy 1, policy_version 6750 (0.0008) +[2023-10-08 12:02:44,409][102897] Updated weights for policy 0, policy_version 6760 (0.0008) +[2023-10-08 12:02:44,792][102897] Updated weights for policy 0, policy_version 6770 (0.0007) +[2023-10-08 12:02:45,167][102897] Updated weights for policy 0, policy_version 6780 (0.0007) +[2023-10-08 12:02:46,469][102898] Updated weights for policy 1, policy_version 6760 (0.0008) +[2023-10-08 12:02:46,845][102898] Updated weights for policy 1, policy_version 6770 (0.0007) +[2023-10-08 12:02:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 13860864. Throughput: 0: 1781.9, 1: 1798.3. Samples: 3479462. Policy #0 lag: (min: 31.0, avg: 40.3, max: 63.0) +[2023-10-08 12:02:46,876][101941] Avg episode reward: [(0, '6.150'), (1, '5.640')] +[2023-10-08 12:02:47,212][102898] Updated weights for policy 1, policy_version 6780 (0.0008) +[2023-10-08 12:02:48,902][102897] Updated weights for policy 0, policy_version 6790 (0.0009) +[2023-10-08 12:02:49,274][102897] Updated weights for policy 0, policy_version 6800 (0.0007) +[2023-10-08 12:02:49,651][102897] Updated weights for policy 0, policy_version 6810 (0.0008) +[2023-10-08 12:02:50,871][102898] Updated weights for policy 1, policy_version 6790 (0.0009) +[2023-10-08 12:02:51,248][102898] Updated weights for policy 1, policy_version 6800 (0.0007) +[2023-10-08 12:02:51,616][102898] Updated weights for policy 1, policy_version 6810 (0.0007) +[2023-10-08 12:02:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 13959168. Throughput: 0: 1793.5, 1: 1771.8. Samples: 3489980. Policy #0 lag: (min: 31.0, avg: 40.3, max: 63.0) +[2023-10-08 12:02:51,875][101941] Avg episode reward: [(0, '6.330'), (1, '5.240')] +[2023-10-08 12:02:53,475][102897] Updated weights for policy 0, policy_version 6820 (0.0010) +[2023-10-08 12:02:53,848][102897] Updated weights for policy 0, policy_version 6830 (0.0011) +[2023-10-08 12:02:54,214][102897] Updated weights for policy 0, policy_version 6840 (0.0010) +[2023-10-08 12:02:55,461][102898] Updated weights for policy 1, policy_version 6820 (0.0009) +[2023-10-08 12:02:55,829][102898] Updated weights for policy 1, policy_version 6830 (0.0010) +[2023-10-08 12:02:56,208][102898] Updated weights for policy 1, policy_version 6840 (0.0010) +[2023-10-08 12:02:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 14024704. Throughput: 0: 1777.1, 1: 1804.9. Samples: 3511550. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:02:56,876][101941] Avg episode reward: [(0, '6.110'), (1, '4.990')] +[2023-10-08 12:02:57,923][102897] Updated weights for policy 0, policy_version 6850 (0.0008) +[2023-10-08 12:02:58,301][102897] Updated weights for policy 0, policy_version 6860 (0.0010) +[2023-10-08 12:02:58,670][102897] Updated weights for policy 0, policy_version 6870 (0.0008) +[2023-10-08 12:02:59,048][102897] Updated weights for policy 0, policy_version 6880 (0.0011) +[2023-10-08 12:02:59,918][102898] Updated weights for policy 1, policy_version 6850 (0.0008) +[2023-10-08 12:03:00,280][102898] Updated weights for policy 1, policy_version 6860 (0.0009) +[2023-10-08 12:03:00,654][102898] Updated weights for policy 1, policy_version 6870 (0.0011) +[2023-10-08 12:03:01,027][102898] Updated weights for policy 1, policy_version 6880 (0.0010) +[2023-10-08 12:03:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 14090240. Throughput: 0: 1781.9, 1: 1783.1. Samples: 3533002. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:03:01,876][101941] Avg episode reward: [(0, '6.000'), (1, '5.360')] +[2023-10-08 12:03:02,860][102897] Updated weights for policy 0, policy_version 6890 (0.0008) +[2023-10-08 12:03:03,230][102897] Updated weights for policy 0, policy_version 6900 (0.0008) +[2023-10-08 12:03:03,605][102897] Updated weights for policy 0, policy_version 6910 (0.0007) +[2023-10-08 12:03:04,738][102898] Updated weights for policy 1, policy_version 6890 (0.0008) +[2023-10-08 12:03:05,103][102898] Updated weights for policy 1, policy_version 6900 (0.0009) +[2023-10-08 12:03:05,472][102898] Updated weights for policy 1, policy_version 6910 (0.0009) +[2023-10-08 12:03:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 14155776. Throughput: 0: 1781.9, 1: 1806.5. Samples: 3543970. Policy #0 lag: (min: 24.0, avg: 52.1, max: 56.0) +[2023-10-08 12:03:06,876][101941] Avg episode reward: [(0, '5.980'), (1, '5.290')] +[2023-10-08 12:03:07,278][102897] Updated weights for policy 0, policy_version 6920 (0.0008) +[2023-10-08 12:03:07,650][102897] Updated weights for policy 0, policy_version 6930 (0.0009) +[2023-10-08 12:03:08,017][102897] Updated weights for policy 0, policy_version 6940 (0.0009) +[2023-10-08 12:03:09,163][102898] Updated weights for policy 1, policy_version 6920 (0.0010) +[2023-10-08 12:03:09,531][102898] Updated weights for policy 1, policy_version 6930 (0.0010) +[2023-10-08 12:03:09,904][102898] Updated weights for policy 1, policy_version 6940 (0.0011) +[2023-10-08 12:03:11,690][102897] Updated weights for policy 0, policy_version 6950 (0.0008) +[2023-10-08 12:03:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 14221312. Throughput: 0: 1783.2, 1: 1780.6. Samples: 3565372. Policy #0 lag: (min: 24.0, avg: 52.1, max: 56.0) +[2023-10-08 12:03:11,876][101941] Avg episode reward: [(0, '6.010'), (1, '5.480')] +[2023-10-08 12:03:12,061][102897] Updated weights for policy 0, policy_version 6960 (0.0007) +[2023-10-08 12:03:12,424][102897] Updated weights for policy 0, policy_version 6970 (0.0008) +[2023-10-08 12:03:13,695][102898] Updated weights for policy 1, policy_version 6950 (0.0008) +[2023-10-08 12:03:14,059][102898] Updated weights for policy 1, policy_version 6960 (0.0008) +[2023-10-08 12:03:14,425][102898] Updated weights for policy 1, policy_version 6970 (0.0008) +[2023-10-08 12:03:16,073][102897] Updated weights for policy 0, policy_version 6980 (0.0007) +[2023-10-08 12:03:16,455][102897] Updated weights for policy 0, policy_version 6990 (0.0008) +[2023-10-08 12:03:16,824][102897] Updated weights for policy 0, policy_version 7000 (0.0008) +[2023-10-08 12:03:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 14286848. Throughput: 0: 1800.8, 1: 1779.1. Samples: 3586964. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 12:03:16,876][101941] Avg episode reward: [(0, '6.150'), (1, '5.580')] +[2023-10-08 12:03:18,345][102898] Updated weights for policy 1, policy_version 6980 (0.0009) +[2023-10-08 12:03:18,717][102898] Updated weights for policy 1, policy_version 6990 (0.0009) +[2023-10-08 12:03:19,098][102898] Updated weights for policy 1, policy_version 7000 (0.0010) +[2023-10-08 12:03:20,575][102897] Updated weights for policy 0, policy_version 7010 (0.0007) +[2023-10-08 12:03:20,951][102897] Updated weights for policy 0, policy_version 7020 (0.0008) +[2023-10-08 12:03:21,310][102897] Updated weights for policy 0, policy_version 7030 (0.0007) +[2023-10-08 12:03:21,689][102897] Updated weights for policy 0, policy_version 7040 (0.0008) +[2023-10-08 12:03:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 14385152. Throughput: 0: 1782.7, 1: 1776.0. Samples: 3597080. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:03:21,876][101941] Avg episode reward: [(0, '5.520'), (1, '5.070')] +[2023-10-08 12:03:22,818][102898] Updated weights for policy 1, policy_version 7010 (0.0010) +[2023-10-08 12:03:23,188][102898] Updated weights for policy 1, policy_version 7020 (0.0008) +[2023-10-08 12:03:23,565][102898] Updated weights for policy 1, policy_version 7030 (0.0011) +[2023-10-08 12:03:23,930][102898] Updated weights for policy 1, policy_version 7040 (0.0010) +[2023-10-08 12:03:25,413][102897] Updated weights for policy 0, policy_version 7050 (0.0009) +[2023-10-08 12:03:25,789][102897] Updated weights for policy 0, policy_version 7060 (0.0008) +[2023-10-08 12:03:26,166][102897] Updated weights for policy 0, policy_version 7070 (0.0007) +[2023-10-08 12:03:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 14450688. Throughput: 0: 1800.6, 1: 1779.1. Samples: 3619086. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:03:26,876][101941] Avg episode reward: [(0, '5.970'), (1, '5.000')] +[2023-10-08 12:03:27,811][102898] Updated weights for policy 1, policy_version 7050 (0.0008) +[2023-10-08 12:03:28,172][102898] Updated weights for policy 1, policy_version 7060 (0.0008) +[2023-10-08 12:03:28,546][102898] Updated weights for policy 1, policy_version 7070 (0.0007) +[2023-10-08 12:03:30,150][102897] Updated weights for policy 0, policy_version 7080 (0.0009) +[2023-10-08 12:03:30,530][102897] Updated weights for policy 0, policy_version 7090 (0.0010) +[2023-10-08 12:03:30,908][102897] Updated weights for policy 0, policy_version 7100 (0.0009) +[2023-10-08 12:03:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 14516224. Throughput: 0: 1780.0, 1: 1785.6. Samples: 3639916. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 12:03:31,875][101941] Avg episode reward: [(0, '5.710'), (1, '5.520')] +[2023-10-08 12:03:32,292][102898] Updated weights for policy 1, policy_version 7080 (0.0010) +[2023-10-08 12:03:32,661][102898] Updated weights for policy 1, policy_version 7090 (0.0007) +[2023-10-08 12:03:33,030][102898] Updated weights for policy 1, policy_version 7100 (0.0007) +[2023-10-08 12:03:34,698][102897] Updated weights for policy 0, policy_version 7110 (0.0008) +[2023-10-08 12:03:35,069][102897] Updated weights for policy 0, policy_version 7120 (0.0007) +[2023-10-08 12:03:35,444][102897] Updated weights for policy 0, policy_version 7130 (0.0007) +[2023-10-08 12:03:36,848][102898] Updated weights for policy 1, policy_version 7110 (0.0008) +[2023-10-08 12:03:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 14581760. Throughput: 0: 1801.6, 1: 1779.3. Samples: 3651122. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 12:03:36,876][101941] Avg episode reward: [(0, '6.400'), (1, '5.550')] +[2023-10-08 12:03:37,223][102898] Updated weights for policy 1, policy_version 7120 (0.0009) +[2023-10-08 12:03:37,590][102898] Updated weights for policy 1, policy_version 7130 (0.0007) +[2023-10-08 12:03:39,122][102897] Updated weights for policy 0, policy_version 7140 (0.0009) +[2023-10-08 12:03:39,494][102897] Updated weights for policy 0, policy_version 7150 (0.0010) +[2023-10-08 12:03:39,872][102897] Updated weights for policy 0, policy_version 7160 (0.0009) +[2023-10-08 12:03:41,451][102898] Updated weights for policy 1, policy_version 7140 (0.0008) +[2023-10-08 12:03:41,817][102898] Updated weights for policy 1, policy_version 7150 (0.0008) +[2023-10-08 12:03:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 14647296. Throughput: 0: 1787.6, 1: 1777.9. Samples: 3671998. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:03:41,875][101941] Avg episode reward: [(0, '6.720'), (1, '5.020')] +[2023-10-08 12:03:42,185][102898] Updated weights for policy 1, policy_version 7160 (0.0008) +[2023-10-08 12:03:43,643][102897] Updated weights for policy 0, policy_version 7170 (0.0008) +[2023-10-08 12:03:44,020][102897] Updated weights for policy 0, policy_version 7180 (0.0007) +[2023-10-08 12:03:44,398][102897] Updated weights for policy 0, policy_version 7190 (0.0008) +[2023-10-08 12:03:44,761][102897] Updated weights for policy 0, policy_version 7200 (0.0009) +[2023-10-08 12:03:45,816][102898] Updated weights for policy 1, policy_version 7170 (0.0009) +[2023-10-08 12:03:46,184][102898] Updated weights for policy 1, policy_version 7180 (0.0010) +[2023-10-08 12:03:46,554][102898] Updated weights for policy 1, policy_version 7190 (0.0009) +[2023-10-08 12:03:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 14712832. Throughput: 0: 1786.3, 1: 1790.0. Samples: 3693934. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:03:46,876][101941] Avg episode reward: [(0, '6.260'), (1, '5.450')] +[2023-10-08 12:03:46,922][102898] Updated weights for policy 1, policy_version 7200 (0.0007) +[2023-10-08 12:03:48,578][102897] Updated weights for policy 0, policy_version 7210 (0.0008) +[2023-10-08 12:03:48,950][102897] Updated weights for policy 0, policy_version 7220 (0.0008) +[2023-10-08 12:03:49,325][102897] Updated weights for policy 0, policy_version 7230 (0.0007) +[2023-10-08 12:03:50,620][102898] Updated weights for policy 1, policy_version 7210 (0.0007) +[2023-10-08 12:03:50,987][102898] Updated weights for policy 1, policy_version 7220 (0.0009) +[2023-10-08 12:03:51,364][102898] Updated weights for policy 1, policy_version 7230 (0.0007) +[2023-10-08 12:03:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 14811136. Throughput: 0: 1786.4, 1: 1782.8. Samples: 3704584. Policy #0 lag: (min: 29.0, avg: 29.4, max: 42.0) +[2023-10-08 12:03:51,875][101941] Avg episode reward: [(0, '5.660'), (1, '5.960')] +[2023-10-08 12:03:52,966][102897] Updated weights for policy 0, policy_version 7240 (0.0007) +[2023-10-08 12:03:53,335][102897] Updated weights for policy 0, policy_version 7250 (0.0007) +[2023-10-08 12:03:53,701][102897] Updated weights for policy 0, policy_version 7260 (0.0007) +[2023-10-08 12:03:55,012][102898] Updated weights for policy 1, policy_version 7240 (0.0009) +[2023-10-08 12:03:55,370][102898] Updated weights for policy 1, policy_version 7250 (0.0010) +[2023-10-08 12:03:55,732][102898] Updated weights for policy 1, policy_version 7260 (0.0009) +[2023-10-08 12:03:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 14876672. Throughput: 0: 1784.8, 1: 1788.9. Samples: 3726188. Policy #0 lag: (min: 29.0, avg: 29.4, max: 42.0) +[2023-10-08 12:03:56,876][101941] Avg episode reward: [(0, '5.850'), (1, '5.540')] +[2023-10-08 12:03:57,488][102897] Updated weights for policy 0, policy_version 7270 (0.0009) +[2023-10-08 12:03:57,861][102897] Updated weights for policy 0, policy_version 7280 (0.0009) +[2023-10-08 12:03:58,237][102897] Updated weights for policy 0, policy_version 7290 (0.0009) +[2023-10-08 12:03:59,394][102898] Updated weights for policy 1, policy_version 7270 (0.0008) +[2023-10-08 12:03:59,760][102898] Updated weights for policy 1, policy_version 7280 (0.0010) +[2023-10-08 12:04:00,132][102898] Updated weights for policy 1, policy_version 7290 (0.0009) +[2023-10-08 12:04:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 14942208. Throughput: 0: 1795.2, 1: 1783.0. Samples: 3747982. Policy #0 lag: (min: 1.0, avg: 6.2, max: 33.0) +[2023-10-08 12:04:01,876][101941] Avg episode reward: [(0, '5.790'), (1, '5.660')] +[2023-10-08 12:04:01,962][102897] Updated weights for policy 0, policy_version 7300 (0.0009) +[2023-10-08 12:04:02,330][102897] Updated weights for policy 0, policy_version 7310 (0.0007) +[2023-10-08 12:04:02,701][102897] Updated weights for policy 0, policy_version 7320 (0.0007) +[2023-10-08 12:04:03,923][102898] Updated weights for policy 1, policy_version 7300 (0.0010) +[2023-10-08 12:04:04,292][102898] Updated weights for policy 1, policy_version 7310 (0.0011) +[2023-10-08 12:04:04,652][102898] Updated weights for policy 1, policy_version 7320 (0.0009) +[2023-10-08 12:04:06,516][102897] Updated weights for policy 0, policy_version 7330 (0.0010) +[2023-10-08 12:04:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 15007744. Throughput: 0: 1781.3, 1: 1806.7. Samples: 3758542. Policy #0 lag: (min: 1.0, avg: 6.2, max: 33.0) +[2023-10-08 12:04:06,875][101941] Avg episode reward: [(0, '5.520'), (1, '5.540')] +[2023-10-08 12:04:06,884][102897] Updated weights for policy 0, policy_version 7340 (0.0010) +[2023-10-08 12:04:07,266][102897] Updated weights for policy 0, policy_version 7350 (0.0010) +[2023-10-08 12:04:07,625][102897] Updated weights for policy 0, policy_version 7360 (0.0010) +[2023-10-08 12:04:08,416][102898] Updated weights for policy 1, policy_version 7330 (0.0010) +[2023-10-08 12:04:08,776][102898] Updated weights for policy 1, policy_version 7340 (0.0008) +[2023-10-08 12:04:09,146][102898] Updated weights for policy 1, policy_version 7350 (0.0010) +[2023-10-08 12:04:09,516][102898] Updated weights for policy 1, policy_version 7360 (0.0009) +[2023-10-08 12:04:11,407][102897] Updated weights for policy 0, policy_version 7370 (0.0008) +[2023-10-08 12:04:11,778][102897] Updated weights for policy 0, policy_version 7380 (0.0008) +[2023-10-08 12:04:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 15073280. Throughput: 0: 1791.4, 1: 1792.1. Samples: 3780342. Policy #0 lag: (min: 13.0, avg: 23.6, max: 45.0) +[2023-10-08 12:04:11,875][101941] Avg episode reward: [(0, '5.920'), (1, '5.770')] +[2023-10-08 12:04:12,151][102897] Updated weights for policy 0, policy_version 7390 (0.0009) +[2023-10-08 12:04:13,358][102898] Updated weights for policy 1, policy_version 7370 (0.0008) +[2023-10-08 12:04:13,729][102898] Updated weights for policy 1, policy_version 7380 (0.0011) +[2023-10-08 12:04:14,103][102898] Updated weights for policy 1, policy_version 7390 (0.0009) +[2023-10-08 12:04:16,139][102897] Updated weights for policy 0, policy_version 7400 (0.0009) +[2023-10-08 12:04:16,514][102897] Updated weights for policy 0, policy_version 7410 (0.0009) +[2023-10-08 12:04:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 15138816. Throughput: 0: 1801.7, 1: 1799.7. Samples: 3801982. Policy #0 lag: (min: 13.0, avg: 23.6, max: 45.0) +[2023-10-08 12:04:16,876][101941] Avg episode reward: [(0, '6.340'), (1, '5.830')] +[2023-10-08 12:04:16,885][102897] Updated weights for policy 0, policy_version 7420 (0.0007) +[2023-10-08 12:04:16,891][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000007392_7569408.pth... +[2023-10-08 12:04:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000005728_5865472.pth +[2023-10-08 12:04:17,035][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000007424_7602176.pth... +[2023-10-08 12:04:17,066][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000005728_5865472.pth +[2023-10-08 12:04:17,747][102898] Updated weights for policy 1, policy_version 7400 (0.0009) +[2023-10-08 12:04:18,111][102898] Updated weights for policy 1, policy_version 7410 (0.0007) +[2023-10-08 12:04:18,477][102898] Updated weights for policy 1, policy_version 7420 (0.0010) +[2023-10-08 12:04:20,518][102897] Updated weights for policy 0, policy_version 7430 (0.0008) +[2023-10-08 12:04:20,896][102897] Updated weights for policy 0, policy_version 7440 (0.0008) +[2023-10-08 12:04:21,258][102897] Updated weights for policy 0, policy_version 7450 (0.0008) +[2023-10-08 12:04:21,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 15237120. Throughput: 0: 1783.1, 1: 1800.3. Samples: 3812378. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:04:21,876][101941] Avg episode reward: [(0, '6.410'), (1, '5.180')] +[2023-10-08 12:04:22,413][102898] Updated weights for policy 1, policy_version 7430 (0.0009) +[2023-10-08 12:04:22,779][102898] Updated weights for policy 1, policy_version 7440 (0.0011) +[2023-10-08 12:04:23,147][102898] Updated weights for policy 1, policy_version 7450 (0.0008) +[2023-10-08 12:04:24,945][102897] Updated weights for policy 0, policy_version 7460 (0.0007) +[2023-10-08 12:04:25,317][102897] Updated weights for policy 0, policy_version 7470 (0.0008) +[2023-10-08 12:04:25,694][102897] Updated weights for policy 0, policy_version 7480 (0.0011) +[2023-10-08 12:04:26,840][102898] Updated weights for policy 1, policy_version 7460 (0.0008) +[2023-10-08 12:04:26,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 15302656. Throughput: 0: 1799.5, 1: 1801.4. Samples: 3834038. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 12:04:26,875][101941] Avg episode reward: [(0, '6.820'), (1, '4.810')] +[2023-10-08 12:04:26,876][102634] Saving new best policy, reward=6.820! +[2023-10-08 12:04:27,207][102898] Updated weights for policy 1, policy_version 7470 (0.0007) +[2023-10-08 12:04:27,571][102898] Updated weights for policy 1, policy_version 7480 (0.0007) +[2023-10-08 12:04:29,470][102897] Updated weights for policy 0, policy_version 7490 (0.0009) +[2023-10-08 12:04:29,839][102897] Updated weights for policy 0, policy_version 7500 (0.0007) +[2023-10-08 12:04:30,222][102897] Updated weights for policy 0, policy_version 7510 (0.0007) +[2023-10-08 12:04:30,598][102897] Updated weights for policy 0, policy_version 7520 (0.0008) +[2023-10-08 12:04:31,121][102898] Updated weights for policy 1, policy_version 7490 (0.0011) +[2023-10-08 12:04:31,480][102898] Updated weights for policy 1, policy_version 7500 (0.0010) +[2023-10-08 12:04:31,852][102898] Updated weights for policy 1, policy_version 7510 (0.0007) +[2023-10-08 12:04:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 15368192. Throughput: 0: 1777.0, 1: 1807.6. Samples: 3855244. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 12:04:31,875][101941] Avg episode reward: [(0, '6.800'), (1, '4.850')] +[2023-10-08 12:04:32,225][102898] Updated weights for policy 1, policy_version 7520 (0.0008) +[2023-10-08 12:04:34,282][102897] Updated weights for policy 0, policy_version 7530 (0.0010) +[2023-10-08 12:04:34,654][102897] Updated weights for policy 0, policy_version 7540 (0.0007) +[2023-10-08 12:04:35,030][102897] Updated weights for policy 0, policy_version 7550 (0.0007) +[2023-10-08 12:04:35,984][102898] Updated weights for policy 1, policy_version 7530 (0.0007) +[2023-10-08 12:04:36,352][102898] Updated weights for policy 1, policy_version 7540 (0.0008) +[2023-10-08 12:04:36,726][102898] Updated weights for policy 1, policy_version 7550 (0.0007) +[2023-10-08 12:04:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 15466496. Throughput: 0: 1796.2, 1: 1801.7. Samples: 3866488. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 12:04:36,875][101941] Avg episode reward: [(0, '6.230'), (1, '4.970')] +[2023-10-08 12:04:38,872][102897] Updated weights for policy 0, policy_version 7560 (0.0009) +[2023-10-08 12:04:39,240][102897] Updated weights for policy 0, policy_version 7570 (0.0009) +[2023-10-08 12:04:39,616][102897] Updated weights for policy 0, policy_version 7580 (0.0009) +[2023-10-08 12:04:40,438][102898] Updated weights for policy 1, policy_version 7560 (0.0007) +[2023-10-08 12:04:40,801][102898] Updated weights for policy 1, policy_version 7570 (0.0011) +[2023-10-08 12:04:41,176][102898] Updated weights for policy 1, policy_version 7580 (0.0007) +[2023-10-08 12:04:41,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 15532032. Throughput: 0: 1773.1, 1: 1814.1. Samples: 3887614. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 12:04:41,877][101941] Avg episode reward: [(0, '6.290'), (1, '4.670')] +[2023-10-08 12:04:43,437][102897] Updated weights for policy 0, policy_version 7590 (0.0009) +[2023-10-08 12:04:43,806][102897] Updated weights for policy 0, policy_version 7600 (0.0008) +[2023-10-08 12:04:44,183][102897] Updated weights for policy 0, policy_version 7610 (0.0009) +[2023-10-08 12:04:44,892][102898] Updated weights for policy 1, policy_version 7590 (0.0010) +[2023-10-08 12:04:45,261][102898] Updated weights for policy 1, policy_version 7600 (0.0009) +[2023-10-08 12:04:45,626][102898] Updated weights for policy 1, policy_version 7610 (0.0007) +[2023-10-08 12:04:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 15597568. Throughput: 0: 1780.1, 1: 1800.9. Samples: 3909126. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:04:46,876][101941] Avg episode reward: [(0, '6.070'), (1, '4.630')] +[2023-10-08 12:04:47,780][102897] Updated weights for policy 0, policy_version 7620 (0.0009) +[2023-10-08 12:04:48,149][102897] Updated weights for policy 0, policy_version 7630 (0.0010) +[2023-10-08 12:04:48,520][102897] Updated weights for policy 0, policy_version 7640 (0.0011) +[2023-10-08 12:04:49,432][102898] Updated weights for policy 1, policy_version 7620 (0.0008) +[2023-10-08 12:04:49,815][102898] Updated weights for policy 1, policy_version 7630 (0.0010) +[2023-10-08 12:04:50,181][102898] Updated weights for policy 1, policy_version 7640 (0.0009) +[2023-10-08 12:04:51,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 15663104. Throughput: 0: 1779.7, 1: 1807.5. Samples: 3919968. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:04:51,876][101941] Avg episode reward: [(0, '6.690'), (1, '4.700')] +[2023-10-08 12:04:52,490][102897] Updated weights for policy 0, policy_version 7650 (0.0009) +[2023-10-08 12:04:52,857][102897] Updated weights for policy 0, policy_version 7660 (0.0008) +[2023-10-08 12:04:53,231][102897] Updated weights for policy 0, policy_version 7670 (0.0008) +[2023-10-08 12:04:53,608][102897] Updated weights for policy 0, policy_version 7680 (0.0009) +[2023-10-08 12:04:54,050][102898] Updated weights for policy 1, policy_version 7650 (0.0008) +[2023-10-08 12:04:54,419][102898] Updated weights for policy 1, policy_version 7660 (0.0008) +[2023-10-08 12:04:54,782][102898] Updated weights for policy 1, policy_version 7670 (0.0007) +[2023-10-08 12:04:55,148][102898] Updated weights for policy 1, policy_version 7680 (0.0008) +[2023-10-08 12:04:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 15728640. Throughput: 0: 1776.8, 1: 1791.9. Samples: 3940932. Policy #0 lag: (min: 25.0, avg: 34.9, max: 57.0) +[2023-10-08 12:04:56,875][101941] Avg episode reward: [(0, '5.520'), (1, '4.750')] +[2023-10-08 12:04:57,350][102897] Updated weights for policy 0, policy_version 7690 (0.0007) +[2023-10-08 12:04:57,719][102897] Updated weights for policy 0, policy_version 7700 (0.0007) +[2023-10-08 12:04:58,091][102897] Updated weights for policy 0, policy_version 7710 (0.0007) +[2023-10-08 12:04:58,938][102898] Updated weights for policy 1, policy_version 7690 (0.0007) +[2023-10-08 12:04:59,311][102898] Updated weights for policy 1, policy_version 7700 (0.0008) +[2023-10-08 12:04:59,673][102898] Updated weights for policy 1, policy_version 7710 (0.0009) +[2023-10-08 12:05:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 15794176. Throughput: 0: 1798.2, 1: 1787.4. Samples: 3963334. Policy #0 lag: (min: 25.0, avg: 34.9, max: 57.0) +[2023-10-08 12:05:01,875][101941] Avg episode reward: [(0, '5.200'), (1, '5.480')] +[2023-10-08 12:05:02,025][102897] Updated weights for policy 0, policy_version 7720 (0.0010) +[2023-10-08 12:05:02,412][102897] Updated weights for policy 0, policy_version 7730 (0.0010) +[2023-10-08 12:05:02,791][102897] Updated weights for policy 0, policy_version 7740 (0.0011) +[2023-10-08 12:05:03,175][102898] Updated weights for policy 1, policy_version 7720 (0.0008) +[2023-10-08 12:05:03,538][102898] Updated weights for policy 1, policy_version 7730 (0.0007) +[2023-10-08 12:05:03,903][102898] Updated weights for policy 1, policy_version 7740 (0.0007) +[2023-10-08 12:05:06,422][102897] Updated weights for policy 0, policy_version 7750 (0.0007) +[2023-10-08 12:05:06,801][102897] Updated weights for policy 0, policy_version 7760 (0.0008) +[2023-10-08 12:05:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 15859712. Throughput: 0: 1782.5, 1: 1790.7. Samples: 3973170. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 12:05:06,875][101941] Avg episode reward: [(0, '5.270'), (1, '5.270')] +[2023-10-08 12:05:07,168][102897] Updated weights for policy 0, policy_version 7770 (0.0007) +[2023-10-08 12:05:07,793][102898] Updated weights for policy 1, policy_version 7750 (0.0008) +[2023-10-08 12:05:08,178][102898] Updated weights for policy 1, policy_version 7760 (0.0007) +[2023-10-08 12:05:08,553][102898] Updated weights for policy 1, policy_version 7770 (0.0008) +[2023-10-08 12:05:10,804][102897] Updated weights for policy 0, policy_version 7780 (0.0007) +[2023-10-08 12:05:11,185][102897] Updated weights for policy 0, policy_version 7790 (0.0007) +[2023-10-08 12:05:11,557][102897] Updated weights for policy 0, policy_version 7800 (0.0008) +[2023-10-08 12:05:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 15958016. Throughput: 0: 1791.7, 1: 1794.6. Samples: 3995420. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:05:11,875][101941] Avg episode reward: [(0, '5.760'), (1, '5.550')] +[2023-10-08 12:05:12,270][102898] Updated weights for policy 1, policy_version 7780 (0.0008) +[2023-10-08 12:05:12,648][102898] Updated weights for policy 1, policy_version 7790 (0.0009) +[2023-10-08 12:05:13,022][102898] Updated weights for policy 1, policy_version 7800 (0.0009) +[2023-10-08 12:05:15,287][102897] Updated weights for policy 0, policy_version 7810 (0.0009) +[2023-10-08 12:05:15,659][102897] Updated weights for policy 0, policy_version 7820 (0.0007) +[2023-10-08 12:05:16,037][102897] Updated weights for policy 0, policy_version 7830 (0.0008) +[2023-10-08 12:05:16,397][102897] Updated weights for policy 0, policy_version 7840 (0.0008) +[2023-10-08 12:05:16,699][102898] Updated weights for policy 1, policy_version 7810 (0.0010) +[2023-10-08 12:05:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 16023552. Throughput: 0: 1780.8, 1: 1802.8. Samples: 4016502. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:05:16,875][101941] Avg episode reward: [(0, '5.280'), (1, '6.010')] +[2023-10-08 12:05:17,055][102898] Updated weights for policy 1, policy_version 7820 (0.0008) +[2023-10-08 12:05:17,426][102898] Updated weights for policy 1, policy_version 7830 (0.0010) +[2023-10-08 12:05:17,789][102898] Updated weights for policy 1, policy_version 7840 (0.0008) +[2023-10-08 12:05:20,190][102897] Updated weights for policy 0, policy_version 7850 (0.0010) +[2023-10-08 12:05:20,554][102897] Updated weights for policy 0, policy_version 7860 (0.0010) +[2023-10-08 12:05:20,925][102897] Updated weights for policy 0, policy_version 7870 (0.0008) +[2023-10-08 12:05:21,602][102898] Updated weights for policy 1, policy_version 7850 (0.0007) +[2023-10-08 12:05:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 16089088. Throughput: 0: 1793.6, 1: 1785.8. Samples: 4027560. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:05:21,875][101941] Avg episode reward: [(0, '5.580'), (1, '5.500')] +[2023-10-08 12:05:21,962][102898] Updated weights for policy 1, policy_version 7860 (0.0009) +[2023-10-08 12:05:22,334][102898] Updated weights for policy 1, policy_version 7870 (0.0009) +[2023-10-08 12:05:24,511][102897] Updated weights for policy 0, policy_version 7880 (0.0007) +[2023-10-08 12:05:24,885][102897] Updated weights for policy 0, policy_version 7890 (0.0007) +[2023-10-08 12:05:25,257][102897] Updated weights for policy 0, policy_version 7900 (0.0007) +[2023-10-08 12:05:26,156][102898] Updated weights for policy 1, policy_version 7880 (0.0008) +[2023-10-08 12:05:26,531][102898] Updated weights for policy 1, policy_version 7890 (0.0008) +[2023-10-08 12:05:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 16154624. Throughput: 0: 1787.7, 1: 1797.2. Samples: 4048938. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:05:26,876][101941] Avg episode reward: [(0, '5.650'), (1, '5.460')] +[2023-10-08 12:05:26,895][102898] Updated weights for policy 1, policy_version 7900 (0.0009) +[2023-10-08 12:05:29,191][102897] Updated weights for policy 0, policy_version 7910 (0.0009) +[2023-10-08 12:05:29,568][102897] Updated weights for policy 0, policy_version 7920 (0.0009) +[2023-10-08 12:05:29,944][102897] Updated weights for policy 0, policy_version 7930 (0.0007) +[2023-10-08 12:05:30,743][102898] Updated weights for policy 1, policy_version 7910 (0.0008) +[2023-10-08 12:05:31,112][102898] Updated weights for policy 1, policy_version 7920 (0.0010) +[2023-10-08 12:05:31,474][102898] Updated weights for policy 1, policy_version 7930 (0.0009) +[2023-10-08 12:05:31,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 16252928. Throughput: 0: 1784.7, 1: 1790.5. Samples: 4070012. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 12:05:31,876][101941] Avg episode reward: [(0, '5.750'), (1, '5.280')] +[2023-10-08 12:05:33,728][102897] Updated weights for policy 0, policy_version 7940 (0.0007) +[2023-10-08 12:05:34,115][102897] Updated weights for policy 0, policy_version 7950 (0.0008) +[2023-10-08 12:05:34,491][102897] Updated weights for policy 0, policy_version 7960 (0.0007) +[2023-10-08 12:05:35,099][102898] Updated weights for policy 1, policy_version 7940 (0.0008) +[2023-10-08 12:05:35,463][102898] Updated weights for policy 1, policy_version 7950 (0.0009) +[2023-10-08 12:05:35,831][102898] Updated weights for policy 1, policy_version 7960 (0.0010) +[2023-10-08 12:05:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 16318464. Throughput: 0: 1796.7, 1: 1791.8. Samples: 4081450. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 12:05:36,876][101941] Avg episode reward: [(0, '5.550'), (1, '5.340')] +[2023-10-08 12:05:38,277][102897] Updated weights for policy 0, policy_version 7970 (0.0007) +[2023-10-08 12:05:38,633][102897] Updated weights for policy 0, policy_version 7980 (0.0007) +[2023-10-08 12:05:39,004][102897] Updated weights for policy 0, policy_version 7990 (0.0009) +[2023-10-08 12:05:39,372][102897] Updated weights for policy 0, policy_version 8000 (0.0010) +[2023-10-08 12:05:39,512][102898] Updated weights for policy 1, policy_version 7970 (0.0009) +[2023-10-08 12:05:39,885][102898] Updated weights for policy 1, policy_version 7980 (0.0008) +[2023-10-08 12:05:40,246][102898] Updated weights for policy 1, policy_version 7990 (0.0010) +[2023-10-08 12:05:40,614][102898] Updated weights for policy 1, policy_version 8000 (0.0007) +[2023-10-08 12:05:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 16384000. Throughput: 0: 1784.9, 1: 1797.5. Samples: 4102140. Policy #0 lag: (min: 1.0, avg: 5.7, max: 33.0) +[2023-10-08 12:05:41,876][101941] Avg episode reward: [(0, '6.300'), (1, '5.260')] +[2023-10-08 12:05:43,049][102897] Updated weights for policy 0, policy_version 8010 (0.0007) +[2023-10-08 12:05:43,409][102897] Updated weights for policy 0, policy_version 8020 (0.0007) +[2023-10-08 12:05:43,787][102897] Updated weights for policy 0, policy_version 8030 (0.0009) +[2023-10-08 12:05:44,382][102898] Updated weights for policy 1, policy_version 8010 (0.0007) +[2023-10-08 12:05:44,744][102898] Updated weights for policy 1, policy_version 8020 (0.0007) +[2023-10-08 12:05:45,113][102898] Updated weights for policy 1, policy_version 8030 (0.0008) +[2023-10-08 12:05:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 16449536. Throughput: 0: 1788.4, 1: 1791.1. Samples: 4124412. Policy #0 lag: (min: 1.0, avg: 5.7, max: 33.0) +[2023-10-08 12:05:46,876][101941] Avg episode reward: [(0, '6.620'), (1, '5.190')] +[2023-10-08 12:05:47,528][102897] Updated weights for policy 0, policy_version 8040 (0.0009) +[2023-10-08 12:05:47,913][102897] Updated weights for policy 0, policy_version 8050 (0.0010) +[2023-10-08 12:05:48,289][102897] Updated weights for policy 0, policy_version 8060 (0.0008) +[2023-10-08 12:05:48,897][102898] Updated weights for policy 1, policy_version 8040 (0.0009) +[2023-10-08 12:05:49,264][102898] Updated weights for policy 1, policy_version 8050 (0.0009) +[2023-10-08 12:05:49,643][102898] Updated weights for policy 1, policy_version 8060 (0.0010) +[2023-10-08 12:05:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 16515072. Throughput: 0: 1783.9, 1: 1802.0. Samples: 4134534. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 12:05:51,876][101941] Avg episode reward: [(0, '6.280'), (1, '5.230')] +[2023-10-08 12:05:52,221][102897] Updated weights for policy 0, policy_version 8070 (0.0009) +[2023-10-08 12:05:52,589][102897] Updated weights for policy 0, policy_version 8080 (0.0008) +[2023-10-08 12:05:52,957][102897] Updated weights for policy 0, policy_version 8090 (0.0010) +[2023-10-08 12:05:53,456][102898] Updated weights for policy 1, policy_version 8070 (0.0009) +[2023-10-08 12:05:53,826][102898] Updated weights for policy 1, policy_version 8080 (0.0010) +[2023-10-08 12:05:54,203][102898] Updated weights for policy 1, policy_version 8090 (0.0008) +[2023-10-08 12:05:56,694][102897] Updated weights for policy 0, policy_version 8100 (0.0009) +[2023-10-08 12:05:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 16580608. Throughput: 0: 1787.3, 1: 1792.1. Samples: 4156496. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 12:05:56,876][101941] Avg episode reward: [(0, '5.410'), (1, '5.430')] +[2023-10-08 12:05:57,073][102897] Updated weights for policy 0, policy_version 8110 (0.0010) +[2023-10-08 12:05:57,434][102897] Updated weights for policy 0, policy_version 8120 (0.0008) +[2023-10-08 12:05:57,837][102898] Updated weights for policy 1, policy_version 8100 (0.0009) +[2023-10-08 12:05:58,222][102898] Updated weights for policy 1, policy_version 8110 (0.0010) +[2023-10-08 12:05:58,588][102898] Updated weights for policy 1, policy_version 8120 (0.0008) +[2023-10-08 12:06:01,158][102897] Updated weights for policy 0, policy_version 8130 (0.0009) +[2023-10-08 12:06:01,524][102897] Updated weights for policy 0, policy_version 8140 (0.0007) +[2023-10-08 12:06:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 16646144. Throughput: 0: 1808.5, 1: 1789.5. Samples: 4178412. Policy #0 lag: (min: 2.0, avg: 7.8, max: 34.0) +[2023-10-08 12:06:01,876][101941] Avg episode reward: [(0, '5.390'), (1, '5.350')] +[2023-10-08 12:06:01,902][102897] Updated weights for policy 0, policy_version 8150 (0.0008) +[2023-10-08 12:06:02,269][102897] Updated weights for policy 0, policy_version 8160 (0.0008) +[2023-10-08 12:06:02,435][102898] Updated weights for policy 1, policy_version 8130 (0.0009) +[2023-10-08 12:06:02,803][102898] Updated weights for policy 1, policy_version 8140 (0.0009) +[2023-10-08 12:06:03,168][102898] Updated weights for policy 1, policy_version 8150 (0.0009) +[2023-10-08 12:06:03,538][102898] Updated weights for policy 1, policy_version 8160 (0.0009) +[2023-10-08 12:06:05,986][102897] Updated weights for policy 0, policy_version 8170 (0.0009) +[2023-10-08 12:06:06,355][102897] Updated weights for policy 0, policy_version 8180 (0.0008) +[2023-10-08 12:06:06,729][102897] Updated weights for policy 0, policy_version 8190 (0.0008) +[2023-10-08 12:06:06,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 16744448. Throughput: 0: 1788.0, 1: 1790.4. Samples: 4188588. Policy #0 lag: (min: 15.0, avg: 22.9, max: 47.0) +[2023-10-08 12:06:06,875][101941] Avg episode reward: [(0, '6.070'), (1, '4.940')] +[2023-10-08 12:06:07,269][102898] Updated weights for policy 1, policy_version 8170 (0.0008) +[2023-10-08 12:06:07,642][102898] Updated weights for policy 1, policy_version 8180 (0.0011) +[2023-10-08 12:06:08,014][102898] Updated weights for policy 1, policy_version 8190 (0.0009) +[2023-10-08 12:06:10,514][102897] Updated weights for policy 0, policy_version 8200 (0.0008) +[2023-10-08 12:06:10,889][102897] Updated weights for policy 0, policy_version 8210 (0.0007) +[2023-10-08 12:06:11,254][102897] Updated weights for policy 0, policy_version 8220 (0.0008) +[2023-10-08 12:06:11,812][102898] Updated weights for policy 1, policy_version 8200 (0.0009) +[2023-10-08 12:06:11,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 16809984. Throughput: 0: 1809.8, 1: 1786.9. Samples: 4210790. Policy #0 lag: (min: 15.0, avg: 22.9, max: 47.0) +[2023-10-08 12:06:11,876][101941] Avg episode reward: [(0, '6.840'), (1, '5.050')] +[2023-10-08 12:06:11,877][102634] Saving new best policy, reward=6.840! +[2023-10-08 12:06:12,181][102898] Updated weights for policy 1, policy_version 8210 (0.0008) +[2023-10-08 12:06:12,540][102898] Updated weights for policy 1, policy_version 8220 (0.0007) +[2023-10-08 12:06:14,736][102897] Updated weights for policy 0, policy_version 8230 (0.0007) +[2023-10-08 12:06:15,103][102897] Updated weights for policy 0, policy_version 8240 (0.0007) +[2023-10-08 12:06:15,476][102897] Updated weights for policy 0, policy_version 8250 (0.0009) +[2023-10-08 12:06:16,312][102898] Updated weights for policy 1, policy_version 8230 (0.0007) +[2023-10-08 12:06:16,681][102898] Updated weights for policy 1, policy_version 8240 (0.0009) +[2023-10-08 12:06:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 16875520. Throughput: 0: 1787.4, 1: 1806.7. Samples: 4231746. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 12:06:16,875][101941] Avg episode reward: [(0, '5.900'), (1, '5.630')] +[2023-10-08 12:06:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000008256_8454144.pth... +[2023-10-08 12:06:16,912][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000006592_6750208.pth +[2023-10-08 12:06:16,916][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000008256_8454144.pth +[2023-10-08 12:06:17,045][102898] Updated weights for policy 1, policy_version 8250 (0.0007) +[2023-10-08 12:06:17,266][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000008256_8454144.pth... +[2023-10-08 12:06:17,294][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000006560_6717440.pth +[2023-10-08 12:06:17,298][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000008256_8454144.pth +[2023-10-08 12:06:19,240][102897] Updated weights for policy 0, policy_version 8260 (0.0010) +[2023-10-08 12:06:19,614][102897] Updated weights for policy 0, policy_version 8270 (0.0008) +[2023-10-08 12:06:19,991][102897] Updated weights for policy 0, policy_version 8280 (0.0007) +[2023-10-08 12:06:20,866][102898] Updated weights for policy 1, policy_version 8260 (0.0008) +[2023-10-08 12:06:21,239][102898] Updated weights for policy 1, policy_version 8270 (0.0008) +[2023-10-08 12:06:21,602][102898] Updated weights for policy 1, policy_version 8280 (0.0008) +[2023-10-08 12:06:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 16941056. Throughput: 0: 1805.9, 1: 1787.2. Samples: 4243140. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 12:06:21,876][101941] Avg episode reward: [(0, '5.170'), (1, '5.440')] +[2023-10-08 12:06:23,897][102897] Updated weights for policy 0, policy_version 8290 (0.0007) +[2023-10-08 12:06:24,267][102897] Updated weights for policy 0, policy_version 8300 (0.0007) +[2023-10-08 12:06:24,648][102897] Updated weights for policy 0, policy_version 8310 (0.0007) +[2023-10-08 12:06:25,021][102897] Updated weights for policy 0, policy_version 8320 (0.0011) +[2023-10-08 12:06:25,235][102898] Updated weights for policy 1, policy_version 8290 (0.0009) +[2023-10-08 12:06:25,593][102898] Updated weights for policy 1, policy_version 8300 (0.0009) +[2023-10-08 12:06:25,960][102898] Updated weights for policy 1, policy_version 8310 (0.0011) +[2023-10-08 12:06:26,327][102898] Updated weights for policy 1, policy_version 8320 (0.0009) +[2023-10-08 12:06:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 17039360. Throughput: 0: 1789.3, 1: 1808.4. Samples: 4264036. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:06:26,876][101941] Avg episode reward: [(0, '5.050'), (1, '5.000')] +[2023-10-08 12:06:28,795][102897] Updated weights for policy 0, policy_version 8330 (0.0008) +[2023-10-08 12:06:29,174][102897] Updated weights for policy 0, policy_version 8340 (0.0009) +[2023-10-08 12:06:29,549][102897] Updated weights for policy 0, policy_version 8350 (0.0008) +[2023-10-08 12:06:29,982][102898] Updated weights for policy 1, policy_version 8330 (0.0010) +[2023-10-08 12:06:30,341][102898] Updated weights for policy 1, policy_version 8340 (0.0009) +[2023-10-08 12:06:30,708][102898] Updated weights for policy 1, policy_version 8350 (0.0007) +[2023-10-08 12:06:31,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 17104896. Throughput: 0: 1779.6, 1: 1795.8. Samples: 4285302. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:06:31,875][101941] Avg episode reward: [(0, '5.240'), (1, '5.130')] +[2023-10-08 12:06:33,447][102897] Updated weights for policy 0, policy_version 8360 (0.0007) +[2023-10-08 12:06:33,825][102897] Updated weights for policy 0, policy_version 8370 (0.0009) +[2023-10-08 12:06:34,204][102897] Updated weights for policy 0, policy_version 8380 (0.0008) +[2023-10-08 12:06:34,551][102898] Updated weights for policy 1, policy_version 8360 (0.0010) +[2023-10-08 12:06:34,915][102898] Updated weights for policy 1, policy_version 8370 (0.0010) +[2023-10-08 12:06:35,281][102898] Updated weights for policy 1, policy_version 8380 (0.0011) +[2023-10-08 12:06:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 17170432. Throughput: 0: 1782.3, 1: 1805.2. Samples: 4295972. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 12:06:36,876][101941] Avg episode reward: [(0, '5.710'), (1, '4.650')] +[2023-10-08 12:06:37,986][102897] Updated weights for policy 0, policy_version 8390 (0.0007) +[2023-10-08 12:06:38,363][102897] Updated weights for policy 0, policy_version 8400 (0.0009) +[2023-10-08 12:06:38,726][102897] Updated weights for policy 0, policy_version 8410 (0.0008) +[2023-10-08 12:06:39,112][102898] Updated weights for policy 1, policy_version 8390 (0.0008) +[2023-10-08 12:06:39,477][102898] Updated weights for policy 1, policy_version 8400 (0.0007) +[2023-10-08 12:06:39,843][102898] Updated weights for policy 1, policy_version 8410 (0.0007) +[2023-10-08 12:06:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 17235968. Throughput: 0: 1789.0, 1: 1789.1. Samples: 4317510. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 12:06:41,876][101941] Avg episode reward: [(0, '6.310'), (1, '4.950')] +[2023-10-08 12:06:42,418][102897] Updated weights for policy 0, policy_version 8420 (0.0008) +[2023-10-08 12:06:42,786][102897] Updated weights for policy 0, policy_version 8430 (0.0007) +[2023-10-08 12:06:43,145][102897] Updated weights for policy 0, policy_version 8440 (0.0009) +[2023-10-08 12:06:43,687][102898] Updated weights for policy 1, policy_version 8420 (0.0008) +[2023-10-08 12:06:44,083][102898] Updated weights for policy 1, policy_version 8430 (0.0010) +[2023-10-08 12:06:44,458][102898] Updated weights for policy 1, policy_version 8440 (0.0010) +[2023-10-08 12:06:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 17301504. Throughput: 0: 1792.1, 1: 1787.7. Samples: 4339506. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 12:06:46,876][101941] Avg episode reward: [(0, '5.870'), (1, '5.470')] +[2023-10-08 12:06:47,043][102897] Updated weights for policy 0, policy_version 8450 (0.0008) +[2023-10-08 12:06:47,412][102897] Updated weights for policy 0, policy_version 8460 (0.0008) +[2023-10-08 12:06:47,784][102897] Updated weights for policy 0, policy_version 8470 (0.0010) +[2023-10-08 12:06:48,158][102897] Updated weights for policy 0, policy_version 8480 (0.0009) +[2023-10-08 12:06:48,168][102898] Updated weights for policy 1, policy_version 8450 (0.0009) +[2023-10-08 12:06:48,536][102898] Updated weights for policy 1, policy_version 8460 (0.0009) +[2023-10-08 12:06:48,904][102898] Updated weights for policy 1, policy_version 8470 (0.0011) +[2023-10-08 12:06:49,266][102898] Updated weights for policy 1, policy_version 8480 (0.0010) +[2023-10-08 12:06:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 17367040. Throughput: 0: 1782.6, 1: 1791.8. Samples: 4349438. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 12:06:51,876][101941] Avg episode reward: [(0, '6.240'), (1, '5.580')] +[2023-10-08 12:06:51,919][102897] Updated weights for policy 0, policy_version 8490 (0.0010) +[2023-10-08 12:06:52,297][102897] Updated weights for policy 0, policy_version 8500 (0.0008) +[2023-10-08 12:06:52,670][102897] Updated weights for policy 0, policy_version 8510 (0.0007) +[2023-10-08 12:06:53,121][102898] Updated weights for policy 1, policy_version 8490 (0.0007) +[2023-10-08 12:06:53,489][102898] Updated weights for policy 1, policy_version 8500 (0.0008) +[2023-10-08 12:06:53,863][102898] Updated weights for policy 1, policy_version 8510 (0.0007) +[2023-10-08 12:06:56,414][102897] Updated weights for policy 0, policy_version 8520 (0.0009) +[2023-10-08 12:06:56,785][102897] Updated weights for policy 0, policy_version 8530 (0.0009) +[2023-10-08 12:06:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 17432576. Throughput: 0: 1791.2, 1: 1790.5. Samples: 4371964. Policy #0 lag: (min: 26.0, avg: 27.2, max: 49.0) +[2023-10-08 12:06:56,876][101941] Avg episode reward: [(0, '6.260'), (1, '5.280')] +[2023-10-08 12:06:57,165][102897] Updated weights for policy 0, policy_version 8540 (0.0010) +[2023-10-08 12:06:57,507][102898] Updated weights for policy 1, policy_version 8520 (0.0010) +[2023-10-08 12:06:57,881][102898] Updated weights for policy 1, policy_version 8530 (0.0008) +[2023-10-08 12:06:58,245][102898] Updated weights for policy 1, policy_version 8540 (0.0007) +[2023-10-08 12:07:00,856][102897] Updated weights for policy 0, policy_version 8550 (0.0008) +[2023-10-08 12:07:01,219][102897] Updated weights for policy 0, policy_version 8560 (0.0009) +[2023-10-08 12:07:01,598][102897] Updated weights for policy 0, policy_version 8570 (0.0007) +[2023-10-08 12:07:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 17530880. Throughput: 0: 1788.6, 1: 1800.3. Samples: 4393248. Policy #0 lag: (min: 31.0, avg: 32.0, max: 48.0) +[2023-10-08 12:07:01,875][101941] Avg episode reward: [(0, '6.510'), (1, '5.140')] +[2023-10-08 12:07:02,082][102898] Updated weights for policy 1, policy_version 8550 (0.0007) +[2023-10-08 12:07:02,449][102898] Updated weights for policy 1, policy_version 8560 (0.0007) +[2023-10-08 12:07:02,816][102898] Updated weights for policy 1, policy_version 8570 (0.0009) +[2023-10-08 12:07:05,306][102897] Updated weights for policy 0, policy_version 8580 (0.0008) +[2023-10-08 12:07:05,680][102897] Updated weights for policy 0, policy_version 8590 (0.0007) +[2023-10-08 12:07:06,054][102897] Updated weights for policy 0, policy_version 8600 (0.0010) +[2023-10-08 12:07:06,509][102898] Updated weights for policy 1, policy_version 8580 (0.0007) +[2023-10-08 12:07:06,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 17596416. Throughput: 0: 1782.8, 1: 1792.5. Samples: 4404030. Policy #0 lag: (min: 31.0, avg: 32.0, max: 48.0) +[2023-10-08 12:07:06,875][101941] Avg episode reward: [(0, '6.570'), (1, '5.600')] +[2023-10-08 12:07:06,882][102898] Updated weights for policy 1, policy_version 8590 (0.0007) +[2023-10-08 12:07:07,250][102898] Updated weights for policy 1, policy_version 8600 (0.0008) +[2023-10-08 12:07:09,816][102897] Updated weights for policy 0, policy_version 8610 (0.0008) +[2023-10-08 12:07:10,194][102897] Updated weights for policy 0, policy_version 8620 (0.0008) +[2023-10-08 12:07:10,560][102897] Updated weights for policy 0, policy_version 8630 (0.0007) +[2023-10-08 12:07:10,930][102897] Updated weights for policy 0, policy_version 8640 (0.0008) +[2023-10-08 12:07:11,010][102898] Updated weights for policy 1, policy_version 8610 (0.0008) +[2023-10-08 12:07:11,373][102898] Updated weights for policy 1, policy_version 8620 (0.0009) +[2023-10-08 12:07:11,740][102898] Updated weights for policy 1, policy_version 8630 (0.0010) +[2023-10-08 12:07:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 17661952. Throughput: 0: 1797.7, 1: 1801.0. Samples: 4425980. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:07:11,876][101941] Avg episode reward: [(0, '6.540'), (1, '5.350')] +[2023-10-08 12:07:12,104][102898] Updated weights for policy 1, policy_version 8640 (0.0010) +[2023-10-08 12:07:14,609][102897] Updated weights for policy 0, policy_version 8650 (0.0009) +[2023-10-08 12:07:14,991][102897] Updated weights for policy 0, policy_version 8660 (0.0010) +[2023-10-08 12:07:15,352][102897] Updated weights for policy 0, policy_version 8670 (0.0008) +[2023-10-08 12:07:15,838][102898] Updated weights for policy 1, policy_version 8650 (0.0007) +[2023-10-08 12:07:16,209][102898] Updated weights for policy 1, policy_version 8660 (0.0007) +[2023-10-08 12:07:16,571][102898] Updated weights for policy 1, policy_version 8670 (0.0009) +[2023-10-08 12:07:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 17760256. Throughput: 0: 1789.3, 1: 1797.5. Samples: 4446708. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:07:16,875][101941] Avg episode reward: [(0, '5.930'), (1, '5.200')] +[2023-10-08 12:07:19,286][102897] Updated weights for policy 0, policy_version 8680 (0.0008) +[2023-10-08 12:07:19,673][102897] Updated weights for policy 0, policy_version 8690 (0.0008) +[2023-10-08 12:07:20,047][102897] Updated weights for policy 0, policy_version 8700 (0.0007) +[2023-10-08 12:07:20,394][102898] Updated weights for policy 1, policy_version 8680 (0.0008) +[2023-10-08 12:07:20,763][102898] Updated weights for policy 1, policy_version 8690 (0.0009) +[2023-10-08 12:07:21,124][102898] Updated weights for policy 1, policy_version 8700 (0.0008) +[2023-10-08 12:07:21,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 17825792. Throughput: 0: 1808.6, 1: 1800.6. Samples: 4458386. Policy #0 lag: (min: 15.0, avg: 23.1, max: 47.0) +[2023-10-08 12:07:21,876][101941] Avg episode reward: [(0, '5.340'), (1, '5.820')] +[2023-10-08 12:07:23,651][102897] Updated weights for policy 0, policy_version 8710 (0.0008) +[2023-10-08 12:07:24,033][102897] Updated weights for policy 0, policy_version 8720 (0.0009) +[2023-10-08 12:07:24,413][102897] Updated weights for policy 0, policy_version 8730 (0.0008) +[2023-10-08 12:07:24,759][102898] Updated weights for policy 1, policy_version 8710 (0.0010) +[2023-10-08 12:07:25,130][102898] Updated weights for policy 1, policy_version 8720 (0.0008) +[2023-10-08 12:07:25,490][102898] Updated weights for policy 1, policy_version 8730 (0.0008) +[2023-10-08 12:07:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 17891328. Throughput: 0: 1781.2, 1: 1803.5. Samples: 4478822. Policy #0 lag: (min: 15.0, avg: 23.1, max: 47.0) +[2023-10-08 12:07:26,875][101941] Avg episode reward: [(0, '5.440'), (1, '5.680')] +[2023-10-08 12:07:28,250][102897] Updated weights for policy 0, policy_version 8740 (0.0007) +[2023-10-08 12:07:28,627][102897] Updated weights for policy 0, policy_version 8750 (0.0007) +[2023-10-08 12:07:28,999][102897] Updated weights for policy 0, policy_version 8760 (0.0009) +[2023-10-08 12:07:29,232][102898] Updated weights for policy 1, policy_version 8740 (0.0008) +[2023-10-08 12:07:29,622][102898] Updated weights for policy 1, policy_version 8750 (0.0008) +[2023-10-08 12:07:29,992][102898] Updated weights for policy 1, policy_version 8760 (0.0008) +[2023-10-08 12:07:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 17956864. Throughput: 0: 1787.2, 1: 1795.4. Samples: 4500722. Policy #0 lag: (min: 9.0, avg: 26.7, max: 41.0) +[2023-10-08 12:07:31,876][101941] Avg episode reward: [(0, '5.800'), (1, '5.680')] +[2023-10-08 12:07:32,658][102897] Updated weights for policy 0, policy_version 8770 (0.0008) +[2023-10-08 12:07:33,033][102897] Updated weights for policy 0, policy_version 8780 (0.0007) +[2023-10-08 12:07:33,401][102897] Updated weights for policy 0, policy_version 8790 (0.0007) +[2023-10-08 12:07:33,779][102897] Updated weights for policy 0, policy_version 8800 (0.0008) +[2023-10-08 12:07:33,892][102898] Updated weights for policy 1, policy_version 8770 (0.0008) +[2023-10-08 12:07:34,258][102898] Updated weights for policy 1, policy_version 8780 (0.0009) +[2023-10-08 12:07:34,623][102898] Updated weights for policy 1, policy_version 8790 (0.0009) +[2023-10-08 12:07:34,995][102898] Updated weights for policy 1, policy_version 8800 (0.0009) +[2023-10-08 12:07:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 18022400. Throughput: 0: 1787.2, 1: 1807.5. Samples: 4511196. Policy #0 lag: (min: 9.0, avg: 26.7, max: 41.0) +[2023-10-08 12:07:36,875][101941] Avg episode reward: [(0, '5.750'), (1, '5.580')] +[2023-10-08 12:07:37,534][102897] Updated weights for policy 0, policy_version 8810 (0.0011) +[2023-10-08 12:07:37,907][102897] Updated weights for policy 0, policy_version 8820 (0.0008) +[2023-10-08 12:07:38,291][102897] Updated weights for policy 0, policy_version 8830 (0.0009) +[2023-10-08 12:07:38,638][102898] Updated weights for policy 1, policy_version 8810 (0.0007) +[2023-10-08 12:07:39,010][102898] Updated weights for policy 1, policy_version 8820 (0.0008) +[2023-10-08 12:07:39,371][102898] Updated weights for policy 1, policy_version 8830 (0.0007) +[2023-10-08 12:07:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 18087936. Throughput: 0: 1789.0, 1: 1790.2. Samples: 4533028. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 12:07:41,876][101941] Avg episode reward: [(0, '5.660'), (1, '5.190')] +[2023-10-08 12:07:42,096][102897] Updated weights for policy 0, policy_version 8840 (0.0008) +[2023-10-08 12:07:42,462][102897] Updated weights for policy 0, policy_version 8850 (0.0009) +[2023-10-08 12:07:42,837][102897] Updated weights for policy 0, policy_version 8860 (0.0009) +[2023-10-08 12:07:43,137][102898] Updated weights for policy 1, policy_version 8840 (0.0007) +[2023-10-08 12:07:43,510][102898] Updated weights for policy 1, policy_version 8850 (0.0011) +[2023-10-08 12:07:43,873][102898] Updated weights for policy 1, policy_version 8860 (0.0007) +[2023-10-08 12:07:46,736][102897] Updated weights for policy 0, policy_version 8870 (0.0007) +[2023-10-08 12:07:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 18153472. Throughput: 0: 1807.7, 1: 1792.5. Samples: 4555258. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 12:07:46,875][101941] Avg episode reward: [(0, '5.750'), (1, '5.280')] +[2023-10-08 12:07:47,106][102897] Updated weights for policy 0, policy_version 8880 (0.0008) +[2023-10-08 12:07:47,474][102897] Updated weights for policy 0, policy_version 8890 (0.0008) +[2023-10-08 12:07:47,583][102898] Updated weights for policy 1, policy_version 8870 (0.0007) +[2023-10-08 12:07:47,956][102898] Updated weights for policy 1, policy_version 8880 (0.0011) +[2023-10-08 12:07:48,324][102898] Updated weights for policy 1, policy_version 8890 (0.0010) +[2023-10-08 12:07:51,148][102897] Updated weights for policy 0, policy_version 8900 (0.0008) +[2023-10-08 12:07:51,520][102897] Updated weights for policy 0, policy_version 8910 (0.0007) +[2023-10-08 12:07:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 18219008. Throughput: 0: 1786.6, 1: 1790.3. Samples: 4564990. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 12:07:51,876][101941] Avg episode reward: [(0, '5.980'), (1, '5.220')] +[2023-10-08 12:07:51,907][102897] Updated weights for policy 0, policy_version 8920 (0.0010) +[2023-10-08 12:07:52,098][102898] Updated weights for policy 1, policy_version 8900 (0.0008) +[2023-10-08 12:07:52,469][102898] Updated weights for policy 1, policy_version 8910 (0.0008) +[2023-10-08 12:07:52,838][102898] Updated weights for policy 1, policy_version 8920 (0.0008) +[2023-10-08 12:07:55,580][102897] Updated weights for policy 0, policy_version 8930 (0.0007) +[2023-10-08 12:07:55,961][102897] Updated weights for policy 0, policy_version 8940 (0.0007) +[2023-10-08 12:07:56,328][102897] Updated weights for policy 0, policy_version 8950 (0.0009) +[2023-10-08 12:07:56,659][102898] Updated weights for policy 1, policy_version 8930 (0.0008) +[2023-10-08 12:07:56,692][102897] Updated weights for policy 0, policy_version 8960 (0.0009) +[2023-10-08 12:07:56,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 18317312. Throughput: 0: 1798.8, 1: 1782.5. Samples: 4587138. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:07:56,877][101941] Avg episode reward: [(0, '6.020'), (1, '5.700')] +[2023-10-08 12:07:57,024][102898] Updated weights for policy 1, policy_version 8940 (0.0007) +[2023-10-08 12:07:57,393][102898] Updated weights for policy 1, policy_version 8950 (0.0007) +[2023-10-08 12:07:57,759][102898] Updated weights for policy 1, policy_version 8960 (0.0008) +[2023-10-08 12:08:00,203][102897] Updated weights for policy 0, policy_version 8970 (0.0007) +[2023-10-08 12:08:00,586][102897] Updated weights for policy 0, policy_version 8980 (0.0010) +[2023-10-08 12:08:00,953][102897] Updated weights for policy 0, policy_version 8990 (0.0010) +[2023-10-08 12:08:01,623][102898] Updated weights for policy 1, policy_version 8970 (0.0009) +[2023-10-08 12:08:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 18382848. Throughput: 0: 1786.6, 1: 1795.9. Samples: 4607918. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:08:01,876][101941] Avg episode reward: [(0, '5.800'), (1, '5.570')] +[2023-10-08 12:08:01,987][102898] Updated weights for policy 1, policy_version 8980 (0.0007) +[2023-10-08 12:08:02,350][102898] Updated weights for policy 1, policy_version 8990 (0.0007) +[2023-10-08 12:08:04,690][102897] Updated weights for policy 0, policy_version 9000 (0.0008) +[2023-10-08 12:08:05,069][102897] Updated weights for policy 0, policy_version 9010 (0.0008) +[2023-10-08 12:08:05,444][102897] Updated weights for policy 0, policy_version 9020 (0.0009) +[2023-10-08 12:08:06,078][102898] Updated weights for policy 1, policy_version 9000 (0.0007) +[2023-10-08 12:08:06,445][102898] Updated weights for policy 1, policy_version 9010 (0.0008) +[2023-10-08 12:08:06,808][102898] Updated weights for policy 1, policy_version 9020 (0.0008) +[2023-10-08 12:08:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 18448384. Throughput: 0: 1801.6, 1: 1779.2. Samples: 4619518. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:08:06,875][101941] Avg episode reward: [(0, '5.880'), (1, '5.560')] +[2023-10-08 12:08:09,168][102897] Updated weights for policy 0, policy_version 9030 (0.0009) +[2023-10-08 12:08:09,544][102897] Updated weights for policy 0, policy_version 9040 (0.0009) +[2023-10-08 12:08:09,913][102897] Updated weights for policy 0, policy_version 9050 (0.0010) +[2023-10-08 12:08:10,468][102898] Updated weights for policy 1, policy_version 9030 (0.0009) +[2023-10-08 12:08:10,841][102898] Updated weights for policy 1, policy_version 9040 (0.0009) +[2023-10-08 12:08:11,211][102898] Updated weights for policy 1, policy_version 9050 (0.0007) +[2023-10-08 12:08:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 18546688. Throughput: 0: 1787.6, 1: 1796.9. Samples: 4640126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:08:11,875][101941] Avg episode reward: [(0, '5.870'), (1, '5.700')] +[2023-10-08 12:08:13,774][102897] Updated weights for policy 0, policy_version 9060 (0.0010) +[2023-10-08 12:08:14,152][102897] Updated weights for policy 0, policy_version 9070 (0.0007) +[2023-10-08 12:08:14,519][102897] Updated weights for policy 0, policy_version 9080 (0.0007) +[2023-10-08 12:08:15,089][102898] Updated weights for policy 1, policy_version 9060 (0.0008) +[2023-10-08 12:08:15,487][102898] Updated weights for policy 1, policy_version 9070 (0.0010) +[2023-10-08 12:08:15,844][102898] Updated weights for policy 1, policy_version 9080 (0.0009) +[2023-10-08 12:08:16,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 18612224. Throughput: 0: 1782.3, 1: 1781.2. Samples: 4661080. Policy #0 lag: (min: 26.0, avg: 33.3, max: 58.0) +[2023-10-08 12:08:16,876][101941] Avg episode reward: [(0, '5.610'), (1, '5.630')] +[2023-10-08 12:08:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000009088_9306112.pth... +[2023-10-08 12:08:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000009088_9306112.pth... +[2023-10-08 12:08:16,938][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000007424_7602176.pth +[2023-10-08 12:08:16,938][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000007392_7569408.pth +[2023-10-08 12:08:18,448][102897] Updated weights for policy 0, policy_version 9090 (0.0007) +[2023-10-08 12:08:18,820][102897] Updated weights for policy 0, policy_version 9100 (0.0009) +[2023-10-08 12:08:19,191][102897] Updated weights for policy 0, policy_version 9110 (0.0009) +[2023-10-08 12:08:19,527][102898] Updated weights for policy 1, policy_version 9090 (0.0007) +[2023-10-08 12:08:19,573][102897] Updated weights for policy 0, policy_version 9120 (0.0008) +[2023-10-08 12:08:19,898][102898] Updated weights for policy 1, policy_version 9100 (0.0007) +[2023-10-08 12:08:20,272][102898] Updated weights for policy 1, policy_version 9110 (0.0009) +[2023-10-08 12:08:20,641][102898] Updated weights for policy 1, policy_version 9120 (0.0009) +[2023-10-08 12:08:21,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 18677760. Throughput: 0: 1781.3, 1: 1801.6. Samples: 4672428. Policy #0 lag: (min: 26.0, avg: 33.3, max: 58.0) +[2023-10-08 12:08:21,876][101941] Avg episode reward: [(0, '6.010'), (1, '5.920')] +[2023-10-08 12:08:23,308][102897] Updated weights for policy 0, policy_version 9130 (0.0011) +[2023-10-08 12:08:23,671][102897] Updated weights for policy 0, policy_version 9140 (0.0007) +[2023-10-08 12:08:24,051][102897] Updated weights for policy 0, policy_version 9150 (0.0007) +[2023-10-08 12:08:24,357][102898] Updated weights for policy 1, policy_version 9130 (0.0008) +[2023-10-08 12:08:24,721][102898] Updated weights for policy 1, policy_version 9140 (0.0008) +[2023-10-08 12:08:25,089][102898] Updated weights for policy 1, policy_version 9150 (0.0011) +[2023-10-08 12:08:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 18743296. Throughput: 0: 1770.1, 1: 1785.2. Samples: 4693020. Policy #0 lag: (min: 31.0, avg: 31.3, max: 43.0) +[2023-10-08 12:08:26,875][101941] Avg episode reward: [(0, '5.910'), (1, '6.070')] +[2023-10-08 12:08:27,703][102897] Updated weights for policy 0, policy_version 9160 (0.0009) +[2023-10-08 12:08:28,073][102897] Updated weights for policy 0, policy_version 9170 (0.0008) +[2023-10-08 12:08:28,450][102897] Updated weights for policy 0, policy_version 9180 (0.0007) +[2023-10-08 12:08:28,872][102898] Updated weights for policy 1, policy_version 9160 (0.0009) +[2023-10-08 12:08:29,237][102898] Updated weights for policy 1, policy_version 9170 (0.0010) +[2023-10-08 12:08:29,611][102898] Updated weights for policy 1, policy_version 9180 (0.0009) +[2023-10-08 12:08:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 18808832. Throughput: 0: 1777.5, 1: 1783.1. Samples: 4715482. Policy #0 lag: (min: 31.0, avg: 31.3, max: 43.0) +[2023-10-08 12:08:31,876][101941] Avg episode reward: [(0, '5.800'), (1, '5.710')] +[2023-10-08 12:08:32,245][102897] Updated weights for policy 0, policy_version 9190 (0.0008) +[2023-10-08 12:08:32,620][102897] Updated weights for policy 0, policy_version 9200 (0.0007) +[2023-10-08 12:08:32,989][102897] Updated weights for policy 0, policy_version 9210 (0.0008) +[2023-10-08 12:08:33,401][102898] Updated weights for policy 1, policy_version 9190 (0.0010) +[2023-10-08 12:08:33,759][102898] Updated weights for policy 1, policy_version 9200 (0.0010) +[2023-10-08 12:08:34,126][102898] Updated weights for policy 1, policy_version 9210 (0.0010) +[2023-10-08 12:08:36,675][102897] Updated weights for policy 0, policy_version 9220 (0.0007) +[2023-10-08 12:08:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 18874368. Throughput: 0: 1778.1, 1: 1784.2. Samples: 4725292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:08:36,876][101941] Avg episode reward: [(0, '5.420'), (1, '5.180')] +[2023-10-08 12:08:37,051][102897] Updated weights for policy 0, policy_version 9230 (0.0007) +[2023-10-08 12:08:37,427][102897] Updated weights for policy 0, policy_version 9240 (0.0007) +[2023-10-08 12:08:37,922][102898] Updated weights for policy 1, policy_version 9220 (0.0009) +[2023-10-08 12:08:38,296][102898] Updated weights for policy 1, policy_version 9230 (0.0007) +[2023-10-08 12:08:38,669][102898] Updated weights for policy 1, policy_version 9240 (0.0008) +[2023-10-08 12:08:41,437][102897] Updated weights for policy 0, policy_version 9250 (0.0007) +[2023-10-08 12:08:41,805][102897] Updated weights for policy 0, policy_version 9260 (0.0010) +[2023-10-08 12:08:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 18939904. Throughput: 0: 1779.0, 1: 1791.6. Samples: 4747818. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:08:41,876][101941] Avg episode reward: [(0, '5.320'), (1, '5.510')] +[2023-10-08 12:08:42,177][102897] Updated weights for policy 0, policy_version 9270 (0.0009) +[2023-10-08 12:08:42,390][102898] Updated weights for policy 1, policy_version 9250 (0.0007) +[2023-10-08 12:08:42,546][102897] Updated weights for policy 0, policy_version 9280 (0.0007) +[2023-10-08 12:08:42,754][102898] Updated weights for policy 1, policy_version 9260 (0.0009) +[2023-10-08 12:08:43,136][102898] Updated weights for policy 1, policy_version 9270 (0.0008) +[2023-10-08 12:08:43,501][102898] Updated weights for policy 1, policy_version 9280 (0.0010) +[2023-10-08 12:08:46,381][102897] Updated weights for policy 0, policy_version 9290 (0.0009) +[2023-10-08 12:08:46,745][102897] Updated weights for policy 0, policy_version 9300 (0.0008) +[2023-10-08 12:08:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 19005440. Throughput: 0: 1792.7, 1: 1799.9. Samples: 4769584. Policy #0 lag: (min: 31.0, avg: 31.4, max: 44.0) +[2023-10-08 12:08:46,875][101941] Avg episode reward: [(0, '5.510'), (1, '5.510')] +[2023-10-08 12:08:47,123][102897] Updated weights for policy 0, policy_version 9310 (0.0007) +[2023-10-08 12:08:47,187][102898] Updated weights for policy 1, policy_version 9290 (0.0007) +[2023-10-08 12:08:47,564][102898] Updated weights for policy 1, policy_version 9300 (0.0011) +[2023-10-08 12:08:47,934][102898] Updated weights for policy 1, policy_version 9310 (0.0009) +[2023-10-08 12:08:50,873][102897] Updated weights for policy 0, policy_version 9320 (0.0008) +[2023-10-08 12:08:51,251][102897] Updated weights for policy 0, policy_version 9330 (0.0007) +[2023-10-08 12:08:51,628][102897] Updated weights for policy 0, policy_version 9340 (0.0007) +[2023-10-08 12:08:51,806][102898] Updated weights for policy 1, policy_version 9320 (0.0008) +[2023-10-08 12:08:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 19103744. Throughput: 0: 1769.7, 1: 1786.3. Samples: 4779536. Policy #0 lag: (min: 31.0, avg: 37.0, max: 63.0) +[2023-10-08 12:08:51,876][101941] Avg episode reward: [(0, '5.890'), (1, '5.570')] +[2023-10-08 12:08:52,170][102898] Updated weights for policy 1, policy_version 9330 (0.0009) +[2023-10-08 12:08:52,545][102898] Updated weights for policy 1, policy_version 9340 (0.0009) +[2023-10-08 12:08:55,527][102897] Updated weights for policy 0, policy_version 9350 (0.0010) +[2023-10-08 12:08:55,907][102897] Updated weights for policy 0, policy_version 9360 (0.0008) +[2023-10-08 12:08:56,176][102898] Updated weights for policy 1, policy_version 9350 (0.0008) +[2023-10-08 12:08:56,278][102897] Updated weights for policy 0, policy_version 9370 (0.0008) +[2023-10-08 12:08:56,539][102898] Updated weights for policy 1, policy_version 9360 (0.0011) +[2023-10-08 12:08:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 19169280. Throughput: 0: 1795.8, 1: 1793.4. Samples: 4801640. Policy #0 lag: (min: 31.0, avg: 37.0, max: 63.0) +[2023-10-08 12:08:56,875][101941] Avg episode reward: [(0, '6.070'), (1, '5.550')] +[2023-10-08 12:08:56,909][102898] Updated weights for policy 1, policy_version 9370 (0.0010) +[2023-10-08 12:08:59,992][102897] Updated weights for policy 0, policy_version 9380 (0.0008) +[2023-10-08 12:09:00,369][102897] Updated weights for policy 0, policy_version 9390 (0.0007) +[2023-10-08 12:09:00,654][102898] Updated weights for policy 1, policy_version 9380 (0.0008) +[2023-10-08 12:09:00,738][102897] Updated weights for policy 0, policy_version 9400 (0.0007) +[2023-10-08 12:09:01,037][102898] Updated weights for policy 1, policy_version 9390 (0.0007) +[2023-10-08 12:09:01,405][102898] Updated weights for policy 1, policy_version 9400 (0.0007) +[2023-10-08 12:09:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 19267584. Throughput: 0: 1772.1, 1: 1796.1. Samples: 4821648. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:09:01,876][101941] Avg episode reward: [(0, '6.210'), (1, '5.870')] +[2023-10-08 12:09:04,459][102897] Updated weights for policy 0, policy_version 9410 (0.0008) +[2023-10-08 12:09:04,830][102897] Updated weights for policy 0, policy_version 9420 (0.0007) +[2023-10-08 12:09:05,194][102897] Updated weights for policy 0, policy_version 9430 (0.0007) +[2023-10-08 12:09:05,199][102898] Updated weights for policy 1, policy_version 9410 (0.0008) +[2023-10-08 12:09:05,563][102897] Updated weights for policy 0, policy_version 9440 (0.0009) +[2023-10-08 12:09:05,568][102898] Updated weights for policy 1, policy_version 9420 (0.0009) +[2023-10-08 12:09:05,925][102898] Updated weights for policy 1, policy_version 9430 (0.0010) +[2023-10-08 12:09:06,293][102898] Updated weights for policy 1, policy_version 9440 (0.0010) +[2023-10-08 12:09:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 19333120. Throughput: 0: 1807.2, 1: 1783.8. Samples: 4834020. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:09:06,876][101941] Avg episode reward: [(0, '6.480'), (1, '5.850')] +[2023-10-08 12:09:09,248][102897] Updated weights for policy 0, policy_version 9450 (0.0010) +[2023-10-08 12:09:09,619][102897] Updated weights for policy 0, policy_version 9460 (0.0010) +[2023-10-08 12:09:09,996][102897] Updated weights for policy 0, policy_version 9470 (0.0009) +[2023-10-08 12:09:10,107][102898] Updated weights for policy 1, policy_version 9450 (0.0007) +[2023-10-08 12:09:10,472][102898] Updated weights for policy 1, policy_version 9460 (0.0008) +[2023-10-08 12:09:10,844][102898] Updated weights for policy 1, policy_version 9470 (0.0008) +[2023-10-08 12:09:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14440.2). Total num frames: 19398656. Throughput: 0: 1781.4, 1: 1801.6. Samples: 4854258. Policy #0 lag: (min: 31.0, avg: 31.6, max: 48.0) +[2023-10-08 12:09:11,875][101941] Avg episode reward: [(0, '6.100'), (1, '5.590')] +[2023-10-08 12:09:13,821][102897] Updated weights for policy 0, policy_version 9480 (0.0010) +[2023-10-08 12:09:14,192][102897] Updated weights for policy 0, policy_version 9490 (0.0007) +[2023-10-08 12:09:14,565][102897] Updated weights for policy 0, policy_version 9500 (0.0007) +[2023-10-08 12:09:14,676][102898] Updated weights for policy 1, policy_version 9480 (0.0009) +[2023-10-08 12:09:15,044][102898] Updated weights for policy 1, policy_version 9490 (0.0009) +[2023-10-08 12:09:15,405][102898] Updated weights for policy 1, policy_version 9500 (0.0008) +[2023-10-08 12:09:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 19464192. Throughput: 0: 1783.7, 1: 1784.8. Samples: 4876066. Policy #0 lag: (min: 31.0, avg: 31.6, max: 48.0) +[2023-10-08 12:09:16,876][101941] Avg episode reward: [(0, '5.970'), (1, '5.480')] +[2023-10-08 12:09:18,199][102897] Updated weights for policy 0, policy_version 9510 (0.0008) +[2023-10-08 12:09:18,568][102897] Updated weights for policy 0, policy_version 9520 (0.0009) +[2023-10-08 12:09:18,942][102897] Updated weights for policy 0, policy_version 9530 (0.0008) +[2023-10-08 12:09:19,159][102898] Updated weights for policy 1, policy_version 9510 (0.0010) +[2023-10-08 12:09:19,523][102898] Updated weights for policy 1, policy_version 9520 (0.0007) +[2023-10-08 12:09:19,883][102898] Updated weights for policy 1, policy_version 9530 (0.0010) +[2023-10-08 12:09:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 19529728. Throughput: 0: 1780.6, 1: 1804.9. Samples: 4886640. Policy #0 lag: (min: 9.0, avg: 14.8, max: 41.0) +[2023-10-08 12:09:21,876][101941] Avg episode reward: [(0, '6.320'), (1, '5.520')] +[2023-10-08 12:09:22,648][102897] Updated weights for policy 0, policy_version 9540 (0.0009) +[2023-10-08 12:09:23,020][102897] Updated weights for policy 0, policy_version 9550 (0.0007) +[2023-10-08 12:09:23,392][102897] Updated weights for policy 0, policy_version 9560 (0.0007) +[2023-10-08 12:09:23,730][102898] Updated weights for policy 1, policy_version 9540 (0.0007) +[2023-10-08 12:09:24,106][102898] Updated weights for policy 1, policy_version 9550 (0.0009) +[2023-10-08 12:09:24,473][102898] Updated weights for policy 1, policy_version 9560 (0.0009) +[2023-10-08 12:09:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 19595264. Throughput: 0: 1785.9, 1: 1779.0. Samples: 4908238. Policy #0 lag: (min: 9.0, avg: 14.8, max: 41.0) +[2023-10-08 12:09:26,876][101941] Avg episode reward: [(0, '5.950'), (1, '5.270')] +[2023-10-08 12:09:27,218][102897] Updated weights for policy 0, policy_version 9570 (0.0007) +[2023-10-08 12:09:27,597][102897] Updated weights for policy 0, policy_version 9580 (0.0007) +[2023-10-08 12:09:27,981][102897] Updated weights for policy 0, policy_version 9590 (0.0008) +[2023-10-08 12:09:28,346][102897] Updated weights for policy 0, policy_version 9600 (0.0007) +[2023-10-08 12:09:28,376][102898] Updated weights for policy 1, policy_version 9570 (0.0008) +[2023-10-08 12:09:28,743][102898] Updated weights for policy 1, policy_version 9580 (0.0007) +[2023-10-08 12:09:29,113][102898] Updated weights for policy 1, policy_version 9590 (0.0009) +[2023-10-08 12:09:29,479][102898] Updated weights for policy 1, policy_version 9600 (0.0008) +[2023-10-08 12:09:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 19660800. Throughput: 0: 1798.7, 1: 1776.3. Samples: 4930460. Policy #0 lag: (min: 31.0, avg: 31.5, max: 45.0) +[2023-10-08 12:09:31,876][101941] Avg episode reward: [(0, '5.940'), (1, '5.040')] +[2023-10-08 12:09:32,147][102897] Updated weights for policy 0, policy_version 9610 (0.0007) +[2023-10-08 12:09:32,513][102897] Updated weights for policy 0, policy_version 9620 (0.0008) +[2023-10-08 12:09:32,891][102897] Updated weights for policy 0, policy_version 9630 (0.0008) +[2023-10-08 12:09:33,250][102898] Updated weights for policy 1, policy_version 9610 (0.0008) +[2023-10-08 12:09:33,627][102898] Updated weights for policy 1, policy_version 9620 (0.0007) +[2023-10-08 12:09:33,990][102898] Updated weights for policy 1, policy_version 9630 (0.0008) +[2023-10-08 12:09:36,605][102897] Updated weights for policy 0, policy_version 9640 (0.0009) +[2023-10-08 12:09:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 19726336. Throughput: 0: 1790.4, 1: 1782.1. Samples: 4940298. Policy #0 lag: (min: 31.0, avg: 31.5, max: 45.0) +[2023-10-08 12:09:36,876][101941] Avg episode reward: [(0, '5.570'), (1, '5.230')] +[2023-10-08 12:09:36,984][102897] Updated weights for policy 0, policy_version 9650 (0.0008) +[2023-10-08 12:09:37,357][102897] Updated weights for policy 0, policy_version 9660 (0.0008) +[2023-10-08 12:09:37,615][102898] Updated weights for policy 1, policy_version 9640 (0.0007) +[2023-10-08 12:09:37,981][102898] Updated weights for policy 1, policy_version 9650 (0.0009) +[2023-10-08 12:09:38,350][102898] Updated weights for policy 1, policy_version 9660 (0.0009) +[2023-10-08 12:09:41,145][102897] Updated weights for policy 0, policy_version 9670 (0.0007) +[2023-10-08 12:09:41,520][102897] Updated weights for policy 0, policy_version 9680 (0.0007) +[2023-10-08 12:09:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 19791872. Throughput: 0: 1791.3, 1: 1779.0. Samples: 4962306. Policy #0 lag: (min: 25.0, avg: 33.5, max: 57.0) +[2023-10-08 12:09:41,875][101941] Avg episode reward: [(0, '5.930'), (1, '5.090')] +[2023-10-08 12:09:41,891][102897] Updated weights for policy 0, policy_version 9690 (0.0008) +[2023-10-08 12:09:42,144][102898] Updated weights for policy 1, policy_version 9670 (0.0009) +[2023-10-08 12:09:42,495][102898] Updated weights for policy 1, policy_version 9680 (0.0010) +[2023-10-08 12:09:42,856][102898] Updated weights for policy 1, policy_version 9690 (0.0009) +[2023-10-08 12:09:45,668][102897] Updated weights for policy 0, policy_version 9700 (0.0009) +[2023-10-08 12:09:46,053][102897] Updated weights for policy 0, policy_version 9710 (0.0011) +[2023-10-08 12:09:46,426][102897] Updated weights for policy 0, policy_version 9720 (0.0008) +[2023-10-08 12:09:46,793][102898] Updated weights for policy 1, policy_version 9700 (0.0009) +[2023-10-08 12:09:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 19890176. Throughput: 0: 1795.2, 1: 1801.7. Samples: 4983508. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 12:09:46,876][101941] Avg episode reward: [(0, '5.800'), (1, '4.990')] +[2023-10-08 12:09:47,179][102898] Updated weights for policy 1, policy_version 9710 (0.0007) +[2023-10-08 12:09:47,545][102898] Updated weights for policy 1, policy_version 9720 (0.0007) +[2023-10-08 12:09:50,170][102897] Updated weights for policy 0, policy_version 9730 (0.0008) +[2023-10-08 12:09:50,541][102897] Updated weights for policy 0, policy_version 9740 (0.0008) +[2023-10-08 12:09:50,910][102897] Updated weights for policy 0, policy_version 9750 (0.0007) +[2023-10-08 12:09:51,212][102898] Updated weights for policy 1, policy_version 9730 (0.0008) +[2023-10-08 12:09:51,284][102897] Updated weights for policy 0, policy_version 9760 (0.0008) +[2023-10-08 12:09:51,580][102898] Updated weights for policy 1, policy_version 9740 (0.0009) +[2023-10-08 12:09:51,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 19955712. Throughput: 0: 1778.3, 1: 1776.7. Samples: 4994000. Policy #0 lag: (min: 31.0, avg: 31.0, max: 35.0) +[2023-10-08 12:09:51,876][101941] Avg episode reward: [(0, '5.730'), (1, '5.450')] +[2023-10-08 12:09:51,947][102898] Updated weights for policy 1, policy_version 9750 (0.0007) +[2023-10-08 12:09:52,311][102898] Updated weights for policy 1, policy_version 9760 (0.0007) +[2023-10-08 12:09:55,140][102897] Updated weights for policy 0, policy_version 9770 (0.0008) +[2023-10-08 12:09:55,521][102897] Updated weights for policy 0, policy_version 9780 (0.0008) +[2023-10-08 12:09:55,886][102897] Updated weights for policy 0, policy_version 9790 (0.0008) +[2023-10-08 12:09:56,128][102898] Updated weights for policy 1, policy_version 9770 (0.0007) +[2023-10-08 12:09:56,496][102898] Updated weights for policy 1, policy_version 9780 (0.0009) +[2023-10-08 12:09:56,867][102898] Updated weights for policy 1, policy_version 9790 (0.0009) +[2023-10-08 12:09:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 20021248. Throughput: 0: 1792.0, 1: 1791.5. Samples: 5015518. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 12:09:56,875][101941] Avg episode reward: [(0, '5.950'), (1, '5.590')] +[2023-10-08 12:09:59,671][102897] Updated weights for policy 0, policy_version 9800 (0.0007) +[2023-10-08 12:10:00,053][102897] Updated weights for policy 0, policy_version 9810 (0.0007) +[2023-10-08 12:10:00,430][102897] Updated weights for policy 0, policy_version 9820 (0.0008) +[2023-10-08 12:10:00,682][102898] Updated weights for policy 1, policy_version 9800 (0.0009) +[2023-10-08 12:10:01,052][102898] Updated weights for policy 1, policy_version 9810 (0.0009) +[2023-10-08 12:10:01,423][102898] Updated weights for policy 1, policy_version 9820 (0.0009) +[2023-10-08 12:10:01,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 20119552. Throughput: 0: 1770.5, 1: 1780.0. Samples: 5035834. Policy #0 lag: (min: 31.0, avg: 36.3, max: 63.0) +[2023-10-08 12:10:01,875][101941] Avg episode reward: [(0, '5.920'), (1, '6.050')] +[2023-10-08 12:10:04,090][102897] Updated weights for policy 0, policy_version 9830 (0.0007) +[2023-10-08 12:10:04,457][102897] Updated weights for policy 0, policy_version 9840 (0.0008) +[2023-10-08 12:10:04,839][102897] Updated weights for policy 0, policy_version 9850 (0.0007) +[2023-10-08 12:10:05,228][102898] Updated weights for policy 1, policy_version 9830 (0.0007) +[2023-10-08 12:10:05,591][102898] Updated weights for policy 1, policy_version 9840 (0.0009) +[2023-10-08 12:10:05,953][102898] Updated weights for policy 1, policy_version 9850 (0.0010) +[2023-10-08 12:10:06,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 20185088. Throughput: 0: 1793.8, 1: 1788.1. Samples: 5047826. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:10:06,876][101941] Avg episode reward: [(0, '6.120'), (1, '6.000')] +[2023-10-08 12:10:08,714][102897] Updated weights for policy 0, policy_version 9860 (0.0007) +[2023-10-08 12:10:09,086][102897] Updated weights for policy 0, policy_version 9870 (0.0009) +[2023-10-08 12:10:09,457][102897] Updated weights for policy 0, policy_version 9880 (0.0008) +[2023-10-08 12:10:09,848][102898] Updated weights for policy 1, policy_version 9860 (0.0009) +[2023-10-08 12:10:10,221][102898] Updated weights for policy 1, policy_version 9870 (0.0010) +[2023-10-08 12:10:10,584][102898] Updated weights for policy 1, policy_version 9880 (0.0009) +[2023-10-08 12:10:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 20250624. Throughput: 0: 1770.9, 1: 1785.0. Samples: 5068250. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:10:11,876][101941] Avg episode reward: [(0, '6.490'), (1, '5.650')] +[2023-10-08 12:10:13,302][102897] Updated weights for policy 0, policy_version 9890 (0.0008) +[2023-10-08 12:10:13,679][102897] Updated weights for policy 0, policy_version 9900 (0.0010) +[2023-10-08 12:10:14,050][102897] Updated weights for policy 0, policy_version 9910 (0.0010) +[2023-10-08 12:10:14,420][102898] Updated weights for policy 1, policy_version 9890 (0.0008) +[2023-10-08 12:10:14,425][102897] Updated weights for policy 0, policy_version 9920 (0.0008) +[2023-10-08 12:10:14,780][102898] Updated weights for policy 1, policy_version 9900 (0.0008) +[2023-10-08 12:10:15,142][102898] Updated weights for policy 1, policy_version 9910 (0.0008) +[2023-10-08 12:10:15,512][102898] Updated weights for policy 1, policy_version 9920 (0.0009) +[2023-10-08 12:10:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 20316160. Throughput: 0: 1770.6, 1: 1775.2. Samples: 5090020. Policy #0 lag: (min: 27.0, avg: 54.2, max: 56.0) +[2023-10-08 12:10:16,875][101941] Avg episode reward: [(0, '6.600'), (1, '5.470')] +[2023-10-08 12:10:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000009920_10158080.pth... +[2023-10-08 12:10:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000009920_10158080.pth... +[2023-10-08 12:10:16,917][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000008256_8454144.pth +[2023-10-08 12:10:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000008256_8454144.pth +[2023-10-08 12:10:18,162][102897] Updated weights for policy 0, policy_version 9930 (0.0010) +[2023-10-08 12:10:18,536][102897] Updated weights for policy 0, policy_version 9940 (0.0007) +[2023-10-08 12:10:18,909][102897] Updated weights for policy 0, policy_version 9950 (0.0008) +[2023-10-08 12:10:19,078][102898] Updated weights for policy 1, policy_version 9930 (0.0008) +[2023-10-08 12:10:19,447][102898] Updated weights for policy 1, policy_version 9940 (0.0008) +[2023-10-08 12:10:19,816][102898] Updated weights for policy 1, policy_version 9950 (0.0009) +[2023-10-08 12:10:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 20381696. Throughput: 0: 1768.1, 1: 1791.9. Samples: 5100498. Policy #0 lag: (min: 27.0, avg: 54.2, max: 56.0) +[2023-10-08 12:10:21,876][101941] Avg episode reward: [(0, '6.690'), (1, '5.400')] +[2023-10-08 12:10:22,736][102897] Updated weights for policy 0, policy_version 9960 (0.0009) +[2023-10-08 12:10:23,113][102897] Updated weights for policy 0, policy_version 9970 (0.0008) +[2023-10-08 12:10:23,474][102897] Updated weights for policy 0, policy_version 9980 (0.0011) +[2023-10-08 12:10:23,574][102898] Updated weights for policy 1, policy_version 9960 (0.0010) +[2023-10-08 12:10:23,943][102898] Updated weights for policy 1, policy_version 9970 (0.0009) +[2023-10-08 12:10:24,316][102898] Updated weights for policy 1, policy_version 9980 (0.0007) +[2023-10-08 12:10:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 20447232. Throughput: 0: 1773.9, 1: 1782.8. Samples: 5122362. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 12:10:26,877][101941] Avg episode reward: [(0, '6.310'), (1, '5.100')] +[2023-10-08 12:10:27,280][102897] Updated weights for policy 0, policy_version 9990 (0.0008) +[2023-10-08 12:10:27,665][102897] Updated weights for policy 0, policy_version 10000 (0.0008) +[2023-10-08 12:10:27,995][102898] Updated weights for policy 1, policy_version 9990 (0.0009) +[2023-10-08 12:10:28,036][102897] Updated weights for policy 0, policy_version 10010 (0.0008) +[2023-10-08 12:10:28,356][102898] Updated weights for policy 1, policy_version 10000 (0.0007) +[2023-10-08 12:10:28,731][102898] Updated weights for policy 1, policy_version 10010 (0.0008) +[2023-10-08 12:10:31,685][102897] Updated weights for policy 0, policy_version 10020 (0.0008) +[2023-10-08 12:10:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 20512768. Throughput: 0: 1795.3, 1: 1783.7. Samples: 5144564. Policy #0 lag: (min: 31.0, avg: 32.8, max: 60.0) +[2023-10-08 12:10:31,876][101941] Avg episode reward: [(0, '6.540'), (1, '5.460')] +[2023-10-08 12:10:32,053][102897] Updated weights for policy 0, policy_version 10030 (0.0008) +[2023-10-08 12:10:32,429][102897] Updated weights for policy 0, policy_version 10040 (0.0009) +[2023-10-08 12:10:32,507][102898] Updated weights for policy 1, policy_version 10020 (0.0007) +[2023-10-08 12:10:32,905][102898] Updated weights for policy 1, policy_version 10030 (0.0008) +[2023-10-08 12:10:33,274][102898] Updated weights for policy 1, policy_version 10040 (0.0008) +[2023-10-08 12:10:36,148][102897] Updated weights for policy 0, policy_version 10050 (0.0008) +[2023-10-08 12:10:36,525][102897] Updated weights for policy 0, policy_version 10060 (0.0011) +[2023-10-08 12:10:36,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 20578304. Throughput: 0: 1774.9, 1: 1786.6. Samples: 5154264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:10:36,875][101941] Avg episode reward: [(0, '5.780'), (1, '5.500')] +[2023-10-08 12:10:36,892][102897] Updated weights for policy 0, policy_version 10070 (0.0009) +[2023-10-08 12:10:36,903][102898] Updated weights for policy 1, policy_version 10050 (0.0007) +[2023-10-08 12:10:37,266][102898] Updated weights for policy 1, policy_version 10060 (0.0009) +[2023-10-08 12:10:37,269][102897] Updated weights for policy 0, policy_version 10080 (0.0009) +[2023-10-08 12:10:37,627][102898] Updated weights for policy 1, policy_version 10070 (0.0008) +[2023-10-08 12:10:37,995][102898] Updated weights for policy 1, policy_version 10080 (0.0007) +[2023-10-08 12:10:41,045][102897] Updated weights for policy 0, policy_version 10090 (0.0009) +[2023-10-08 12:10:41,408][102897] Updated weights for policy 0, policy_version 10100 (0.0009) +[2023-10-08 12:10:41,771][102898] Updated weights for policy 1, policy_version 10090 (0.0008) +[2023-10-08 12:10:41,778][102897] Updated weights for policy 0, policy_version 10110 (0.0007) +[2023-10-08 12:10:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 20676608. Throughput: 0: 1789.9, 1: 1789.0. Samples: 5176568. Policy #0 lag: (min: 31.0, avg: 37.3, max: 63.0) +[2023-10-08 12:10:41,876][101941] Avg episode reward: [(0, '5.660'), (1, '5.280')] +[2023-10-08 12:10:42,135][102898] Updated weights for policy 1, policy_version 10100 (0.0007) +[2023-10-08 12:10:42,506][102898] Updated weights for policy 1, policy_version 10110 (0.0010) +[2023-10-08 12:10:45,440][102897] Updated weights for policy 0, policy_version 10120 (0.0008) +[2023-10-08 12:10:45,819][102897] Updated weights for policy 0, policy_version 10130 (0.0007) +[2023-10-08 12:10:46,181][102897] Updated weights for policy 0, policy_version 10140 (0.0007) +[2023-10-08 12:10:46,396][102898] Updated weights for policy 1, policy_version 10120 (0.0008) +[2023-10-08 12:10:46,763][102898] Updated weights for policy 1, policy_version 10130 (0.0010) +[2023-10-08 12:10:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 20742144. Throughput: 0: 1779.0, 1: 1806.8. Samples: 5197194. Policy #0 lag: (min: 31.0, avg: 37.3, max: 63.0) +[2023-10-08 12:10:46,876][101941] Avg episode reward: [(0, '5.570'), (1, '6.080')] +[2023-10-08 12:10:47,139][102898] Updated weights for policy 1, policy_version 10140 (0.0011) +[2023-10-08 12:10:49,994][102897] Updated weights for policy 0, policy_version 10150 (0.0008) +[2023-10-08 12:10:50,362][102897] Updated weights for policy 0, policy_version 10160 (0.0008) +[2023-10-08 12:10:50,729][102897] Updated weights for policy 0, policy_version 10170 (0.0007) +[2023-10-08 12:10:50,880][102898] Updated weights for policy 1, policy_version 10150 (0.0009) +[2023-10-08 12:10:51,252][102898] Updated weights for policy 1, policy_version 10160 (0.0009) +[2023-10-08 12:10:51,620][102898] Updated weights for policy 1, policy_version 10170 (0.0007) +[2023-10-08 12:10:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 20840448. Throughput: 0: 1793.9, 1: 1790.1. Samples: 5209108. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:10:51,875][101941] Avg episode reward: [(0, '6.060'), (1, '6.160')] +[2023-10-08 12:10:54,618][102897] Updated weights for policy 0, policy_version 10180 (0.0009) +[2023-10-08 12:10:54,988][102897] Updated weights for policy 0, policy_version 10190 (0.0009) +[2023-10-08 12:10:55,201][102898] Updated weights for policy 1, policy_version 10180 (0.0007) +[2023-10-08 12:10:55,354][102897] Updated weights for policy 0, policy_version 10200 (0.0010) +[2023-10-08 12:10:55,566][102898] Updated weights for policy 1, policy_version 10190 (0.0007) +[2023-10-08 12:10:55,939][102898] Updated weights for policy 1, policy_version 10200 (0.0008) +[2023-10-08 12:10:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 20905984. Throughput: 0: 1784.4, 1: 1809.5. Samples: 5229974. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:10:56,876][101941] Avg episode reward: [(0, '6.340'), (1, '5.360')] +[2023-10-08 12:10:59,220][102897] Updated weights for policy 0, policy_version 10210 (0.0007) +[2023-10-08 12:10:59,591][102897] Updated weights for policy 0, policy_version 10220 (0.0007) +[2023-10-08 12:10:59,622][102898] Updated weights for policy 1, policy_version 10210 (0.0008) +[2023-10-08 12:10:59,965][102897] Updated weights for policy 0, policy_version 10230 (0.0007) +[2023-10-08 12:10:59,997][102898] Updated weights for policy 1, policy_version 10220 (0.0008) +[2023-10-08 12:11:00,339][102897] Updated weights for policy 0, policy_version 10240 (0.0009) +[2023-10-08 12:11:00,374][102898] Updated weights for policy 1, policy_version 10230 (0.0009) +[2023-10-08 12:11:00,737][102898] Updated weights for policy 1, policy_version 10240 (0.0011) +[2023-10-08 12:11:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 20971520. Throughput: 0: 1770.6, 1: 1800.0. Samples: 5250696. Policy #0 lag: (min: 5.0, avg: 13.0, max: 37.0) +[2023-10-08 12:11:01,876][101941] Avg episode reward: [(0, '6.280'), (1, '5.490')] +[2023-10-08 12:11:04,059][102897] Updated weights for policy 0, policy_version 10250 (0.0010) +[2023-10-08 12:11:04,428][102897] Updated weights for policy 0, policy_version 10260 (0.0008) +[2023-10-08 12:11:04,502][102898] Updated weights for policy 1, policy_version 10250 (0.0007) +[2023-10-08 12:11:04,802][102897] Updated weights for policy 0, policy_version 10270 (0.0008) +[2023-10-08 12:11:04,859][102898] Updated weights for policy 1, policy_version 10260 (0.0007) +[2023-10-08 12:11:05,228][102898] Updated weights for policy 1, policy_version 10270 (0.0009) +[2023-10-08 12:11:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 21037056. Throughput: 0: 1790.0, 1: 1806.2. Samples: 5262326. Policy #0 lag: (min: 5.0, avg: 13.0, max: 37.0) +[2023-10-08 12:11:06,876][101941] Avg episode reward: [(0, '6.000'), (1, '5.530')] +[2023-10-08 12:11:08,648][102897] Updated weights for policy 0, policy_version 10280 (0.0009) +[2023-10-08 12:11:09,022][102897] Updated weights for policy 0, policy_version 10290 (0.0008) +[2023-10-08 12:11:09,031][102898] Updated weights for policy 1, policy_version 10280 (0.0010) +[2023-10-08 12:11:09,391][102897] Updated weights for policy 0, policy_version 10300 (0.0008) +[2023-10-08 12:11:09,397][102898] Updated weights for policy 1, policy_version 10290 (0.0007) +[2023-10-08 12:11:09,763][102898] Updated weights for policy 1, policy_version 10300 (0.0009) +[2023-10-08 12:11:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 21102592. Throughput: 0: 1776.7, 1: 1789.8. Samples: 5282852. Policy #0 lag: (min: 19.0, avg: 22.5, max: 51.0) +[2023-10-08 12:11:11,876][101941] Avg episode reward: [(0, '5.710'), (1, '5.580')] +[2023-10-08 12:11:13,331][102897] Updated weights for policy 0, policy_version 10310 (0.0010) +[2023-10-08 12:11:13,525][102898] Updated weights for policy 1, policy_version 10310 (0.0007) +[2023-10-08 12:11:13,709][102897] Updated weights for policy 0, policy_version 10320 (0.0008) +[2023-10-08 12:11:13,890][102898] Updated weights for policy 1, policy_version 10320 (0.0009) +[2023-10-08 12:11:14,080][102897] Updated weights for policy 0, policy_version 10330 (0.0007) +[2023-10-08 12:11:14,257][102898] Updated weights for policy 1, policy_version 10330 (0.0008) +[2023-10-08 12:11:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 21168128. Throughput: 0: 1771.6, 1: 1788.0. Samples: 5304742. Policy #0 lag: (min: 19.0, avg: 22.5, max: 51.0) +[2023-10-08 12:11:16,875][101941] Avg episode reward: [(0, '5.880'), (1, '5.550')] +[2023-10-08 12:11:17,926][102897] Updated weights for policy 0, policy_version 10340 (0.0008) +[2023-10-08 12:11:18,187][102898] Updated weights for policy 1, policy_version 10340 (0.0007) +[2023-10-08 12:11:18,305][102897] Updated weights for policy 0, policy_version 10350 (0.0007) +[2023-10-08 12:11:18,584][102898] Updated weights for policy 1, policy_version 10350 (0.0007) +[2023-10-08 12:11:18,682][102897] Updated weights for policy 0, policy_version 10360 (0.0007) +[2023-10-08 12:11:18,952][102898] Updated weights for policy 1, policy_version 10360 (0.0007) +[2023-10-08 12:11:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 21233664. Throughput: 0: 1768.0, 1: 1784.8. Samples: 5314140. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 12:11:21,875][101941] Avg episode reward: [(0, '5.370'), (1, '5.220')] +[2023-10-08 12:11:22,473][102897] Updated weights for policy 0, policy_version 10370 (0.0008) +[2023-10-08 12:11:22,605][102898] Updated weights for policy 1, policy_version 10370 (0.0007) +[2023-10-08 12:11:22,852][102897] Updated weights for policy 0, policy_version 10380 (0.0009) +[2023-10-08 12:11:22,969][102898] Updated weights for policy 1, policy_version 10380 (0.0008) +[2023-10-08 12:11:23,220][102897] Updated weights for policy 0, policy_version 10390 (0.0009) +[2023-10-08 12:11:23,333][102898] Updated weights for policy 1, policy_version 10390 (0.0007) +[2023-10-08 12:11:23,593][102897] Updated weights for policy 0, policy_version 10400 (0.0009) +[2023-10-08 12:11:23,704][102898] Updated weights for policy 1, policy_version 10400 (0.0009) +[2023-10-08 12:11:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 21299200. Throughput: 0: 1767.7, 1: 1780.9. Samples: 5336256. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 12:11:26,876][101941] Avg episode reward: [(0, '5.540'), (1, '5.520')] +[2023-10-08 12:11:27,269][102897] Updated weights for policy 0, policy_version 10410 (0.0007) +[2023-10-08 12:11:27,567][102898] Updated weights for policy 1, policy_version 10410 (0.0007) +[2023-10-08 12:11:27,641][102897] Updated weights for policy 0, policy_version 10420 (0.0007) +[2023-10-08 12:11:27,935][102898] Updated weights for policy 1, policy_version 10420 (0.0009) +[2023-10-08 12:11:28,010][102897] Updated weights for policy 0, policy_version 10430 (0.0008) +[2023-10-08 12:11:28,307][102898] Updated weights for policy 1, policy_version 10430 (0.0009) +[2023-10-08 12:11:31,872][102897] Updated weights for policy 0, policy_version 10440 (0.0008) +[2023-10-08 12:11:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 21364736. Throughput: 0: 1794.4, 1: 1788.8. Samples: 5358436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:11:31,875][101941] Avg episode reward: [(0, '5.900'), (1, '5.810')] +[2023-10-08 12:11:32,110][102898] Updated weights for policy 1, policy_version 10440 (0.0009) +[2023-10-08 12:11:32,253][102897] Updated weights for policy 0, policy_version 10450 (0.0009) +[2023-10-08 12:11:32,476][102898] Updated weights for policy 1, policy_version 10450 (0.0007) +[2023-10-08 12:11:32,637][102897] Updated weights for policy 0, policy_version 10460 (0.0007) +[2023-10-08 12:11:32,847][102898] Updated weights for policy 1, policy_version 10460 (0.0009) +[2023-10-08 12:11:36,461][102897] Updated weights for policy 0, policy_version 10470 (0.0007) +[2023-10-08 12:11:36,586][102898] Updated weights for policy 1, policy_version 10470 (0.0008) +[2023-10-08 12:11:36,833][102897] Updated weights for policy 0, policy_version 10480 (0.0007) +[2023-10-08 12:11:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 21430272. Throughput: 0: 1755.8, 1: 1776.3. Samples: 5368054. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:11:36,875][101941] Avg episode reward: [(0, '6.060'), (1, '5.530')] +[2023-10-08 12:11:36,942][102898] Updated weights for policy 1, policy_version 10480 (0.0007) +[2023-10-08 12:11:37,210][102897] Updated weights for policy 0, policy_version 10490 (0.0007) +[2023-10-08 12:11:37,304][102898] Updated weights for policy 1, policy_version 10490 (0.0007) +[2023-10-08 12:11:41,067][102897] Updated weights for policy 0, policy_version 10500 (0.0008) +[2023-10-08 12:11:41,151][102898] Updated weights for policy 1, policy_version 10500 (0.0007) +[2023-10-08 12:11:41,435][102897] Updated weights for policy 0, policy_version 10510 (0.0007) +[2023-10-08 12:11:41,525][102898] Updated weights for policy 1, policy_version 10510 (0.0009) +[2023-10-08 12:11:41,805][102897] Updated weights for policy 0, policy_version 10520 (0.0009) +[2023-10-08 12:11:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 21495808. Throughput: 0: 1782.8, 1: 1782.3. Samples: 5390404. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:11:41,876][101941] Avg episode reward: [(0, '6.020'), (1, '4.840')] +[2023-10-08 12:11:41,898][102898] Updated weights for policy 1, policy_version 10520 (0.0008) +[2023-10-08 12:11:45,403][102897] Updated weights for policy 0, policy_version 10530 (0.0007) +[2023-10-08 12:11:45,685][102898] Updated weights for policy 1, policy_version 10530 (0.0008) +[2023-10-08 12:11:45,785][102897] Updated weights for policy 0, policy_version 10540 (0.0009) +[2023-10-08 12:11:46,050][102898] Updated weights for policy 1, policy_version 10540 (0.0008) +[2023-10-08 12:11:46,152][102897] Updated weights for policy 0, policy_version 10550 (0.0007) +[2023-10-08 12:11:46,410][102898] Updated weights for policy 1, policy_version 10550 (0.0007) +[2023-10-08 12:11:46,512][102897] Updated weights for policy 0, policy_version 10560 (0.0008) +[2023-10-08 12:11:46,775][102898] Updated weights for policy 1, policy_version 10560 (0.0007) +[2023-10-08 12:11:46,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 21626880. Throughput: 0: 1766.0, 1: 1788.5. Samples: 5410650. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:11:46,875][101941] Avg episode reward: [(0, '6.730'), (1, '5.170')] +[2023-10-08 12:11:50,291][102897] Updated weights for policy 0, policy_version 10570 (0.0008) +[2023-10-08 12:11:50,408][102898] Updated weights for policy 1, policy_version 10570 (0.0009) +[2023-10-08 12:11:50,671][102897] Updated weights for policy 0, policy_version 10580 (0.0008) +[2023-10-08 12:11:50,784][102898] Updated weights for policy 1, policy_version 10580 (0.0007) +[2023-10-08 12:11:51,043][102897] Updated weights for policy 0, policy_version 10590 (0.0009) +[2023-10-08 12:11:51,155][102898] Updated weights for policy 1, policy_version 10590 (0.0007) +[2023-10-08 12:11:51,875][101941] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 21692416. Throughput: 0: 1776.3, 1: 1785.9. Samples: 5422626. Policy #0 lag: (min: 25.0, avg: 29.3, max: 57.0) +[2023-10-08 12:11:51,875][101941] Avg episode reward: [(0, '6.810'), (1, '5.360')] +[2023-10-08 12:11:54,804][102897] Updated weights for policy 0, policy_version 10600 (0.0009) +[2023-10-08 12:11:55,046][102898] Updated weights for policy 1, policy_version 10600 (0.0008) +[2023-10-08 12:11:55,176][102897] Updated weights for policy 0, policy_version 10610 (0.0008) +[2023-10-08 12:11:55,409][102898] Updated weights for policy 1, policy_version 10610 (0.0010) +[2023-10-08 12:11:55,540][102897] Updated weights for policy 0, policy_version 10620 (0.0008) +[2023-10-08 12:11:55,777][102898] Updated weights for policy 1, policy_version 10620 (0.0010) +[2023-10-08 12:11:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 21757952. Throughput: 0: 1763.2, 1: 1792.2. Samples: 5442844. Policy #0 lag: (min: 25.0, avg: 29.3, max: 57.0) +[2023-10-08 12:11:56,875][101941] Avg episode reward: [(0, '6.260'), (1, '5.290')] +[2023-10-08 12:11:59,290][102897] Updated weights for policy 0, policy_version 10630 (0.0007) +[2023-10-08 12:11:59,398][102898] Updated weights for policy 1, policy_version 10630 (0.0007) +[2023-10-08 12:11:59,669][102897] Updated weights for policy 0, policy_version 10640 (0.0008) +[2023-10-08 12:11:59,764][102898] Updated weights for policy 1, policy_version 10640 (0.0007) +[2023-10-08 12:12:00,041][102897] Updated weights for policy 0, policy_version 10650 (0.0007) +[2023-10-08 12:12:00,133][102898] Updated weights for policy 1, policy_version 10650 (0.0008) +[2023-10-08 12:12:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 21823488. Throughput: 0: 1759.2, 1: 1782.5. Samples: 5464120. Policy #0 lag: (min: 25.0, avg: 29.3, max: 57.0) +[2023-10-08 12:12:01,875][101941] Avg episode reward: [(0, '6.110'), (1, '5.620')] +[2023-10-08 12:12:03,855][102897] Updated weights for policy 0, policy_version 10660 (0.0007) +[2023-10-08 12:12:04,227][102897] Updated weights for policy 0, policy_version 10670 (0.0007) +[2023-10-08 12:12:04,270][102898] Updated weights for policy 1, policy_version 10660 (0.0008) +[2023-10-08 12:12:04,602][102897] Updated weights for policy 0, policy_version 10680 (0.0007) +[2023-10-08 12:12:04,658][102898] Updated weights for policy 1, policy_version 10670 (0.0008) +[2023-10-08 12:12:05,022][102898] Updated weights for policy 1, policy_version 10680 (0.0007) +[2023-10-08 12:12:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 21889024. Throughput: 0: 1779.7, 1: 1799.6. Samples: 5475212. Policy #0 lag: (min: 27.0, avg: 27.2, max: 37.0) +[2023-10-08 12:12:06,876][101941] Avg episode reward: [(0, '5.850'), (1, '5.350')] +[2023-10-08 12:12:08,438][102897] Updated weights for policy 0, policy_version 10690 (0.0008) +[2023-10-08 12:12:08,723][102898] Updated weights for policy 1, policy_version 10690 (0.0009) +[2023-10-08 12:12:08,807][102897] Updated weights for policy 0, policy_version 10700 (0.0008) +[2023-10-08 12:12:09,095][102898] Updated weights for policy 1, policy_version 10700 (0.0009) +[2023-10-08 12:12:09,184][102897] Updated weights for policy 0, policy_version 10710 (0.0008) +[2023-10-08 12:12:09,453][102898] Updated weights for policy 1, policy_version 10710 (0.0008) +[2023-10-08 12:12:09,548][102897] Updated weights for policy 0, policy_version 10720 (0.0007) +[2023-10-08 12:12:09,833][102898] Updated weights for policy 1, policy_version 10720 (0.0008) +[2023-10-08 12:12:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 21954560. Throughput: 0: 1765.2, 1: 1779.1. Samples: 5495750. Policy #0 lag: (min: 27.0, avg: 27.2, max: 37.0) +[2023-10-08 12:12:11,876][101941] Avg episode reward: [(0, '5.680'), (1, '5.410')] +[2023-10-08 12:12:13,562][102897] Updated weights for policy 0, policy_version 10730 (0.0009) +[2023-10-08 12:12:13,635][102898] Updated weights for policy 1, policy_version 10730 (0.0008) +[2023-10-08 12:12:13,932][102897] Updated weights for policy 0, policy_version 10740 (0.0009) +[2023-10-08 12:12:14,005][102898] Updated weights for policy 1, policy_version 10740 (0.0007) +[2023-10-08 12:12:14,301][102897] Updated weights for policy 0, policy_version 10750 (0.0008) +[2023-10-08 12:12:14,371][102898] Updated weights for policy 1, policy_version 10750 (0.0008) +[2023-10-08 12:12:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 22020096. Throughput: 0: 1760.0, 1: 1782.0. Samples: 5517824. Policy #0 lag: (min: 2.0, avg: 6.9, max: 34.0) +[2023-10-08 12:12:16,876][101941] Avg episode reward: [(0, '5.900'), (1, '5.750')] +[2023-10-08 12:12:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000010752_11010048.pth... +[2023-10-08 12:12:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000010752_11010048.pth... +[2023-10-08 12:12:16,917][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000009088_9306112.pth +[2023-10-08 12:12:16,923][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000009088_9306112.pth +[2023-10-08 12:12:18,191][102897] Updated weights for policy 0, policy_version 10760 (0.0008) +[2023-10-08 12:12:18,225][102898] Updated weights for policy 1, policy_version 10760 (0.0009) +[2023-10-08 12:12:18,567][102897] Updated weights for policy 0, policy_version 10770 (0.0009) +[2023-10-08 12:12:18,586][102898] Updated weights for policy 1, policy_version 10770 (0.0007) +[2023-10-08 12:12:18,929][102897] Updated weights for policy 0, policy_version 10780 (0.0009) +[2023-10-08 12:12:18,960][102898] Updated weights for policy 1, policy_version 10780 (0.0009) +[2023-10-08 12:12:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 22085632. Throughput: 0: 1762.2, 1: 1780.7. Samples: 5527484. Policy #0 lag: (min: 2.0, avg: 6.9, max: 34.0) +[2023-10-08 12:12:21,876][101941] Avg episode reward: [(0, '6.300'), (1, '5.970')] +[2023-10-08 12:12:22,708][102898] Updated weights for policy 1, policy_version 10790 (0.0007) +[2023-10-08 12:12:22,710][102897] Updated weights for policy 0, policy_version 10790 (0.0007) +[2023-10-08 12:12:23,074][102898] Updated weights for policy 1, policy_version 10800 (0.0007) +[2023-10-08 12:12:23,085][102897] Updated weights for policy 0, policy_version 10800 (0.0007) +[2023-10-08 12:12:23,447][102898] Updated weights for policy 1, policy_version 10810 (0.0007) +[2023-10-08 12:12:23,451][102897] Updated weights for policy 0, policy_version 10810 (0.0007) +[2023-10-08 12:12:26,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 22151168. Throughput: 0: 1760.3, 1: 1777.7. Samples: 5549614. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:12:26,876][101941] Avg episode reward: [(0, '6.340'), (1, '5.910')] +[2023-10-08 12:12:27,241][102898] Updated weights for policy 1, policy_version 10820 (0.0007) +[2023-10-08 12:12:27,311][102897] Updated weights for policy 0, policy_version 10820 (0.0007) +[2023-10-08 12:12:27,605][102898] Updated weights for policy 1, policy_version 10830 (0.0007) +[2023-10-08 12:12:27,682][102897] Updated weights for policy 0, policy_version 10830 (0.0007) +[2023-10-08 12:12:27,975][102898] Updated weights for policy 1, policy_version 10840 (0.0008) +[2023-10-08 12:12:28,057][102897] Updated weights for policy 0, policy_version 10840 (0.0008) +[2023-10-08 12:12:31,714][102898] Updated weights for policy 1, policy_version 10850 (0.0009) +[2023-10-08 12:12:31,788][102897] Updated weights for policy 0, policy_version 10850 (0.0008) +[2023-10-08 12:12:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 22216704. Throughput: 0: 1785.9, 1: 1795.5. Samples: 5571812. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:12:31,875][101941] Avg episode reward: [(0, '6.070'), (1, '5.920')] +[2023-10-08 12:12:32,078][102898] Updated weights for policy 1, policy_version 10860 (0.0007) +[2023-10-08 12:12:32,161][102897] Updated weights for policy 0, policy_version 10860 (0.0007) +[2023-10-08 12:12:32,443][102898] Updated weights for policy 1, policy_version 10870 (0.0007) +[2023-10-08 12:12:32,526][102897] Updated weights for policy 0, policy_version 10870 (0.0008) +[2023-10-08 12:12:32,803][102898] Updated weights for policy 1, policy_version 10880 (0.0008) +[2023-10-08 12:12:32,888][102897] Updated weights for policy 0, policy_version 10880 (0.0009) +[2023-10-08 12:12:36,554][102898] Updated weights for policy 1, policy_version 10890 (0.0008) +[2023-10-08 12:12:36,557][102897] Updated weights for policy 0, policy_version 10890 (0.0007) +[2023-10-08 12:12:36,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 22282240. Throughput: 0: 1758.7, 1: 1772.8. Samples: 5581544. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:12:36,875][101941] Avg episode reward: [(0, '6.420'), (1, '5.690')] +[2023-10-08 12:12:36,919][102898] Updated weights for policy 1, policy_version 10900 (0.0007) +[2023-10-08 12:12:36,932][102897] Updated weights for policy 0, policy_version 10900 (0.0007) +[2023-10-08 12:12:37,283][102898] Updated weights for policy 1, policy_version 10910 (0.0008) +[2023-10-08 12:12:37,310][102897] Updated weights for policy 0, policy_version 10910 (0.0007) +[2023-10-08 12:12:41,003][102897] Updated weights for policy 0, policy_version 10920 (0.0008) +[2023-10-08 12:12:41,103][102898] Updated weights for policy 1, policy_version 10920 (0.0008) +[2023-10-08 12:12:41,382][102897] Updated weights for policy 0, policy_version 10930 (0.0008) +[2023-10-08 12:12:41,466][102898] Updated weights for policy 1, policy_version 10930 (0.0007) +[2023-10-08 12:12:41,741][102897] Updated weights for policy 0, policy_version 10940 (0.0008) +[2023-10-08 12:12:41,840][102898] Updated weights for policy 1, policy_version 10940 (0.0007) +[2023-10-08 12:12:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 22347776. Throughput: 0: 1787.1, 1: 1792.7. Samples: 5603940. Policy #0 lag: (min: 2.0, avg: 3.5, max: 24.0) +[2023-10-08 12:12:41,876][101941] Avg episode reward: [(0, '6.450'), (1, '5.710')] +[2023-10-08 12:12:45,627][102898] Updated weights for policy 1, policy_version 10950 (0.0009) +[2023-10-08 12:12:45,678][102897] Updated weights for policy 0, policy_version 10950 (0.0009) +[2023-10-08 12:12:45,995][102898] Updated weights for policy 1, policy_version 10960 (0.0007) +[2023-10-08 12:12:46,064][102897] Updated weights for policy 0, policy_version 10960 (0.0008) +[2023-10-08 12:12:46,359][102898] Updated weights for policy 1, policy_version 10970 (0.0007) +[2023-10-08 12:12:46,432][102897] Updated weights for policy 0, policy_version 10970 (0.0009) +[2023-10-08 12:12:46,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 22478848. Throughput: 0: 1769.3, 1: 1772.4. Samples: 5623494. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:12:46,875][101941] Avg episode reward: [(0, '5.450'), (1, '5.460')] +[2023-10-08 12:12:50,267][102898] Updated weights for policy 1, policy_version 10980 (0.0010) +[2023-10-08 12:12:50,331][102897] Updated weights for policy 0, policy_version 10980 (0.0007) +[2023-10-08 12:12:50,669][102898] Updated weights for policy 1, policy_version 10990 (0.0008) +[2023-10-08 12:12:50,702][102897] Updated weights for policy 0, policy_version 10990 (0.0007) +[2023-10-08 12:12:51,041][102898] Updated weights for policy 1, policy_version 11000 (0.0007) +[2023-10-08 12:12:51,074][102897] Updated weights for policy 0, policy_version 11000 (0.0008) +[2023-10-08 12:12:51,875][101941] Fps is (10 sec: 19661.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 22544384. Throughput: 0: 1769.6, 1: 1781.2. Samples: 5634994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:12:51,875][101941] Avg episode reward: [(0, '5.210'), (1, '4.810')] +[2023-10-08 12:12:54,789][102898] Updated weights for policy 1, policy_version 11010 (0.0007) +[2023-10-08 12:12:54,935][102897] Updated weights for policy 0, policy_version 11010 (0.0008) +[2023-10-08 12:12:55,163][102898] Updated weights for policy 1, policy_version 11020 (0.0008) +[2023-10-08 12:12:55,317][102897] Updated weights for policy 0, policy_version 11020 (0.0009) +[2023-10-08 12:12:55,528][102898] Updated weights for policy 1, policy_version 11030 (0.0008) +[2023-10-08 12:12:55,677][102897] Updated weights for policy 0, policy_version 11030 (0.0008) +[2023-10-08 12:12:55,897][102898] Updated weights for policy 1, policy_version 11040 (0.0008) +[2023-10-08 12:12:56,057][102897] Updated weights for policy 0, policy_version 11040 (0.0008) +[2023-10-08 12:12:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 22609920. Throughput: 0: 1773.6, 1: 1778.7. Samples: 5655602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:12:56,876][101941] Avg episode reward: [(0, '5.330'), (1, '5.060')] +[2023-10-08 12:12:59,624][102898] Updated weights for policy 1, policy_version 11050 (0.0008) +[2023-10-08 12:12:59,830][102897] Updated weights for policy 0, policy_version 11050 (0.0007) +[2023-10-08 12:12:59,989][102898] Updated weights for policy 1, policy_version 11060 (0.0008) +[2023-10-08 12:13:00,201][102897] Updated weights for policy 0, policy_version 11060 (0.0007) +[2023-10-08 12:13:00,366][102898] Updated weights for policy 1, policy_version 11070 (0.0009) +[2023-10-08 12:13:00,581][102897] Updated weights for policy 0, policy_version 11070 (0.0008) +[2023-10-08 12:13:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 22675456. Throughput: 0: 1758.4, 1: 1765.5. Samples: 5676402. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:13:01,876][101941] Avg episode reward: [(0, '5.640'), (1, '5.620')] +[2023-10-08 12:13:04,176][102898] Updated weights for policy 1, policy_version 11080 (0.0008) +[2023-10-08 12:13:04,436][102897] Updated weights for policy 0, policy_version 11080 (0.0009) +[2023-10-08 12:13:04,549][102898] Updated weights for policy 1, policy_version 11090 (0.0008) +[2023-10-08 12:13:04,800][102897] Updated weights for policy 0, policy_version 11090 (0.0008) +[2023-10-08 12:13:04,919][102898] Updated weights for policy 1, policy_version 11100 (0.0007) +[2023-10-08 12:13:05,172][102897] Updated weights for policy 0, policy_version 11100 (0.0009) +[2023-10-08 12:13:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 22740992. Throughput: 0: 1779.6, 1: 1783.1. Samples: 5687808. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:13:06,876][101941] Avg episode reward: [(0, '5.570'), (1, '5.790')] +[2023-10-08 12:13:08,751][102898] Updated weights for policy 1, policy_version 11110 (0.0008) +[2023-10-08 12:13:09,089][102897] Updated weights for policy 0, policy_version 11110 (0.0008) +[2023-10-08 12:13:09,113][102898] Updated weights for policy 1, policy_version 11120 (0.0008) +[2023-10-08 12:13:09,460][102897] Updated weights for policy 0, policy_version 11120 (0.0007) +[2023-10-08 12:13:09,479][102898] Updated weights for policy 1, policy_version 11130 (0.0008) +[2023-10-08 12:13:09,828][102897] Updated weights for policy 0, policy_version 11130 (0.0007) +[2023-10-08 12:13:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 22806528. Throughput: 0: 1750.6, 1: 1763.6. Samples: 5707754. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:13:11,876][101941] Avg episode reward: [(0, '5.590'), (1, '5.630')] +[2023-10-08 12:13:13,174][102898] Updated weights for policy 1, policy_version 11140 (0.0007) +[2023-10-08 12:13:13,543][102898] Updated weights for policy 1, policy_version 11150 (0.0010) +[2023-10-08 12:13:13,638][102897] Updated weights for policy 0, policy_version 11140 (0.0008) +[2023-10-08 12:13:13,915][102898] Updated weights for policy 1, policy_version 11160 (0.0008) +[2023-10-08 12:13:14,010][102897] Updated weights for policy 0, policy_version 11150 (0.0008) +[2023-10-08 12:13:14,390][102897] Updated weights for policy 0, policy_version 11160 (0.0008) +[2023-10-08 12:13:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 22872064. Throughput: 0: 1752.0, 1: 1768.2. Samples: 5730218. Policy #0 lag: (min: 29.0, avg: 29.4, max: 43.0) +[2023-10-08 12:13:16,876][101941] Avg episode reward: [(0, '5.370'), (1, '5.920')] +[2023-10-08 12:13:17,675][102898] Updated weights for policy 1, policy_version 11170 (0.0008) +[2023-10-08 12:13:18,038][102898] Updated weights for policy 1, policy_version 11180 (0.0007) +[2023-10-08 12:13:18,127][102897] Updated weights for policy 0, policy_version 11170 (0.0009) +[2023-10-08 12:13:18,410][102898] Updated weights for policy 1, policy_version 11190 (0.0008) +[2023-10-08 12:13:18,498][102897] Updated weights for policy 0, policy_version 11180 (0.0007) +[2023-10-08 12:13:18,770][102898] Updated weights for policy 1, policy_version 11200 (0.0008) +[2023-10-08 12:13:18,869][102897] Updated weights for policy 0, policy_version 11190 (0.0008) +[2023-10-08 12:13:19,246][102897] Updated weights for policy 0, policy_version 11200 (0.0008) +[2023-10-08 12:13:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 22937600. Throughput: 0: 1755.1, 1: 1769.0. Samples: 5740128. Policy #0 lag: (min: 29.0, avg: 29.4, max: 43.0) +[2023-10-08 12:13:21,876][101941] Avg episode reward: [(0, '5.420'), (1, '5.770')] +[2023-10-08 12:13:22,522][102898] Updated weights for policy 1, policy_version 11210 (0.0007) +[2023-10-08 12:13:22,890][102898] Updated weights for policy 1, policy_version 11220 (0.0007) +[2023-10-08 12:13:22,956][102897] Updated weights for policy 0, policy_version 11210 (0.0009) +[2023-10-08 12:13:23,263][102898] Updated weights for policy 1, policy_version 11230 (0.0008) +[2023-10-08 12:13:23,334][102897] Updated weights for policy 0, policy_version 11220 (0.0009) +[2023-10-08 12:13:23,713][102897] Updated weights for policy 0, policy_version 11230 (0.0009) +[2023-10-08 12:13:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.6, 300 sec: 14218.0). Total num frames: 23003136. Throughput: 0: 1752.5, 1: 1770.0. Samples: 5762450. Policy #0 lag: (min: 29.0, avg: 29.4, max: 43.0) +[2023-10-08 12:13:26,875][101941] Avg episode reward: [(0, '5.800'), (1, '5.600')] +[2023-10-08 12:13:27,033][102898] Updated weights for policy 1, policy_version 11240 (0.0008) +[2023-10-08 12:13:27,405][102898] Updated weights for policy 1, policy_version 11250 (0.0008) +[2023-10-08 12:13:27,523][102897] Updated weights for policy 0, policy_version 11240 (0.0009) +[2023-10-08 12:13:27,767][102898] Updated weights for policy 1, policy_version 11260 (0.0008) +[2023-10-08 12:13:27,899][102897] Updated weights for policy 0, policy_version 11250 (0.0009) +[2023-10-08 12:13:28,265][102897] Updated weights for policy 0, policy_version 11260 (0.0010) +[2023-10-08 12:13:31,644][102898] Updated weights for policy 1, policy_version 11270 (0.0009) +[2023-10-08 12:13:31,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23068672. Throughput: 0: 1781.4, 1: 1798.4. Samples: 5784588. Policy #0 lag: (min: 28.0, avg: 33.6, max: 60.0) +[2023-10-08 12:13:31,875][101941] Avg episode reward: [(0, '5.960'), (1, '5.860')] +[2023-10-08 12:13:32,004][102898] Updated weights for policy 1, policy_version 11280 (0.0009) +[2023-10-08 12:13:32,223][102897] Updated weights for policy 0, policy_version 11270 (0.0007) +[2023-10-08 12:13:32,380][102898] Updated weights for policy 1, policy_version 11290 (0.0008) +[2023-10-08 12:13:32,606][102897] Updated weights for policy 0, policy_version 11280 (0.0010) +[2023-10-08 12:13:32,983][102897] Updated weights for policy 0, policy_version 11290 (0.0009) +[2023-10-08 12:13:36,248][102898] Updated weights for policy 1, policy_version 11300 (0.0009) +[2023-10-08 12:13:36,642][102898] Updated weights for policy 1, policy_version 11310 (0.0009) +[2023-10-08 12:13:36,743][102897] Updated weights for policy 0, policy_version 11300 (0.0007) +[2023-10-08 12:13:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 23134208. Throughput: 0: 1759.6, 1: 1774.1. Samples: 5794014. Policy #0 lag: (min: 28.0, avg: 33.6, max: 60.0) +[2023-10-08 12:13:36,876][101941] Avg episode reward: [(0, '6.640'), (1, '6.080')] +[2023-10-08 12:13:37,017][102898] Updated weights for policy 1, policy_version 11320 (0.0008) +[2023-10-08 12:13:37,117][102897] Updated weights for policy 0, policy_version 11310 (0.0007) +[2023-10-08 12:13:37,492][102897] Updated weights for policy 0, policy_version 11320 (0.0008) +[2023-10-08 12:13:40,802][102898] Updated weights for policy 1, policy_version 11330 (0.0009) +[2023-10-08 12:13:41,179][102898] Updated weights for policy 1, policy_version 11340 (0.0009) +[2023-10-08 12:13:41,309][102897] Updated weights for policy 0, policy_version 11330 (0.0008) +[2023-10-08 12:13:41,546][102898] Updated weights for policy 1, policy_version 11350 (0.0008) +[2023-10-08 12:13:41,686][102897] Updated weights for policy 0, policy_version 11340 (0.0007) +[2023-10-08 12:13:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23199744. Throughput: 0: 1775.8, 1: 1792.1. Samples: 5816160. Policy #0 lag: (min: 28.0, avg: 33.6, max: 60.0) +[2023-10-08 12:13:41,876][101941] Avg episode reward: [(0, '6.620'), (1, '6.640')] +[2023-10-08 12:13:41,911][102898] Updated weights for policy 1, policy_version 11360 (0.0008) +[2023-10-08 12:13:42,048][102897] Updated weights for policy 0, policy_version 11350 (0.0009) +[2023-10-08 12:13:42,427][102897] Updated weights for policy 0, policy_version 11360 (0.0008) +[2023-10-08 12:13:45,673][102898] Updated weights for policy 1, policy_version 11370 (0.0010) +[2023-10-08 12:13:46,047][102898] Updated weights for policy 1, policy_version 11380 (0.0007) +[2023-10-08 12:13:46,252][102897] Updated weights for policy 0, policy_version 11370 (0.0009) +[2023-10-08 12:13:46,419][102898] Updated weights for policy 1, policy_version 11390 (0.0008) +[2023-10-08 12:13:46,615][102897] Updated weights for policy 0, policy_version 11380 (0.0007) +[2023-10-08 12:13:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 23298048. Throughput: 0: 1784.6, 1: 1773.7. Samples: 5836526. Policy #0 lag: (min: 31.0, avg: 36.8, max: 63.0) +[2023-10-08 12:13:46,876][101941] Avg episode reward: [(0, '5.420'), (1, '6.640')] +[2023-10-08 12:13:46,995][102897] Updated weights for policy 0, policy_version 11390 (0.0009) +[2023-10-08 12:13:50,332][102898] Updated weights for policy 1, policy_version 11400 (0.0009) +[2023-10-08 12:13:50,703][102898] Updated weights for policy 1, policy_version 11410 (0.0008) +[2023-10-08 12:13:50,759][102897] Updated weights for policy 0, policy_version 11400 (0.0009) +[2023-10-08 12:13:51,068][102898] Updated weights for policy 1, policy_version 11420 (0.0007) +[2023-10-08 12:13:51,122][102897] Updated weights for policy 0, policy_version 11410 (0.0009) +[2023-10-08 12:13:51,498][102897] Updated weights for policy 0, policy_version 11420 (0.0008) +[2023-10-08 12:13:51,875][101941] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 23396352. Throughput: 0: 1775.2, 1: 1785.5. Samples: 5848040. Policy #0 lag: (min: 31.0, avg: 36.8, max: 63.0) +[2023-10-08 12:13:51,875][101941] Avg episode reward: [(0, '5.250'), (1, '5.730')] +[2023-10-08 12:13:54,977][102898] Updated weights for policy 1, policy_version 11430 (0.0008) +[2023-10-08 12:13:55,169][102897] Updated weights for policy 0, policy_version 11430 (0.0008) +[2023-10-08 12:13:55,340][102898] Updated weights for policy 1, policy_version 11440 (0.0008) +[2023-10-08 12:13:55,548][102897] Updated weights for policy 0, policy_version 11440 (0.0008) +[2023-10-08 12:13:55,714][102898] Updated weights for policy 1, policy_version 11450 (0.0008) +[2023-10-08 12:13:55,919][102897] Updated weights for policy 0, policy_version 11450 (0.0007) +[2023-10-08 12:13:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23461888. Throughput: 0: 1803.0, 1: 1782.9. Samples: 5869122. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 12:13:56,876][101941] Avg episode reward: [(0, '5.570'), (1, '5.740')] +[2023-10-08 12:13:59,442][102898] Updated weights for policy 1, policy_version 11460 (0.0008) +[2023-10-08 12:13:59,723][102897] Updated weights for policy 0, policy_version 11460 (0.0007) +[2023-10-08 12:13:59,803][102898] Updated weights for policy 1, policy_version 11470 (0.0007) +[2023-10-08 12:14:00,083][102897] Updated weights for policy 0, policy_version 11470 (0.0007) +[2023-10-08 12:14:00,175][102898] Updated weights for policy 1, policy_version 11480 (0.0008) +[2023-10-08 12:14:00,462][102897] Updated weights for policy 0, policy_version 11480 (0.0008) +[2023-10-08 12:14:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23527424. Throughput: 0: 1777.4, 1: 1766.7. Samples: 5889702. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 12:14:01,876][101941] Avg episode reward: [(0, '6.210'), (1, '5.750')] +[2023-10-08 12:14:03,979][102898] Updated weights for policy 1, policy_version 11490 (0.0008) +[2023-10-08 12:14:04,304][102897] Updated weights for policy 0, policy_version 11490 (0.0008) +[2023-10-08 12:14:04,334][102898] Updated weights for policy 1, policy_version 11500 (0.0007) +[2023-10-08 12:14:04,672][102897] Updated weights for policy 0, policy_version 11500 (0.0008) +[2023-10-08 12:14:04,696][102898] Updated weights for policy 1, policy_version 11510 (0.0008) +[2023-10-08 12:14:05,041][102897] Updated weights for policy 0, policy_version 11510 (0.0008) +[2023-10-08 12:14:05,070][102898] Updated weights for policy 1, policy_version 11520 (0.0007) +[2023-10-08 12:14:05,417][102897] Updated weights for policy 0, policy_version 11520 (0.0007) +[2023-10-08 12:14:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23592960. Throughput: 0: 1799.3, 1: 1783.4. Samples: 5901350. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 12:14:06,876][101941] Avg episode reward: [(0, '6.070'), (1, '5.910')] +[2023-10-08 12:14:08,840][102898] Updated weights for policy 1, policy_version 11530 (0.0007) +[2023-10-08 12:14:09,210][102898] Updated weights for policy 1, policy_version 11540 (0.0009) +[2023-10-08 12:14:09,236][102897] Updated weights for policy 0, policy_version 11530 (0.0008) +[2023-10-08 12:14:09,573][102898] Updated weights for policy 1, policy_version 11550 (0.0010) +[2023-10-08 12:14:09,600][102897] Updated weights for policy 0, policy_version 11540 (0.0008) +[2023-10-08 12:14:09,978][102897] Updated weights for policy 0, policy_version 11550 (0.0007) +[2023-10-08 12:14:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23658496. Throughput: 0: 1774.9, 1: 1762.8. Samples: 5921648. Policy #0 lag: (min: 31.0, avg: 39.3, max: 63.0) +[2023-10-08 12:14:11,876][101941] Avg episode reward: [(0, '6.110'), (1, '5.810')] +[2023-10-08 12:14:13,277][102898] Updated weights for policy 1, policy_version 11560 (0.0009) +[2023-10-08 12:14:13,647][102898] Updated weights for policy 1, policy_version 11570 (0.0008) +[2023-10-08 12:14:13,695][102897] Updated weights for policy 0, policy_version 11560 (0.0008) +[2023-10-08 12:14:14,019][102898] Updated weights for policy 1, policy_version 11580 (0.0007) +[2023-10-08 12:14:14,078][102897] Updated weights for policy 0, policy_version 11570 (0.0009) +[2023-10-08 12:14:14,445][102897] Updated weights for policy 0, policy_version 11580 (0.0008) +[2023-10-08 12:14:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 23724032. Throughput: 0: 1776.6, 1: 1766.3. Samples: 5944018. Policy #0 lag: (min: 31.0, avg: 39.3, max: 63.0) +[2023-10-08 12:14:16,876][101941] Avg episode reward: [(0, '5.850'), (1, '5.450')] +[2023-10-08 12:14:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000011584_11862016.pth... +[2023-10-08 12:14:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000011584_11862016.pth... +[2023-10-08 12:14:16,924][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000009920_10158080.pth +[2023-10-08 12:14:16,931][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000009920_10158080.pth +[2023-10-08 12:14:17,764][102898] Updated weights for policy 1, policy_version 11590 (0.0009) +[2023-10-08 12:14:18,129][102898] Updated weights for policy 1, policy_version 11600 (0.0008) +[2023-10-08 12:14:18,274][102897] Updated weights for policy 0, policy_version 11590 (0.0008) +[2023-10-08 12:14:18,490][102898] Updated weights for policy 1, policy_version 11610 (0.0007) +[2023-10-08 12:14:18,665][102897] Updated weights for policy 0, policy_version 11600 (0.0008) +[2023-10-08 12:14:19,043][102897] Updated weights for policy 0, policy_version 11610 (0.0009) +[2023-10-08 12:14:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23789568. Throughput: 0: 1777.9, 1: 1767.3. Samples: 5953550. Policy #0 lag: (min: 31.0, avg: 39.3, max: 63.0) +[2023-10-08 12:14:21,876][101941] Avg episode reward: [(0, '5.560'), (1, '5.700')] +[2023-10-08 12:14:22,406][102898] Updated weights for policy 1, policy_version 11620 (0.0008) +[2023-10-08 12:14:22,772][102898] Updated weights for policy 1, policy_version 11630 (0.0009) +[2023-10-08 12:14:22,789][102897] Updated weights for policy 0, policy_version 11620 (0.0008) +[2023-10-08 12:14:23,149][102898] Updated weights for policy 1, policy_version 11640 (0.0008) +[2023-10-08 12:14:23,160][102897] Updated weights for policy 0, policy_version 11630 (0.0007) +[2023-10-08 12:14:23,543][102897] Updated weights for policy 0, policy_version 11640 (0.0008) +[2023-10-08 12:14:26,796][102898] Updated weights for policy 1, policy_version 11650 (0.0008) +[2023-10-08 12:14:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 23855104. Throughput: 0: 1772.7, 1: 1768.0. Samples: 5975494. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:14:26,876][101941] Avg episode reward: [(0, '5.560'), (1, '5.780')] +[2023-10-08 12:14:27,163][102898] Updated weights for policy 1, policy_version 11660 (0.0008) +[2023-10-08 12:14:27,329][102897] Updated weights for policy 0, policy_version 11650 (0.0010) +[2023-10-08 12:14:27,539][102898] Updated weights for policy 1, policy_version 11670 (0.0007) +[2023-10-08 12:14:27,697][102897] Updated weights for policy 0, policy_version 11660 (0.0008) +[2023-10-08 12:14:27,904][102898] Updated weights for policy 1, policy_version 11680 (0.0008) +[2023-10-08 12:14:28,075][102897] Updated weights for policy 0, policy_version 11670 (0.0008) +[2023-10-08 12:14:28,446][102897] Updated weights for policy 0, policy_version 11680 (0.0008) +[2023-10-08 12:14:31,854][102898] Updated weights for policy 1, policy_version 11690 (0.0008) +[2023-10-08 12:14:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23920640. Throughput: 0: 1780.9, 1: 1798.5. Samples: 5997602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:14:31,875][101941] Avg episode reward: [(0, '5.410'), (1, '5.590')] +[2023-10-08 12:14:32,232][102898] Updated weights for policy 1, policy_version 11700 (0.0008) +[2023-10-08 12:14:32,258][102897] Updated weights for policy 0, policy_version 11690 (0.0007) +[2023-10-08 12:14:32,596][102898] Updated weights for policy 1, policy_version 11710 (0.0008) +[2023-10-08 12:14:32,639][102897] Updated weights for policy 0, policy_version 11700 (0.0007) +[2023-10-08 12:14:33,016][102897] Updated weights for policy 0, policy_version 11710 (0.0008) +[2023-10-08 12:14:36,461][102898] Updated weights for policy 1, policy_version 11720 (0.0008) +[2023-10-08 12:14:36,610][102897] Updated weights for policy 0, policy_version 11720 (0.0008) +[2023-10-08 12:14:36,830][102898] Updated weights for policy 1, policy_version 11730 (0.0007) +[2023-10-08 12:14:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 23986176. Throughput: 0: 1772.7, 1: 1768.0. Samples: 6007372. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:14:36,875][101941] Avg episode reward: [(0, '5.760'), (1, '5.630')] +[2023-10-08 12:14:36,985][102897] Updated weights for policy 0, policy_version 11730 (0.0007) +[2023-10-08 12:14:37,191][102898] Updated weights for policy 1, policy_version 11740 (0.0009) +[2023-10-08 12:14:37,359][102897] Updated weights for policy 0, policy_version 11740 (0.0007) +[2023-10-08 12:14:41,029][102898] Updated weights for policy 1, policy_version 11750 (0.0007) +[2023-10-08 12:14:41,157][102897] Updated weights for policy 0, policy_version 11750 (0.0007) +[2023-10-08 12:14:41,405][102898] Updated weights for policy 1, policy_version 11760 (0.0007) +[2023-10-08 12:14:41,521][102897] Updated weights for policy 0, policy_version 11760 (0.0007) +[2023-10-08 12:14:41,765][102898] Updated weights for policy 1, policy_version 11770 (0.0007) +[2023-10-08 12:14:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 24051712. Throughput: 0: 1780.6, 1: 1786.7. Samples: 6029650. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 12:14:41,875][101941] Avg episode reward: [(0, '5.720'), (1, '5.490')] +[2023-10-08 12:14:41,893][102897] Updated weights for policy 0, policy_version 11770 (0.0008) +[2023-10-08 12:14:45,663][102898] Updated weights for policy 1, policy_version 11780 (0.0007) +[2023-10-08 12:14:45,864][102897] Updated weights for policy 0, policy_version 11780 (0.0008) +[2023-10-08 12:14:46,030][102898] Updated weights for policy 1, policy_version 11790 (0.0008) +[2023-10-08 12:14:46,241][102897] Updated weights for policy 0, policy_version 11790 (0.0008) +[2023-10-08 12:14:46,394][102898] Updated weights for policy 1, policy_version 11800 (0.0008) +[2023-10-08 12:14:46,606][102897] Updated weights for policy 0, policy_version 11800 (0.0008) +[2023-10-08 12:14:46,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24150016. Throughput: 0: 1782.0, 1: 1772.8. Samples: 6049670. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 12:14:46,876][101941] Avg episode reward: [(0, '5.830'), (1, '5.070')] +[2023-10-08 12:14:50,277][102898] Updated weights for policy 1, policy_version 11810 (0.0008) +[2023-10-08 12:14:50,399][102897] Updated weights for policy 0, policy_version 11810 (0.0008) +[2023-10-08 12:14:50,644][102898] Updated weights for policy 1, policy_version 11820 (0.0008) +[2023-10-08 12:14:50,761][102897] Updated weights for policy 0, policy_version 11820 (0.0007) +[2023-10-08 12:14:51,019][102898] Updated weights for policy 1, policy_version 11830 (0.0007) +[2023-10-08 12:14:51,132][102897] Updated weights for policy 0, policy_version 11830 (0.0008) +[2023-10-08 12:14:51,388][102898] Updated weights for policy 1, policy_version 11840 (0.0008) +[2023-10-08 12:14:51,503][102897] Updated weights for policy 0, policy_version 11840 (0.0009) +[2023-10-08 12:14:51,875][101941] Fps is (10 sec: 19660.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 24248320. Throughput: 0: 1773.8, 1: 1777.4. Samples: 6061152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:14:51,876][101941] Avg episode reward: [(0, '5.910'), (1, '5.500')] +[2023-10-08 12:14:55,078][102898] Updated weights for policy 1, policy_version 11850 (0.0007) +[2023-10-08 12:14:55,287][102897] Updated weights for policy 0, policy_version 11850 (0.0008) +[2023-10-08 12:14:55,441][102898] Updated weights for policy 1, policy_version 11860 (0.0008) +[2023-10-08 12:14:55,648][102897] Updated weights for policy 0, policy_version 11860 (0.0009) +[2023-10-08 12:14:55,807][102898] Updated weights for policy 1, policy_version 11870 (0.0007) +[2023-10-08 12:14:56,017][102897] Updated weights for policy 0, policy_version 11870 (0.0009) +[2023-10-08 12:14:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24313856. Throughput: 0: 1789.2, 1: 1779.5. Samples: 6082242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:14:56,876][101941] Avg episode reward: [(0, '5.670'), (1, '6.920')] +[2023-10-08 12:14:56,878][102760] Saving new best policy, reward=6.920! +[2023-10-08 12:14:59,417][102898] Updated weights for policy 1, policy_version 11880 (0.0008) +[2023-10-08 12:14:59,702][102897] Updated weights for policy 0, policy_version 11880 (0.0008) +[2023-10-08 12:14:59,787][102898] Updated weights for policy 1, policy_version 11890 (0.0007) +[2023-10-08 12:15:00,069][102897] Updated weights for policy 0, policy_version 11890 (0.0009) +[2023-10-08 12:15:00,152][102898] Updated weights for policy 1, policy_version 11900 (0.0009) +[2023-10-08 12:15:00,445][102897] Updated weights for policy 0, policy_version 11900 (0.0008) +[2023-10-08 12:15:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24379392. Throughput: 0: 1765.7, 1: 1770.4. Samples: 6103138. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:15:01,876][101941] Avg episode reward: [(0, '5.760'), (1, '6.190')] +[2023-10-08 12:15:03,837][102898] Updated weights for policy 1, policy_version 11910 (0.0007) +[2023-10-08 12:15:04,198][102897] Updated weights for policy 0, policy_version 11910 (0.0008) +[2023-10-08 12:15:04,212][102898] Updated weights for policy 1, policy_version 11920 (0.0007) +[2023-10-08 12:15:04,574][102897] Updated weights for policy 0, policy_version 11920 (0.0007) +[2023-10-08 12:15:04,577][102898] Updated weights for policy 1, policy_version 11930 (0.0007) +[2023-10-08 12:15:04,949][102897] Updated weights for policy 0, policy_version 11930 (0.0007) +[2023-10-08 12:15:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24444928. Throughput: 0: 1790.1, 1: 1779.4. Samples: 6114176. Policy #0 lag: (min: 1.0, avg: 13.2, max: 33.0) +[2023-10-08 12:15:06,876][101941] Avg episode reward: [(0, '6.120'), (1, '5.170')] +[2023-10-08 12:15:08,311][102898] Updated weights for policy 1, policy_version 11940 (0.0009) +[2023-10-08 12:15:08,684][102898] Updated weights for policy 1, policy_version 11950 (0.0009) +[2023-10-08 12:15:08,720][102897] Updated weights for policy 0, policy_version 11940 (0.0008) +[2023-10-08 12:15:09,055][102898] Updated weights for policy 1, policy_version 11960 (0.0007) +[2023-10-08 12:15:09,084][102897] Updated weights for policy 0, policy_version 11950 (0.0007) +[2023-10-08 12:15:09,452][102897] Updated weights for policy 0, policy_version 11960 (0.0007) +[2023-10-08 12:15:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24510464. Throughput: 0: 1766.6, 1: 1775.7. Samples: 6134898. Policy #0 lag: (min: 1.0, avg: 13.2, max: 33.0) +[2023-10-08 12:15:11,875][101941] Avg episode reward: [(0, '6.010'), (1, '5.780')] +[2023-10-08 12:15:12,850][102898] Updated weights for policy 1, policy_version 11970 (0.0007) +[2023-10-08 12:15:13,218][102898] Updated weights for policy 1, policy_version 11980 (0.0007) +[2023-10-08 12:15:13,317][102897] Updated weights for policy 0, policy_version 11970 (0.0007) +[2023-10-08 12:15:13,581][102898] Updated weights for policy 1, policy_version 11990 (0.0008) +[2023-10-08 12:15:13,687][102897] Updated weights for policy 0, policy_version 11980 (0.0007) +[2023-10-08 12:15:13,945][102898] Updated weights for policy 1, policy_version 12000 (0.0008) +[2023-10-08 12:15:14,048][102897] Updated weights for policy 0, policy_version 11990 (0.0009) +[2023-10-08 12:15:14,419][102897] Updated weights for policy 0, policy_version 12000 (0.0009) +[2023-10-08 12:15:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 24576000. Throughput: 0: 1772.1, 1: 1778.1. Samples: 6157362. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:15:16,877][101941] Avg episode reward: [(0, '5.860'), (1, '5.870')] +[2023-10-08 12:15:17,757][102898] Updated weights for policy 1, policy_version 12010 (0.0007) +[2023-10-08 12:15:18,124][102898] Updated weights for policy 1, policy_version 12020 (0.0008) +[2023-10-08 12:15:18,133][102897] Updated weights for policy 0, policy_version 12010 (0.0007) +[2023-10-08 12:15:18,484][102898] Updated weights for policy 1, policy_version 12030 (0.0007) +[2023-10-08 12:15:18,516][102897] Updated weights for policy 0, policy_version 12020 (0.0007) +[2023-10-08 12:15:18,878][102897] Updated weights for policy 0, policy_version 12030 (0.0010) +[2023-10-08 12:15:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24641536. Throughput: 0: 1768.6, 1: 1781.9. Samples: 6167148. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:15:21,876][101941] Avg episode reward: [(0, '6.160'), (1, '5.560')] +[2023-10-08 12:15:22,308][102898] Updated weights for policy 1, policy_version 12040 (0.0008) +[2023-10-08 12:15:22,686][102898] Updated weights for policy 1, policy_version 12050 (0.0009) +[2023-10-08 12:15:22,823][102897] Updated weights for policy 0, policy_version 12040 (0.0009) +[2023-10-08 12:15:23,052][102898] Updated weights for policy 1, policy_version 12060 (0.0010) +[2023-10-08 12:15:23,185][102897] Updated weights for policy 0, policy_version 12050 (0.0007) +[2023-10-08 12:15:23,564][102897] Updated weights for policy 0, policy_version 12060 (0.0007) +[2023-10-08 12:15:26,679][102898] Updated weights for policy 1, policy_version 12070 (0.0008) +[2023-10-08 12:15:26,875][101941] Fps is (10 sec: 13107.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 24707072. Throughput: 0: 1761.9, 1: 1790.8. Samples: 6189522. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:15:26,876][101941] Avg episode reward: [(0, '5.950'), (1, '5.940')] +[2023-10-08 12:15:27,049][102898] Updated weights for policy 1, policy_version 12080 (0.0009) +[2023-10-08 12:15:27,340][102897] Updated weights for policy 0, policy_version 12070 (0.0007) +[2023-10-08 12:15:27,407][102898] Updated weights for policy 1, policy_version 12090 (0.0008) +[2023-10-08 12:15:27,705][102897] Updated weights for policy 0, policy_version 12080 (0.0008) +[2023-10-08 12:15:28,080][102897] Updated weights for policy 0, policy_version 12090 (0.0008) +[2023-10-08 12:15:31,313][102898] Updated weights for policy 1, policy_version 12100 (0.0009) +[2023-10-08 12:15:31,677][102898] Updated weights for policy 1, policy_version 12110 (0.0009) +[2023-10-08 12:15:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 24772608. Throughput: 0: 1785.9, 1: 1805.3. Samples: 6211276. Policy #0 lag: (min: 22.0, avg: 28.5, max: 54.0) +[2023-10-08 12:15:31,876][101941] Avg episode reward: [(0, '6.620'), (1, '5.780')] +[2023-10-08 12:15:31,949][102897] Updated weights for policy 0, policy_version 12100 (0.0007) +[2023-10-08 12:15:32,053][102898] Updated weights for policy 1, policy_version 12120 (0.0007) +[2023-10-08 12:15:32,314][102897] Updated weights for policy 0, policy_version 12110 (0.0008) +[2023-10-08 12:15:32,686][102897] Updated weights for policy 0, policy_version 12120 (0.0008) +[2023-10-08 12:15:35,735][102898] Updated weights for policy 1, policy_version 12130 (0.0008) +[2023-10-08 12:15:36,097][102898] Updated weights for policy 1, policy_version 12140 (0.0008) +[2023-10-08 12:15:36,364][102897] Updated weights for policy 0, policy_version 12130 (0.0007) +[2023-10-08 12:15:36,475][102898] Updated weights for policy 1, policy_version 12150 (0.0009) +[2023-10-08 12:15:36,738][102897] Updated weights for policy 0, policy_version 12140 (0.0007) +[2023-10-08 12:15:36,841][102898] Updated weights for policy 1, policy_version 12160 (0.0008) +[2023-10-08 12:15:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14218.0). Total num frames: 24870912. Throughput: 0: 1772.8, 1: 1792.0. Samples: 6221566. Policy #0 lag: (min: 22.0, avg: 28.5, max: 54.0) +[2023-10-08 12:15:36,876][101941] Avg episode reward: [(0, '6.470'), (1, '6.250')] +[2023-10-08 12:15:37,116][102897] Updated weights for policy 0, policy_version 12150 (0.0007) +[2023-10-08 12:15:37,490][102897] Updated weights for policy 0, policy_version 12160 (0.0008) +[2023-10-08 12:15:40,479][102898] Updated weights for policy 1, policy_version 12170 (0.0008) +[2023-10-08 12:15:40,846][102898] Updated weights for policy 1, policy_version 12180 (0.0008) +[2023-10-08 12:15:41,222][102898] Updated weights for policy 1, policy_version 12190 (0.0008) +[2023-10-08 12:15:41,261][102897] Updated weights for policy 0, policy_version 12170 (0.0007) +[2023-10-08 12:15:41,639][102897] Updated weights for policy 0, policy_version 12180 (0.0010) +[2023-10-08 12:15:41,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 24936448. Throughput: 0: 1782.2, 1: 1801.3. Samples: 6243500. Policy #0 lag: (min: 22.0, avg: 28.5, max: 54.0) +[2023-10-08 12:15:41,876][101941] Avg episode reward: [(0, '6.570'), (1, '6.300')] +[2023-10-08 12:15:41,998][102897] Updated weights for policy 0, policy_version 12190 (0.0009) +[2023-10-08 12:15:45,188][102898] Updated weights for policy 1, policy_version 12200 (0.0010) +[2023-10-08 12:15:45,545][102898] Updated weights for policy 1, policy_version 12210 (0.0008) +[2023-10-08 12:15:45,593][102897] Updated weights for policy 0, policy_version 12200 (0.0008) +[2023-10-08 12:15:45,921][102898] Updated weights for policy 1, policy_version 12220 (0.0008) +[2023-10-08 12:15:45,968][102897] Updated weights for policy 0, policy_version 12210 (0.0009) +[2023-10-08 12:15:46,335][102897] Updated weights for policy 0, policy_version 12220 (0.0009) +[2023-10-08 12:15:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 25034752. Throughput: 0: 1781.7, 1: 1784.1. Samples: 6263600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:15:46,876][101941] Avg episode reward: [(0, '6.910'), (1, '6.430')] +[2023-10-08 12:15:46,886][102634] Saving new best policy, reward=6.910! +[2023-10-08 12:15:49,645][102898] Updated weights for policy 1, policy_version 12230 (0.0007) +[2023-10-08 12:15:50,012][102898] Updated weights for policy 1, policy_version 12240 (0.0007) +[2023-10-08 12:15:50,079][102897] Updated weights for policy 0, policy_version 12230 (0.0008) +[2023-10-08 12:15:50,386][102898] Updated weights for policy 1, policy_version 12250 (0.0007) +[2023-10-08 12:15:50,444][102897] Updated weights for policy 0, policy_version 12240 (0.0010) +[2023-10-08 12:15:50,819][102897] Updated weights for policy 0, policy_version 12250 (0.0008) +[2023-10-08 12:15:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 25100288. Throughput: 0: 1788.1, 1: 1805.8. Samples: 6275904. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:15:51,876][101941] Avg episode reward: [(0, '6.370'), (1, '5.870')] +[2023-10-08 12:15:54,161][102898] Updated weights for policy 1, policy_version 12260 (0.0007) +[2023-10-08 12:15:54,517][102898] Updated weights for policy 1, policy_version 12270 (0.0010) +[2023-10-08 12:15:54,579][102897] Updated weights for policy 0, policy_version 12260 (0.0007) +[2023-10-08 12:15:54,885][102898] Updated weights for policy 1, policy_version 12280 (0.0009) +[2023-10-08 12:15:54,948][102897] Updated weights for policy 0, policy_version 12270 (0.0008) +[2023-10-08 12:15:55,324][102897] Updated weights for policy 0, policy_version 12280 (0.0008) +[2023-10-08 12:15:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 25165824. Throughput: 0: 1787.8, 1: 1785.0. Samples: 6295674. Policy #0 lag: (min: 31.0, avg: 39.3, max: 63.0) +[2023-10-08 12:15:56,876][101941] Avg episode reward: [(0, '5.820'), (1, '5.160')] +[2023-10-08 12:15:58,586][102898] Updated weights for policy 1, policy_version 12290 (0.0009) +[2023-10-08 12:15:58,988][102898] Updated weights for policy 1, policy_version 12300 (0.0008) +[2023-10-08 12:15:59,068][102897] Updated weights for policy 0, policy_version 12290 (0.0010) +[2023-10-08 12:15:59,359][102898] Updated weights for policy 1, policy_version 12310 (0.0007) +[2023-10-08 12:15:59,443][102897] Updated weights for policy 0, policy_version 12300 (0.0008) +[2023-10-08 12:15:59,718][102898] Updated weights for policy 1, policy_version 12320 (0.0007) +[2023-10-08 12:15:59,819][102897] Updated weights for policy 0, policy_version 12310 (0.0007) +[2023-10-08 12:16:00,191][102897] Updated weights for policy 0, policy_version 12320 (0.0008) +[2023-10-08 12:16:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 25231360. Throughput: 0: 1777.4, 1: 1781.2. Samples: 6317498. Policy #0 lag: (min: 31.0, avg: 39.3, max: 63.0) +[2023-10-08 12:16:01,876][101941] Avg episode reward: [(0, '5.800'), (1, '5.360')] +[2023-10-08 12:16:03,534][102898] Updated weights for policy 1, policy_version 12330 (0.0007) +[2023-10-08 12:16:03,899][102898] Updated weights for policy 1, policy_version 12340 (0.0007) +[2023-10-08 12:16:04,063][102897] Updated weights for policy 0, policy_version 12330 (0.0009) +[2023-10-08 12:16:04,267][102898] Updated weights for policy 1, policy_version 12350 (0.0007) +[2023-10-08 12:16:04,436][102897] Updated weights for policy 0, policy_version 12340 (0.0007) +[2023-10-08 12:16:04,813][102897] Updated weights for policy 0, policy_version 12350 (0.0011) +[2023-10-08 12:16:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 25296896. Throughput: 0: 1791.7, 1: 1779.1. Samples: 6327832. Policy #0 lag: (min: 31.0, avg: 39.3, max: 63.0) +[2023-10-08 12:16:06,875][101941] Avg episode reward: [(0, '6.030'), (1, '5.920')] +[2023-10-08 12:16:07,942][102898] Updated weights for policy 1, policy_version 12360 (0.0007) +[2023-10-08 12:16:08,313][102898] Updated weights for policy 1, policy_version 12370 (0.0007) +[2023-10-08 12:16:08,538][102897] Updated weights for policy 0, policy_version 12360 (0.0008) +[2023-10-08 12:16:08,678][102898] Updated weights for policy 1, policy_version 12380 (0.0009) +[2023-10-08 12:16:08,909][102897] Updated weights for policy 0, policy_version 12370 (0.0009) +[2023-10-08 12:16:09,288][102897] Updated weights for policy 0, policy_version 12380 (0.0009) +[2023-10-08 12:16:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 25362432. Throughput: 0: 1775.9, 1: 1782.9. Samples: 6349670. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:16:11,876][101941] Avg episode reward: [(0, '6.250'), (1, '5.610')] +[2023-10-08 12:16:12,461][102898] Updated weights for policy 1, policy_version 12390 (0.0008) +[2023-10-08 12:16:12,826][102898] Updated weights for policy 1, policy_version 12400 (0.0008) +[2023-10-08 12:16:13,120][102897] Updated weights for policy 0, policy_version 12390 (0.0010) +[2023-10-08 12:16:13,199][102898] Updated weights for policy 1, policy_version 12410 (0.0007) +[2023-10-08 12:16:13,502][102897] Updated weights for policy 0, policy_version 12400 (0.0008) +[2023-10-08 12:16:13,865][102897] Updated weights for policy 0, policy_version 12410 (0.0011) +[2023-10-08 12:16:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.6, 300 sec: 14218.0). Total num frames: 25427968. Throughput: 0: 1775.2, 1: 1785.8. Samples: 6371518. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:16:16,875][101941] Avg episode reward: [(0, '6.420'), (1, '5.260')] +[2023-10-08 12:16:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000012416_12713984.pth... +[2023-10-08 12:16:16,913][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000010752_11010048.pth +[2023-10-08 12:16:17,071][102898] Updated weights for policy 1, policy_version 12420 (0.0007) +[2023-10-08 12:16:17,433][102898] Updated weights for policy 1, policy_version 12430 (0.0009) +[2023-10-08 12:16:17,805][102898] Updated weights for policy 1, policy_version 12440 (0.0009) +[2023-10-08 12:16:17,810][102897] Updated weights for policy 0, policy_version 12420 (0.0009) +[2023-10-08 12:16:18,091][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000012448_12746752.pth... +[2023-10-08 12:16:18,124][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000010752_11010048.pth +[2023-10-08 12:16:18,176][102897] Updated weights for policy 0, policy_version 12430 (0.0008) +[2023-10-08 12:16:18,556][102897] Updated weights for policy 0, policy_version 12440 (0.0007) +[2023-10-08 12:16:21,626][102898] Updated weights for policy 1, policy_version 12450 (0.0008) +[2023-10-08 12:16:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 25493504. Throughput: 0: 1770.3, 1: 1774.8. Samples: 6381094. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:16:21,875][101941] Avg episode reward: [(0, '6.080'), (1, '5.600')] +[2023-10-08 12:16:21,995][102898] Updated weights for policy 1, policy_version 12460 (0.0010) +[2023-10-08 12:16:22,353][102898] Updated weights for policy 1, policy_version 12470 (0.0007) +[2023-10-08 12:16:22,404][102897] Updated weights for policy 0, policy_version 12450 (0.0009) +[2023-10-08 12:16:22,718][102898] Updated weights for policy 1, policy_version 12480 (0.0007) +[2023-10-08 12:16:22,772][102897] Updated weights for policy 0, policy_version 12460 (0.0007) +[2023-10-08 12:16:23,148][102897] Updated weights for policy 0, policy_version 12470 (0.0008) +[2023-10-08 12:16:23,513][102897] Updated weights for policy 0, policy_version 12480 (0.0007) +[2023-10-08 12:16:26,524][102898] Updated weights for policy 1, policy_version 12490 (0.0008) +[2023-10-08 12:16:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 25559040. Throughput: 0: 1767.2, 1: 1785.2. Samples: 6403360. Policy #0 lag: (min: 31.0, avg: 32.7, max: 60.0) +[2023-10-08 12:16:26,876][101941] Avg episode reward: [(0, '6.370'), (1, '5.970')] +[2023-10-08 12:16:26,885][102898] Updated weights for policy 1, policy_version 12500 (0.0008) +[2023-10-08 12:16:27,258][102898] Updated weights for policy 1, policy_version 12510 (0.0009) +[2023-10-08 12:16:27,378][102897] Updated weights for policy 0, policy_version 12490 (0.0008) +[2023-10-08 12:16:27,754][102897] Updated weights for policy 0, policy_version 12500 (0.0008) +[2023-10-08 12:16:28,142][102897] Updated weights for policy 0, policy_version 12510 (0.0008) +[2023-10-08 12:16:31,012][102898] Updated weights for policy 1, policy_version 12520 (0.0009) +[2023-10-08 12:16:31,377][102898] Updated weights for policy 1, policy_version 12530 (0.0008) +[2023-10-08 12:16:31,746][102898] Updated weights for policy 1, policy_version 12540 (0.0009) +[2023-10-08 12:16:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 25624576. Throughput: 0: 1788.7, 1: 1789.4. Samples: 6424614. Policy #0 lag: (min: 31.0, avg: 32.7, max: 60.0) +[2023-10-08 12:16:31,875][101941] Avg episode reward: [(0, '6.790'), (1, '6.210')] +[2023-10-08 12:16:31,971][102897] Updated weights for policy 0, policy_version 12520 (0.0011) +[2023-10-08 12:16:32,344][102897] Updated weights for policy 0, policy_version 12530 (0.0008) +[2023-10-08 12:16:32,714][102897] Updated weights for policy 0, policy_version 12540 (0.0009) +[2023-10-08 12:16:35,691][102898] Updated weights for policy 1, policy_version 12550 (0.0009) +[2023-10-08 12:16:36,057][102898] Updated weights for policy 1, policy_version 12560 (0.0007) +[2023-10-08 12:16:36,419][102898] Updated weights for policy 1, policy_version 12570 (0.0007) +[2023-10-08 12:16:36,462][102897] Updated weights for policy 0, policy_version 12550 (0.0008) +[2023-10-08 12:16:36,851][102897] Updated weights for policy 0, policy_version 12560 (0.0008) +[2023-10-08 12:16:36,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 25722880. Throughput: 0: 1759.7, 1: 1780.0. Samples: 6435192. Policy #0 lag: (min: 31.0, avg: 32.7, max: 60.0) +[2023-10-08 12:16:36,876][101941] Avg episode reward: [(0, '6.280'), (1, '6.330')] +[2023-10-08 12:16:37,223][102897] Updated weights for policy 0, policy_version 12570 (0.0010) +[2023-10-08 12:16:40,154][102898] Updated weights for policy 1, policy_version 12580 (0.0010) +[2023-10-08 12:16:40,524][102898] Updated weights for policy 1, policy_version 12590 (0.0009) +[2023-10-08 12:16:40,892][102898] Updated weights for policy 1, policy_version 12600 (0.0008) +[2023-10-08 12:16:41,048][102897] Updated weights for policy 0, policy_version 12580 (0.0008) +[2023-10-08 12:16:41,416][102897] Updated weights for policy 0, policy_version 12590 (0.0009) +[2023-10-08 12:16:41,794][102897] Updated weights for policy 0, policy_version 12600 (0.0008) +[2023-10-08 12:16:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 25788416. Throughput: 0: 1783.4, 1: 1798.9. Samples: 6456880. Policy #0 lag: (min: 12.0, avg: 15.1, max: 44.0) +[2023-10-08 12:16:41,876][101941] Avg episode reward: [(0, '6.300'), (1, '6.360')] +[2023-10-08 12:16:44,662][102898] Updated weights for policy 1, policy_version 12610 (0.0009) +[2023-10-08 12:16:45,051][102898] Updated weights for policy 1, policy_version 12620 (0.0008) +[2023-10-08 12:16:45,419][102898] Updated weights for policy 1, policy_version 12630 (0.0010) +[2023-10-08 12:16:45,625][102897] Updated weights for policy 0, policy_version 12610 (0.0008) +[2023-10-08 12:16:45,789][102898] Updated weights for policy 1, policy_version 12640 (0.0009) +[2023-10-08 12:16:45,985][102897] Updated weights for policy 0, policy_version 12620 (0.0009) +[2023-10-08 12:16:46,360][102897] Updated weights for policy 0, policy_version 12630 (0.0008) +[2023-10-08 12:16:46,730][102897] Updated weights for policy 0, policy_version 12640 (0.0008) +[2023-10-08 12:16:46,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 25886720. Throughput: 0: 1767.5, 1: 1780.6. Samples: 6477164. Policy #0 lag: (min: 12.0, avg: 15.1, max: 44.0) +[2023-10-08 12:16:46,876][101941] Avg episode reward: [(0, '6.180'), (1, '5.860')] +[2023-10-08 12:16:49,471][102898] Updated weights for policy 1, policy_version 12650 (0.0009) +[2023-10-08 12:16:49,845][102898] Updated weights for policy 1, policy_version 12660 (0.0009) +[2023-10-08 12:16:50,215][102898] Updated weights for policy 1, policy_version 12670 (0.0008) +[2023-10-08 12:16:50,525][102897] Updated weights for policy 0, policy_version 12650 (0.0008) +[2023-10-08 12:16:50,899][102897] Updated weights for policy 0, policy_version 12660 (0.0008) +[2023-10-08 12:16:51,268][102897] Updated weights for policy 0, policy_version 12670 (0.0010) +[2023-10-08 12:16:51,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 25952256. Throughput: 0: 1776.6, 1: 1804.0. Samples: 6488960. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 12:16:51,876][101941] Avg episode reward: [(0, '6.160'), (1, '5.730')] +[2023-10-08 12:16:53,907][102898] Updated weights for policy 1, policy_version 12680 (0.0008) +[2023-10-08 12:16:54,279][102898] Updated weights for policy 1, policy_version 12690 (0.0009) +[2023-10-08 12:16:54,643][102898] Updated weights for policy 1, policy_version 12700 (0.0009) +[2023-10-08 12:16:54,909][102897] Updated weights for policy 0, policy_version 12680 (0.0007) +[2023-10-08 12:16:55,275][102897] Updated weights for policy 0, policy_version 12690 (0.0008) +[2023-10-08 12:16:55,653][102897] Updated weights for policy 0, policy_version 12700 (0.0011) +[2023-10-08 12:16:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 26017792. Throughput: 0: 1777.4, 1: 1779.3. Samples: 6509720. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 12:16:56,876][101941] Avg episode reward: [(0, '6.420'), (1, '6.200')] +[2023-10-08 12:16:58,414][102898] Updated weights for policy 1, policy_version 12710 (0.0007) +[2023-10-08 12:16:58,780][102898] Updated weights for policy 1, policy_version 12720 (0.0008) +[2023-10-08 12:16:59,157][102898] Updated weights for policy 1, policy_version 12730 (0.0009) +[2023-10-08 12:16:59,517][102897] Updated weights for policy 0, policy_version 12710 (0.0009) +[2023-10-08 12:16:59,888][102897] Updated weights for policy 0, policy_version 12720 (0.0007) +[2023-10-08 12:17:00,264][102897] Updated weights for policy 0, policy_version 12730 (0.0009) +[2023-10-08 12:17:01,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26083328. Throughput: 0: 1765.7, 1: 1785.6. Samples: 6531330. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 12:17:01,875][101941] Avg episode reward: [(0, '5.560'), (1, '6.720')] +[2023-10-08 12:17:02,956][102898] Updated weights for policy 1, policy_version 12740 (0.0009) +[2023-10-08 12:17:03,322][102898] Updated weights for policy 1, policy_version 12750 (0.0010) +[2023-10-08 12:17:03,693][102898] Updated weights for policy 1, policy_version 12760 (0.0010) +[2023-10-08 12:17:04,020][102897] Updated weights for policy 0, policy_version 12740 (0.0009) +[2023-10-08 12:17:04,403][102897] Updated weights for policy 0, policy_version 12750 (0.0010) +[2023-10-08 12:17:04,769][102897] Updated weights for policy 0, policy_version 12760 (0.0010) +[2023-10-08 12:17:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26148864. Throughput: 0: 1786.8, 1: 1782.7. Samples: 6541724. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:17:06,875][101941] Avg episode reward: [(0, '5.130'), (1, '6.260')] +[2023-10-08 12:17:07,457][102898] Updated weights for policy 1, policy_version 12770 (0.0008) +[2023-10-08 12:17:07,821][102898] Updated weights for policy 1, policy_version 12780 (0.0007) +[2023-10-08 12:17:08,197][102898] Updated weights for policy 1, policy_version 12790 (0.0007) +[2023-10-08 12:17:08,472][102897] Updated weights for policy 0, policy_version 12770 (0.0010) +[2023-10-08 12:17:08,567][102898] Updated weights for policy 1, policy_version 12800 (0.0007) +[2023-10-08 12:17:08,833][102897] Updated weights for policy 0, policy_version 12780 (0.0010) +[2023-10-08 12:17:09,207][102897] Updated weights for policy 0, policy_version 12790 (0.0008) +[2023-10-08 12:17:09,582][102897] Updated weights for policy 0, policy_version 12800 (0.0011) +[2023-10-08 12:17:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26214400. Throughput: 0: 1767.0, 1: 1785.6. Samples: 6563228. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:17:11,876][101941] Avg episode reward: [(0, '5.580'), (1, '6.330')] +[2023-10-08 12:17:12,324][102898] Updated weights for policy 1, policy_version 12810 (0.0008) +[2023-10-08 12:17:12,685][102898] Updated weights for policy 1, policy_version 12820 (0.0008) +[2023-10-08 12:17:13,050][102898] Updated weights for policy 1, policy_version 12830 (0.0007) +[2023-10-08 12:17:13,426][102897] Updated weights for policy 0, policy_version 12810 (0.0009) +[2023-10-08 12:17:13,801][102897] Updated weights for policy 0, policy_version 12820 (0.0009) +[2023-10-08 12:17:14,176][102897] Updated weights for policy 0, policy_version 12830 (0.0007) +[2023-10-08 12:17:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26279936. Throughput: 0: 1770.6, 1: 1806.9. Samples: 6585600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:17:16,876][101941] Avg episode reward: [(0, '5.890'), (1, '6.180')] +[2023-10-08 12:17:16,991][102898] Updated weights for policy 1, policy_version 12840 (0.0009) +[2023-10-08 12:17:17,366][102898] Updated weights for policy 1, policy_version 12850 (0.0007) +[2023-10-08 12:17:17,734][102898] Updated weights for policy 1, policy_version 12860 (0.0007) +[2023-10-08 12:17:17,944][102897] Updated weights for policy 0, policy_version 12840 (0.0007) +[2023-10-08 12:17:18,311][102897] Updated weights for policy 0, policy_version 12850 (0.0008) +[2023-10-08 12:17:18,689][102897] Updated weights for policy 0, policy_version 12860 (0.0009) +[2023-10-08 12:17:21,526][102898] Updated weights for policy 1, policy_version 12870 (0.0008) +[2023-10-08 12:17:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26345472. Throughput: 0: 1770.7, 1: 1783.6. Samples: 6595136. Policy #0 lag: (min: 24.0, avg: 49.0, max: 56.0) +[2023-10-08 12:17:21,876][101941] Avg episode reward: [(0, '5.800'), (1, '5.690')] +[2023-10-08 12:17:21,901][102898] Updated weights for policy 1, policy_version 12880 (0.0008) +[2023-10-08 12:17:22,262][102898] Updated weights for policy 1, policy_version 12890 (0.0008) +[2023-10-08 12:17:22,444][102897] Updated weights for policy 0, policy_version 12870 (0.0008) +[2023-10-08 12:17:22,812][102897] Updated weights for policy 0, policy_version 12880 (0.0009) +[2023-10-08 12:17:23,192][102897] Updated weights for policy 0, policy_version 12890 (0.0007) +[2023-10-08 12:17:26,197][102898] Updated weights for policy 1, policy_version 12900 (0.0007) +[2023-10-08 12:17:26,571][102898] Updated weights for policy 1, policy_version 12910 (0.0009) +[2023-10-08 12:17:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26411008. Throughput: 0: 1774.3, 1: 1790.2. Samples: 6617282. Policy #0 lag: (min: 24.0, avg: 49.0, max: 56.0) +[2023-10-08 12:17:26,876][101941] Avg episode reward: [(0, '6.220'), (1, '5.790')] +[2023-10-08 12:17:26,932][102898] Updated weights for policy 1, policy_version 12920 (0.0007) +[2023-10-08 12:17:27,102][102897] Updated weights for policy 0, policy_version 12900 (0.0007) +[2023-10-08 12:17:27,486][102897] Updated weights for policy 0, policy_version 12910 (0.0007) +[2023-10-08 12:17:27,863][102897] Updated weights for policy 0, policy_version 12920 (0.0007) +[2023-10-08 12:17:30,526][102898] Updated weights for policy 1, policy_version 12930 (0.0007) +[2023-10-08 12:17:30,926][102898] Updated weights for policy 1, policy_version 12940 (0.0007) +[2023-10-08 12:17:31,291][102898] Updated weights for policy 1, policy_version 12950 (0.0007) +[2023-10-08 12:17:31,373][102897] Updated weights for policy 0, policy_version 12930 (0.0008) +[2023-10-08 12:17:31,663][102898] Updated weights for policy 1, policy_version 12960 (0.0010) +[2023-10-08 12:17:31,743][102897] Updated weights for policy 0, policy_version 12940 (0.0008) +[2023-10-08 12:17:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 26509312. Throughput: 0: 1799.8, 1: 1786.1. Samples: 6638528. Policy #0 lag: (min: 24.0, avg: 49.0, max: 56.0) +[2023-10-08 12:17:31,875][101941] Avg episode reward: [(0, '5.930'), (1, '6.370')] +[2023-10-08 12:17:32,124][102897] Updated weights for policy 0, policy_version 12950 (0.0008) +[2023-10-08 12:17:32,483][102897] Updated weights for policy 0, policy_version 12960 (0.0010) +[2023-10-08 12:17:35,324][102898] Updated weights for policy 1, policy_version 12970 (0.0010) +[2023-10-08 12:17:35,691][102898] Updated weights for policy 1, policy_version 12980 (0.0011) +[2023-10-08 12:17:36,058][102898] Updated weights for policy 1, policy_version 12990 (0.0009) +[2023-10-08 12:17:36,296][102897] Updated weights for policy 0, policy_version 12970 (0.0007) +[2023-10-08 12:17:36,666][102897] Updated weights for policy 0, policy_version 12980 (0.0009) +[2023-10-08 12:17:36,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 26574848. Throughput: 0: 1778.8, 1: 1788.4. Samples: 6649482. Policy #0 lag: (min: 1.0, avg: 9.4, max: 33.0) +[2023-10-08 12:17:36,875][101941] Avg episode reward: [(0, '5.810'), (1, '6.570')] +[2023-10-08 12:17:37,040][102897] Updated weights for policy 0, policy_version 12990 (0.0011) +[2023-10-08 12:17:39,681][102898] Updated weights for policy 1, policy_version 13000 (0.0009) +[2023-10-08 12:17:40,051][102898] Updated weights for policy 1, policy_version 13010 (0.0007) +[2023-10-08 12:17:40,426][102898] Updated weights for policy 1, policy_version 13020 (0.0010) +[2023-10-08 12:17:41,040][102897] Updated weights for policy 0, policy_version 13000 (0.0007) +[2023-10-08 12:17:41,408][102897] Updated weights for policy 0, policy_version 13010 (0.0007) +[2023-10-08 12:17:41,784][102897] Updated weights for policy 0, policy_version 13020 (0.0008) +[2023-10-08 12:17:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 26640384. Throughput: 0: 1792.9, 1: 1786.0. Samples: 6670770. Policy #0 lag: (min: 1.0, avg: 9.4, max: 33.0) +[2023-10-08 12:17:41,876][101941] Avg episode reward: [(0, '6.340'), (1, '6.070')] +[2023-10-08 12:17:44,064][102898] Updated weights for policy 1, policy_version 13030 (0.0009) +[2023-10-08 12:17:44,439][102898] Updated weights for policy 1, policy_version 13040 (0.0009) +[2023-10-08 12:17:44,803][102898] Updated weights for policy 1, policy_version 13050 (0.0008) +[2023-10-08 12:17:45,711][102897] Updated weights for policy 0, policy_version 13030 (0.0010) +[2023-10-08 12:17:46,092][102897] Updated weights for policy 0, policy_version 13040 (0.0009) +[2023-10-08 12:17:46,463][102897] Updated weights for policy 0, policy_version 13050 (0.0007) +[2023-10-08 12:17:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26738688. Throughput: 0: 1777.0, 1: 1782.1. Samples: 6691490. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:17:46,876][101941] Avg episode reward: [(0, '6.460'), (1, '6.200')] +[2023-10-08 12:17:48,600][102898] Updated weights for policy 1, policy_version 13060 (0.0007) +[2023-10-08 12:17:48,965][102898] Updated weights for policy 1, policy_version 13070 (0.0008) +[2023-10-08 12:17:49,334][102898] Updated weights for policy 1, policy_version 13080 (0.0009) +[2023-10-08 12:17:50,261][102897] Updated weights for policy 0, policy_version 13060 (0.0008) +[2023-10-08 12:17:50,631][102897] Updated weights for policy 0, policy_version 13070 (0.0007) +[2023-10-08 12:17:51,014][102897] Updated weights for policy 0, policy_version 13080 (0.0008) +[2023-10-08 12:17:51,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.6, 300 sec: 14218.0). Total num frames: 26804224. Throughput: 0: 1781.3, 1: 1793.7. Samples: 6702600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:17:51,876][101941] Avg episode reward: [(0, '6.300'), (1, '6.320')] +[2023-10-08 12:17:53,151][102898] Updated weights for policy 1, policy_version 13090 (0.0008) +[2023-10-08 12:17:53,524][102898] Updated weights for policy 1, policy_version 13100 (0.0009) +[2023-10-08 12:17:53,892][102898] Updated weights for policy 1, policy_version 13110 (0.0009) +[2023-10-08 12:17:54,256][102898] Updated weights for policy 1, policy_version 13120 (0.0008) +[2023-10-08 12:17:54,776][102897] Updated weights for policy 0, policy_version 13090 (0.0009) +[2023-10-08 12:17:55,155][102897] Updated weights for policy 0, policy_version 13100 (0.0010) +[2023-10-08 12:17:55,531][102897] Updated weights for policy 0, policy_version 13110 (0.0009) +[2023-10-08 12:17:55,904][102897] Updated weights for policy 0, policy_version 13120 (0.0009) +[2023-10-08 12:17:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26869760. Throughput: 0: 1785.5, 1: 1781.7. Samples: 6723752. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:17:56,876][101941] Avg episode reward: [(0, '6.110'), (1, '6.430')] +[2023-10-08 12:17:57,916][102898] Updated weights for policy 1, policy_version 13130 (0.0010) +[2023-10-08 12:17:58,295][102898] Updated weights for policy 1, policy_version 13140 (0.0009) +[2023-10-08 12:17:58,661][102898] Updated weights for policy 1, policy_version 13150 (0.0010) +[2023-10-08 12:17:59,453][102897] Updated weights for policy 0, policy_version 13130 (0.0008) +[2023-10-08 12:17:59,834][102897] Updated weights for policy 0, policy_version 13140 (0.0008) +[2023-10-08 12:18:00,197][102897] Updated weights for policy 0, policy_version 13150 (0.0008) +[2023-10-08 12:18:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 26935296. Throughput: 0: 1771.1, 1: 1786.0. Samples: 6745666. Policy #0 lag: (min: 13.0, avg: 21.0, max: 45.0) +[2023-10-08 12:18:01,875][101941] Avg episode reward: [(0, '6.600'), (1, '6.090')] +[2023-10-08 12:18:02,492][102898] Updated weights for policy 1, policy_version 13160 (0.0008) +[2023-10-08 12:18:02,857][102898] Updated weights for policy 1, policy_version 13170 (0.0007) +[2023-10-08 12:18:03,226][102898] Updated weights for policy 1, policy_version 13180 (0.0007) +[2023-10-08 12:18:03,982][102897] Updated weights for policy 0, policy_version 13160 (0.0009) +[2023-10-08 12:18:04,349][102897] Updated weights for policy 0, policy_version 13170 (0.0010) +[2023-10-08 12:18:04,736][102897] Updated weights for policy 0, policy_version 13180 (0.0011) +[2023-10-08 12:18:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 27000832. Throughput: 0: 1791.1, 1: 1788.4. Samples: 6756214. Policy #0 lag: (min: 13.0, avg: 21.0, max: 45.0) +[2023-10-08 12:18:06,876][101941] Avg episode reward: [(0, '5.870'), (1, '5.890')] +[2023-10-08 12:18:07,056][102898] Updated weights for policy 1, policy_version 13190 (0.0007) +[2023-10-08 12:18:07,429][102898] Updated weights for policy 1, policy_version 13200 (0.0007) +[2023-10-08 12:18:07,802][102898] Updated weights for policy 1, policy_version 13210 (0.0007) +[2023-10-08 12:18:08,601][102897] Updated weights for policy 0, policy_version 13190 (0.0008) +[2023-10-08 12:18:08,969][102897] Updated weights for policy 0, policy_version 13200 (0.0007) +[2023-10-08 12:18:09,347][102897] Updated weights for policy 0, policy_version 13210 (0.0007) +[2023-10-08 12:18:11,457][102898] Updated weights for policy 1, policy_version 13220 (0.0008) +[2023-10-08 12:18:11,823][102898] Updated weights for policy 1, policy_version 13230 (0.0008) +[2023-10-08 12:18:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 27066368. Throughput: 0: 1775.8, 1: 1792.9. Samples: 6777874. Policy #0 lag: (min: 13.0, avg: 21.0, max: 45.0) +[2023-10-08 12:18:11,875][101941] Avg episode reward: [(0, '5.680'), (1, '5.820')] +[2023-10-08 12:18:12,195][102898] Updated weights for policy 1, policy_version 13240 (0.0009) +[2023-10-08 12:18:13,095][102897] Updated weights for policy 0, policy_version 13220 (0.0007) +[2023-10-08 12:18:13,486][102897] Updated weights for policy 0, policy_version 13230 (0.0007) +[2023-10-08 12:18:13,854][102897] Updated weights for policy 0, policy_version 13240 (0.0009) +[2023-10-08 12:18:16,079][102898] Updated weights for policy 1, policy_version 13250 (0.0007) +[2023-10-08 12:18:16,485][102898] Updated weights for policy 1, policy_version 13260 (0.0007) +[2023-10-08 12:18:16,845][102898] Updated weights for policy 1, policy_version 13270 (0.0008) +[2023-10-08 12:18:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 27131904. Throughput: 0: 1770.4, 1: 1808.4. Samples: 6799574. Policy #0 lag: (min: 8.0, avg: 30.6, max: 40.0) +[2023-10-08 12:18:16,875][101941] Avg episode reward: [(0, '6.130'), (1, '6.010')] +[2023-10-08 12:18:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000013248_13565952.pth... +[2023-10-08 12:18:16,917][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000011584_11862016.pth +[2023-10-08 12:18:17,213][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000013280_13598720.pth... +[2023-10-08 12:18:17,218][102898] Updated weights for policy 1, policy_version 13280 (0.0009) +[2023-10-08 12:18:17,242][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000011584_11862016.pth +[2023-10-08 12:18:17,714][102897] Updated weights for policy 0, policy_version 13250 (0.0009) +[2023-10-08 12:18:18,083][102897] Updated weights for policy 0, policy_version 13260 (0.0008) +[2023-10-08 12:18:18,457][102897] Updated weights for policy 0, policy_version 13270 (0.0008) +[2023-10-08 12:18:18,826][102897] Updated weights for policy 0, policy_version 13280 (0.0008) +[2023-10-08 12:18:20,937][102898] Updated weights for policy 1, policy_version 13290 (0.0011) +[2023-10-08 12:18:21,309][102898] Updated weights for policy 1, policy_version 13300 (0.0010) +[2023-10-08 12:18:21,684][102898] Updated weights for policy 1, policy_version 13310 (0.0009) +[2023-10-08 12:18:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 27230208. Throughput: 0: 1767.3, 1: 1794.2. Samples: 6809750. Policy #0 lag: (min: 8.0, avg: 30.6, max: 40.0) +[2023-10-08 12:18:21,876][101941] Avg episode reward: [(0, '5.900'), (1, '6.160')] +[2023-10-08 12:18:22,556][102897] Updated weights for policy 0, policy_version 13290 (0.0007) +[2023-10-08 12:18:22,929][102897] Updated weights for policy 0, policy_version 13300 (0.0008) +[2023-10-08 12:18:23,308][102897] Updated weights for policy 0, policy_version 13310 (0.0009) +[2023-10-08 12:18:25,418][102898] Updated weights for policy 1, policy_version 13320 (0.0008) +[2023-10-08 12:18:25,782][102898] Updated weights for policy 1, policy_version 13330 (0.0011) +[2023-10-08 12:18:26,157][102898] Updated weights for policy 1, policy_version 13340 (0.0011) +[2023-10-08 12:18:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 27295744. Throughput: 0: 1763.8, 1: 1807.0. Samples: 6831456. Policy #0 lag: (min: 8.0, avg: 30.6, max: 40.0) +[2023-10-08 12:18:26,876][101941] Avg episode reward: [(0, '5.670'), (1, '6.110')] +[2023-10-08 12:18:27,124][102897] Updated weights for policy 0, policy_version 13320 (0.0010) +[2023-10-08 12:18:27,485][102897] Updated weights for policy 0, policy_version 13330 (0.0009) +[2023-10-08 12:18:27,856][102897] Updated weights for policy 0, policy_version 13340 (0.0009) +[2023-10-08 12:18:29,754][102898] Updated weights for policy 1, policy_version 13350 (0.0009) +[2023-10-08 12:18:30,124][102898] Updated weights for policy 1, policy_version 13360 (0.0008) +[2023-10-08 12:18:30,496][102898] Updated weights for policy 1, policy_version 13370 (0.0010) +[2023-10-08 12:18:31,418][102897] Updated weights for policy 0, policy_version 13350 (0.0007) +[2023-10-08 12:18:31,795][102897] Updated weights for policy 0, policy_version 13360 (0.0009) +[2023-10-08 12:18:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 27361280. Throughput: 0: 1801.2, 1: 1791.6. Samples: 6853168. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:18:31,875][101941] Avg episode reward: [(0, '6.150'), (1, '6.420')] +[2023-10-08 12:18:32,158][102897] Updated weights for policy 0, policy_version 13370 (0.0009) +[2023-10-08 12:18:34,182][102898] Updated weights for policy 1, policy_version 13380 (0.0008) +[2023-10-08 12:18:34,542][102898] Updated weights for policy 1, policy_version 13390 (0.0007) +[2023-10-08 12:18:34,915][102898] Updated weights for policy 1, policy_version 13400 (0.0009) +[2023-10-08 12:18:35,791][102897] Updated weights for policy 0, policy_version 13380 (0.0010) +[2023-10-08 12:18:36,169][102897] Updated weights for policy 0, policy_version 13390 (0.0007) +[2023-10-08 12:18:36,534][102897] Updated weights for policy 0, policy_version 13400 (0.0007) +[2023-10-08 12:18:36,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 27459584. Throughput: 0: 1782.5, 1: 1810.4. Samples: 6864278. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:18:36,875][101941] Avg episode reward: [(0, '6.890'), (1, '6.100')] +[2023-10-08 12:18:38,707][102898] Updated weights for policy 1, policy_version 13410 (0.0009) +[2023-10-08 12:18:39,082][102898] Updated weights for policy 1, policy_version 13420 (0.0009) +[2023-10-08 12:18:39,458][102898] Updated weights for policy 1, policy_version 13430 (0.0008) +[2023-10-08 12:18:39,819][102898] Updated weights for policy 1, policy_version 13440 (0.0011) +[2023-10-08 12:18:40,416][102897] Updated weights for policy 0, policy_version 13410 (0.0009) +[2023-10-08 12:18:40,790][102897] Updated weights for policy 0, policy_version 13420 (0.0009) +[2023-10-08 12:18:41,166][102897] Updated weights for policy 0, policy_version 13430 (0.0007) +[2023-10-08 12:18:41,547][102897] Updated weights for policy 0, policy_version 13440 (0.0010) +[2023-10-08 12:18:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 27525120. Throughput: 0: 1800.0, 1: 1795.2. Samples: 6885538. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:18:41,876][101941] Avg episode reward: [(0, '6.680'), (1, '5.450')] +[2023-10-08 12:18:43,623][102898] Updated weights for policy 1, policy_version 13450 (0.0009) +[2023-10-08 12:18:43,989][102898] Updated weights for policy 1, policy_version 13460 (0.0011) +[2023-10-08 12:18:44,358][102898] Updated weights for policy 1, policy_version 13470 (0.0009) +[2023-10-08 12:18:45,215][102897] Updated weights for policy 0, policy_version 13450 (0.0010) +[2023-10-08 12:18:45,579][102897] Updated weights for policy 0, policy_version 13460 (0.0009) +[2023-10-08 12:18:45,953][102897] Updated weights for policy 0, policy_version 13470 (0.0009) +[2023-10-08 12:18:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 27590656. Throughput: 0: 1784.3, 1: 1792.1. Samples: 6906602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:18:46,876][101941] Avg episode reward: [(0, '6.220'), (1, '5.730')] +[2023-10-08 12:18:48,148][102898] Updated weights for policy 1, policy_version 13480 (0.0008) +[2023-10-08 12:18:48,519][102898] Updated weights for policy 1, policy_version 13490 (0.0008) +[2023-10-08 12:18:48,887][102898] Updated weights for policy 1, policy_version 13500 (0.0007) +[2023-10-08 12:18:49,904][102897] Updated weights for policy 0, policy_version 13480 (0.0008) +[2023-10-08 12:18:50,283][102897] Updated weights for policy 0, policy_version 13490 (0.0011) +[2023-10-08 12:18:50,655][102897] Updated weights for policy 0, policy_version 13500 (0.0010) +[2023-10-08 12:18:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 27656192. Throughput: 0: 1800.8, 1: 1791.5. Samples: 6917868. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:18:51,876][101941] Avg episode reward: [(0, '6.030'), (1, '5.840')] +[2023-10-08 12:18:52,739][102898] Updated weights for policy 1, policy_version 13510 (0.0007) +[2023-10-08 12:18:53,114][102898] Updated weights for policy 1, policy_version 13520 (0.0008) +[2023-10-08 12:18:53,482][102898] Updated weights for policy 1, policy_version 13530 (0.0009) +[2023-10-08 12:18:54,562][102897] Updated weights for policy 0, policy_version 13510 (0.0008) +[2023-10-08 12:18:54,936][102897] Updated weights for policy 0, policy_version 13520 (0.0008) +[2023-10-08 12:18:55,306][102897] Updated weights for policy 0, policy_version 13530 (0.0009) +[2023-10-08 12:18:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 27721728. Throughput: 0: 1786.7, 1: 1790.3. Samples: 6938840. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:18:56,876][101941] Avg episode reward: [(0, '6.210'), (1, '5.820')] +[2023-10-08 12:18:57,212][102898] Updated weights for policy 1, policy_version 13540 (0.0007) +[2023-10-08 12:18:57,572][102898] Updated weights for policy 1, policy_version 13550 (0.0007) +[2023-10-08 12:18:57,946][102898] Updated weights for policy 1, policy_version 13560 (0.0010) +[2023-10-08 12:18:59,106][102897] Updated weights for policy 0, policy_version 13540 (0.0008) +[2023-10-08 12:18:59,496][102897] Updated weights for policy 0, policy_version 13550 (0.0007) +[2023-10-08 12:18:59,875][102897] Updated weights for policy 0, policy_version 13560 (0.0007) +[2023-10-08 12:19:01,786][102898] Updated weights for policy 1, policy_version 13570 (0.0009) +[2023-10-08 12:19:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 27787264. Throughput: 0: 1783.0, 1: 1802.9. Samples: 6960940. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:19:01,876][101941] Avg episode reward: [(0, '5.630'), (1, '5.980')] +[2023-10-08 12:19:02,185][102898] Updated weights for policy 1, policy_version 13580 (0.0007) +[2023-10-08 12:19:02,569][102898] Updated weights for policy 1, policy_version 13590 (0.0009) +[2023-10-08 12:19:02,932][102898] Updated weights for policy 1, policy_version 13600 (0.0008) +[2023-10-08 12:19:03,543][102897] Updated weights for policy 0, policy_version 13570 (0.0008) +[2023-10-08 12:19:03,905][102897] Updated weights for policy 0, policy_version 13580 (0.0010) +[2023-10-08 12:19:04,277][102897] Updated weights for policy 0, policy_version 13590 (0.0009) +[2023-10-08 12:19:04,663][102897] Updated weights for policy 0, policy_version 13600 (0.0010) +[2023-10-08 12:19:06,672][102898] Updated weights for policy 1, policy_version 13610 (0.0008) +[2023-10-08 12:19:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 27852800. Throughput: 0: 1792.4, 1: 1788.8. Samples: 6970902. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:19:06,876][101941] Avg episode reward: [(0, '5.450'), (1, '5.820')] +[2023-10-08 12:19:07,046][102898] Updated weights for policy 1, policy_version 13620 (0.0007) +[2023-10-08 12:19:07,405][102898] Updated weights for policy 1, policy_version 13630 (0.0008) +[2023-10-08 12:19:08,225][102897] Updated weights for policy 0, policy_version 13610 (0.0009) +[2023-10-08 12:19:08,595][102897] Updated weights for policy 0, policy_version 13620 (0.0007) +[2023-10-08 12:19:08,975][102897] Updated weights for policy 0, policy_version 13630 (0.0008) +[2023-10-08 12:19:11,136][102898] Updated weights for policy 1, policy_version 13640 (0.0007) +[2023-10-08 12:19:11,497][102898] Updated weights for policy 1, policy_version 13650 (0.0007) +[2023-10-08 12:19:11,867][102898] Updated weights for policy 1, policy_version 13660 (0.0008) +[2023-10-08 12:19:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 27918336. Throughput: 0: 1798.3, 1: 1794.6. Samples: 6993136. Policy #0 lag: (min: 13.0, avg: 13.6, max: 29.0) +[2023-10-08 12:19:11,875][101941] Avg episode reward: [(0, '5.840'), (1, '5.680')] +[2023-10-08 12:19:12,628][102897] Updated weights for policy 0, policy_version 13640 (0.0007) +[2023-10-08 12:19:13,003][102897] Updated weights for policy 0, policy_version 13650 (0.0007) +[2023-10-08 12:19:13,379][102897] Updated weights for policy 0, policy_version 13660 (0.0008) +[2023-10-08 12:19:15,595][102898] Updated weights for policy 1, policy_version 13670 (0.0008) +[2023-10-08 12:19:15,967][102898] Updated weights for policy 1, policy_version 13680 (0.0008) +[2023-10-08 12:19:16,344][102898] Updated weights for policy 1, policy_version 13690 (0.0009) +[2023-10-08 12:19:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 28016640. Throughput: 0: 1791.1, 1: 1789.0. Samples: 7014274. Policy #0 lag: (min: 13.0, avg: 13.6, max: 29.0) +[2023-10-08 12:19:16,876][101941] Avg episode reward: [(0, '5.970'), (1, '5.810')] +[2023-10-08 12:19:17,157][102897] Updated weights for policy 0, policy_version 13670 (0.0008) +[2023-10-08 12:19:17,528][102897] Updated weights for policy 0, policy_version 13680 (0.0009) +[2023-10-08 12:19:17,911][102897] Updated weights for policy 0, policy_version 13690 (0.0008) +[2023-10-08 12:19:20,134][102898] Updated weights for policy 1, policy_version 13700 (0.0007) +[2023-10-08 12:19:20,496][102898] Updated weights for policy 1, policy_version 13710 (0.0008) +[2023-10-08 12:19:20,860][102898] Updated weights for policy 1, policy_version 13720 (0.0010) +[2023-10-08 12:19:21,687][102897] Updated weights for policy 0, policy_version 13700 (0.0009) +[2023-10-08 12:19:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 28082176. Throughput: 0: 1784.6, 1: 1789.9. Samples: 7025130. Policy #0 lag: (min: 13.0, avg: 13.6, max: 29.0) +[2023-10-08 12:19:21,876][101941] Avg episode reward: [(0, '5.910'), (1, '6.340')] +[2023-10-08 12:19:22,070][102897] Updated weights for policy 0, policy_version 13710 (0.0009) +[2023-10-08 12:19:22,451][102897] Updated weights for policy 0, policy_version 13720 (0.0009) +[2023-10-08 12:19:24,632][102898] Updated weights for policy 1, policy_version 13730 (0.0011) +[2023-10-08 12:19:24,997][102898] Updated weights for policy 1, policy_version 13740 (0.0010) +[2023-10-08 12:19:25,361][102898] Updated weights for policy 1, policy_version 13750 (0.0011) +[2023-10-08 12:19:25,733][102898] Updated weights for policy 1, policy_version 13760 (0.0009) +[2023-10-08 12:19:26,048][102897] Updated weights for policy 0, policy_version 13730 (0.0008) +[2023-10-08 12:19:26,418][102897] Updated weights for policy 0, policy_version 13740 (0.0009) +[2023-10-08 12:19:26,797][102897] Updated weights for policy 0, policy_version 13750 (0.0011) +[2023-10-08 12:19:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 28147712. Throughput: 0: 1788.4, 1: 1784.8. Samples: 7046334. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 12:19:26,875][101941] Avg episode reward: [(0, '5.470'), (1, '6.380')] +[2023-10-08 12:19:27,179][102897] Updated weights for policy 0, policy_version 13760 (0.0010) +[2023-10-08 12:19:29,386][102898] Updated weights for policy 1, policy_version 13770 (0.0009) +[2023-10-08 12:19:29,759][102898] Updated weights for policy 1, policy_version 13780 (0.0008) +[2023-10-08 12:19:30,117][102898] Updated weights for policy 1, policy_version 13790 (0.0009) +[2023-10-08 12:19:30,981][102897] Updated weights for policy 0, policy_version 13770 (0.0011) +[2023-10-08 12:19:31,357][102897] Updated weights for policy 0, policy_version 13780 (0.0008) +[2023-10-08 12:19:31,730][102897] Updated weights for policy 0, policy_version 13790 (0.0008) +[2023-10-08 12:19:31,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 28246016. Throughput: 0: 1797.0, 1: 1782.4. Samples: 7067674. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 12:19:31,876][101941] Avg episode reward: [(0, '5.470'), (1, '5.910')] +[2023-10-08 12:19:33,889][102898] Updated weights for policy 1, policy_version 13800 (0.0008) +[2023-10-08 12:19:34,265][102898] Updated weights for policy 1, policy_version 13810 (0.0007) +[2023-10-08 12:19:34,633][102898] Updated weights for policy 1, policy_version 13820 (0.0010) +[2023-10-08 12:19:35,573][102897] Updated weights for policy 0, policy_version 13800 (0.0009) +[2023-10-08 12:19:35,944][102897] Updated weights for policy 0, policy_version 13810 (0.0011) +[2023-10-08 12:19:36,312][102897] Updated weights for policy 0, policy_version 13820 (0.0009) +[2023-10-08 12:19:36,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 28311552. Throughput: 0: 1779.6, 1: 1791.3. Samples: 7078562. Policy #0 lag: (min: 11.0, avg: 17.8, max: 43.0) +[2023-10-08 12:19:36,876][101941] Avg episode reward: [(0, '5.290'), (1, '5.910')] +[2023-10-08 12:19:38,326][102898] Updated weights for policy 1, policy_version 13830 (0.0010) +[2023-10-08 12:19:38,696][102898] Updated weights for policy 1, policy_version 13840 (0.0009) +[2023-10-08 12:19:39,062][102898] Updated weights for policy 1, policy_version 13850 (0.0009) +[2023-10-08 12:19:40,025][102897] Updated weights for policy 0, policy_version 13830 (0.0007) +[2023-10-08 12:19:40,403][102897] Updated weights for policy 0, policy_version 13840 (0.0008) +[2023-10-08 12:19:40,778][102897] Updated weights for policy 0, policy_version 13850 (0.0009) +[2023-10-08 12:19:41,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 28377088. Throughput: 0: 1796.4, 1: 1786.4. Samples: 7100066. Policy #0 lag: (min: 11.0, avg: 17.8, max: 43.0) +[2023-10-08 12:19:41,875][101941] Avg episode reward: [(0, '5.820'), (1, '5.420')] +[2023-10-08 12:19:42,906][102898] Updated weights for policy 1, policy_version 13860 (0.0008) +[2023-10-08 12:19:43,277][102898] Updated weights for policy 1, policy_version 13870 (0.0009) +[2023-10-08 12:19:43,637][102898] Updated weights for policy 1, policy_version 13880 (0.0010) +[2023-10-08 12:19:44,514][102897] Updated weights for policy 0, policy_version 13860 (0.0007) +[2023-10-08 12:19:44,909][102897] Updated weights for policy 0, policy_version 13870 (0.0007) +[2023-10-08 12:19:45,289][102897] Updated weights for policy 0, policy_version 13880 (0.0009) +[2023-10-08 12:19:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 28442624. Throughput: 0: 1789.0, 1: 1778.6. Samples: 7121482. Policy #0 lag: (min: 11.0, avg: 17.8, max: 43.0) +[2023-10-08 12:19:46,876][101941] Avg episode reward: [(0, '6.600'), (1, '5.620')] +[2023-10-08 12:19:47,497][102898] Updated weights for policy 1, policy_version 13890 (0.0008) +[2023-10-08 12:19:47,901][102898] Updated weights for policy 1, policy_version 13900 (0.0010) +[2023-10-08 12:19:48,274][102898] Updated weights for policy 1, policy_version 13910 (0.0009) +[2023-10-08 12:19:48,649][102898] Updated weights for policy 1, policy_version 13920 (0.0008) +[2023-10-08 12:19:48,973][102897] Updated weights for policy 0, policy_version 13890 (0.0008) +[2023-10-08 12:19:49,344][102897] Updated weights for policy 0, policy_version 13900 (0.0007) +[2023-10-08 12:19:49,730][102897] Updated weights for policy 0, policy_version 13910 (0.0009) +[2023-10-08 12:19:50,113][102897] Updated weights for policy 0, policy_version 13920 (0.0010) +[2023-10-08 12:19:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 28508160. Throughput: 0: 1802.7, 1: 1779.1. Samples: 7132082. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:19:51,876][101941] Avg episode reward: [(0, '6.270'), (1, '6.070')] +[2023-10-08 12:19:52,222][102898] Updated weights for policy 1, policy_version 13930 (0.0008) +[2023-10-08 12:19:52,592][102898] Updated weights for policy 1, policy_version 13940 (0.0007) +[2023-10-08 12:19:52,960][102898] Updated weights for policy 1, policy_version 13950 (0.0007) +[2023-10-08 12:19:53,808][102897] Updated weights for policy 0, policy_version 13930 (0.0007) +[2023-10-08 12:19:54,178][102897] Updated weights for policy 0, policy_version 13940 (0.0009) +[2023-10-08 12:19:54,556][102897] Updated weights for policy 0, policy_version 13950 (0.0011) +[2023-10-08 12:19:56,786][102898] Updated weights for policy 1, policy_version 13960 (0.0010) +[2023-10-08 12:19:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 28573696. Throughput: 0: 1781.9, 1: 1780.2. Samples: 7153430. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:19:56,876][101941] Avg episode reward: [(0, '5.610'), (1, '6.090')] +[2023-10-08 12:19:57,159][102898] Updated weights for policy 1, policy_version 13970 (0.0010) +[2023-10-08 12:19:57,529][102898] Updated weights for policy 1, policy_version 13980 (0.0007) +[2023-10-08 12:19:58,460][102897] Updated weights for policy 0, policy_version 13960 (0.0008) +[2023-10-08 12:19:58,828][102897] Updated weights for policy 0, policy_version 13970 (0.0008) +[2023-10-08 12:19:59,199][102897] Updated weights for policy 0, policy_version 13980 (0.0008) +[2023-10-08 12:20:01,353][102898] Updated weights for policy 1, policy_version 13990 (0.0007) +[2023-10-08 12:20:01,720][102898] Updated weights for policy 1, policy_version 14000 (0.0008) +[2023-10-08 12:20:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 28639232. Throughput: 0: 1786.6, 1: 1798.0. Samples: 7175580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:20:01,875][101941] Avg episode reward: [(0, '5.560'), (1, '6.520')] +[2023-10-08 12:20:02,098][102898] Updated weights for policy 1, policy_version 14010 (0.0009) +[2023-10-08 12:20:02,817][102897] Updated weights for policy 0, policy_version 13990 (0.0007) +[2023-10-08 12:20:03,181][102897] Updated weights for policy 0, policy_version 14000 (0.0009) +[2023-10-08 12:20:03,559][102897] Updated weights for policy 0, policy_version 14010 (0.0009) +[2023-10-08 12:20:05,788][102898] Updated weights for policy 1, policy_version 14020 (0.0010) +[2023-10-08 12:20:06,152][102898] Updated weights for policy 1, policy_version 14030 (0.0009) +[2023-10-08 12:20:06,526][102898] Updated weights for policy 1, policy_version 14040 (0.0008) +[2023-10-08 12:20:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 28737536. Throughput: 0: 1791.1, 1: 1783.2. Samples: 7185974. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 12:20:06,876][101941] Avg episode reward: [(0, '5.840'), (1, '6.190')] +[2023-10-08 12:20:07,230][102897] Updated weights for policy 0, policy_version 14020 (0.0008) +[2023-10-08 12:20:07,602][102897] Updated weights for policy 0, policy_version 14030 (0.0007) +[2023-10-08 12:20:07,983][102897] Updated weights for policy 0, policy_version 14040 (0.0008) +[2023-10-08 12:20:10,362][102898] Updated weights for policy 1, policy_version 14050 (0.0009) +[2023-10-08 12:20:10,732][102898] Updated weights for policy 1, policy_version 14060 (0.0011) +[2023-10-08 12:20:11,097][102898] Updated weights for policy 1, policy_version 14070 (0.0008) +[2023-10-08 12:20:11,463][102898] Updated weights for policy 1, policy_version 14080 (0.0009) +[2023-10-08 12:20:11,740][102897] Updated weights for policy 0, policy_version 14050 (0.0009) +[2023-10-08 12:20:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 28803072. Throughput: 0: 1792.1, 1: 1806.0. Samples: 7208250. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 12:20:11,876][101941] Avg episode reward: [(0, '5.810'), (1, '6.230')] +[2023-10-08 12:20:12,104][102897] Updated weights for policy 0, policy_version 14060 (0.0007) +[2023-10-08 12:20:12,474][102897] Updated weights for policy 0, policy_version 14070 (0.0009) +[2023-10-08 12:20:12,845][102897] Updated weights for policy 0, policy_version 14080 (0.0008) +[2023-10-08 12:20:15,230][102898] Updated weights for policy 1, policy_version 14090 (0.0008) +[2023-10-08 12:20:15,596][102898] Updated weights for policy 1, policy_version 14100 (0.0007) +[2023-10-08 12:20:15,968][102898] Updated weights for policy 1, policy_version 14110 (0.0007) +[2023-10-08 12:20:16,734][102897] Updated weights for policy 0, policy_version 14090 (0.0008) +[2023-10-08 12:20:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 28868608. Throughput: 0: 1811.2, 1: 1783.6. Samples: 7229440. Policy #0 lag: (min: 20.0, avg: 20.0, max: 20.0) +[2023-10-08 12:20:16,877][101941] Avg episode reward: [(0, '6.520'), (1, '6.170')] +[2023-10-08 12:20:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000014112_14450688.pth... +[2023-10-08 12:20:16,928][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000012448_12746752.pth +[2023-10-08 12:20:17,109][102897] Updated weights for policy 0, policy_version 14100 (0.0009) +[2023-10-08 12:20:17,471][102897] Updated weights for policy 0, policy_version 14110 (0.0010) +[2023-10-08 12:20:17,544][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000014112_14450688.pth... +[2023-10-08 12:20:17,588][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000012416_12713984.pth +[2023-10-08 12:20:19,862][102898] Updated weights for policy 1, policy_version 14120 (0.0009) +[2023-10-08 12:20:20,232][102898] Updated weights for policy 1, policy_version 14130 (0.0009) +[2023-10-08 12:20:20,592][102898] Updated weights for policy 1, policy_version 14140 (0.0009) +[2023-10-08 12:20:21,462][102897] Updated weights for policy 0, policy_version 14120 (0.0009) +[2023-10-08 12:20:21,829][102897] Updated weights for policy 0, policy_version 14130 (0.0007) +[2023-10-08 12:20:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 28934144. Throughput: 0: 1791.9, 1: 1807.2. Samples: 7240518. Policy #0 lag: (min: 17.0, avg: 17.6, max: 32.0) +[2023-10-08 12:20:21,876][101941] Avg episode reward: [(0, '6.990'), (1, '6.600')] +[2023-10-08 12:20:22,194][102897] Updated weights for policy 0, policy_version 14140 (0.0010) +[2023-10-08 12:20:22,343][102634] Saving new best policy, reward=6.990! +[2023-10-08 12:20:24,448][102898] Updated weights for policy 1, policy_version 14150 (0.0009) +[2023-10-08 12:20:24,825][102898] Updated weights for policy 1, policy_version 14160 (0.0008) +[2023-10-08 12:20:25,193][102898] Updated weights for policy 1, policy_version 14170 (0.0007) +[2023-10-08 12:20:25,987][102897] Updated weights for policy 0, policy_version 14150 (0.0011) +[2023-10-08 12:20:26,369][102897] Updated weights for policy 0, policy_version 14160 (0.0010) +[2023-10-08 12:20:26,742][102897] Updated weights for policy 0, policy_version 14170 (0.0007) +[2023-10-08 12:20:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 28999680. Throughput: 0: 1803.5, 1: 1780.0. Samples: 7261324. Policy #0 lag: (min: 17.0, avg: 17.6, max: 32.0) +[2023-10-08 12:20:26,876][101941] Avg episode reward: [(0, '6.730'), (1, '7.010')] +[2023-10-08 12:20:26,876][102760] Saving new best policy, reward=7.010! +[2023-10-08 12:20:28,801][102898] Updated weights for policy 1, policy_version 14180 (0.0008) +[2023-10-08 12:20:29,165][102898] Updated weights for policy 1, policy_version 14190 (0.0008) +[2023-10-08 12:20:29,545][102898] Updated weights for policy 1, policy_version 14200 (0.0008) +[2023-10-08 12:20:30,535][102897] Updated weights for policy 0, policy_version 14180 (0.0008) +[2023-10-08 12:20:30,930][102897] Updated weights for policy 0, policy_version 14190 (0.0009) +[2023-10-08 12:20:31,303][102897] Updated weights for policy 0, policy_version 14200 (0.0010) +[2023-10-08 12:20:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 29097984. Throughput: 0: 1788.8, 1: 1786.5. Samples: 7282374. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:20:31,876][101941] Avg episode reward: [(0, '6.140'), (1, '6.510')] +[2023-10-08 12:20:33,264][102898] Updated weights for policy 1, policy_version 14210 (0.0007) +[2023-10-08 12:20:33,656][102898] Updated weights for policy 1, policy_version 14220 (0.0008) +[2023-10-08 12:20:34,025][102898] Updated weights for policy 1, policy_version 14230 (0.0009) +[2023-10-08 12:20:34,389][102898] Updated weights for policy 1, policy_version 14240 (0.0010) +[2023-10-08 12:20:34,940][102897] Updated weights for policy 0, policy_version 14210 (0.0009) +[2023-10-08 12:20:35,310][102897] Updated weights for policy 0, policy_version 14220 (0.0010) +[2023-10-08 12:20:35,688][102897] Updated weights for policy 0, policy_version 14230 (0.0008) +[2023-10-08 12:20:36,058][102897] Updated weights for policy 0, policy_version 14240 (0.0010) +[2023-10-08 12:20:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 29163520. Throughput: 0: 1791.9, 1: 1785.4. Samples: 7293060. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:20:36,875][101941] Avg episode reward: [(0, '6.370'), (1, '6.460')] +[2023-10-08 12:20:38,215][102898] Updated weights for policy 1, policy_version 14250 (0.0007) +[2023-10-08 12:20:38,593][102898] Updated weights for policy 1, policy_version 14260 (0.0007) +[2023-10-08 12:20:38,961][102898] Updated weights for policy 1, policy_version 14270 (0.0008) +[2023-10-08 12:20:39,801][102897] Updated weights for policy 0, policy_version 14250 (0.0009) +[2023-10-08 12:20:40,171][102897] Updated weights for policy 0, policy_version 14260 (0.0008) +[2023-10-08 12:20:40,535][102897] Updated weights for policy 0, policy_version 14270 (0.0010) +[2023-10-08 12:20:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 29229056. Throughput: 0: 1792.2, 1: 1791.8. Samples: 7314708. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:20:41,876][101941] Avg episode reward: [(0, '6.370'), (1, '6.060')] +[2023-10-08 12:20:42,696][102898] Updated weights for policy 1, policy_version 14280 (0.0008) +[2023-10-08 12:20:43,061][102898] Updated weights for policy 1, policy_version 14290 (0.0010) +[2023-10-08 12:20:43,432][102898] Updated weights for policy 1, policy_version 14300 (0.0009) +[2023-10-08 12:20:44,079][102897] Updated weights for policy 0, policy_version 14280 (0.0009) +[2023-10-08 12:20:44,446][102897] Updated weights for policy 0, policy_version 14290 (0.0007) +[2023-10-08 12:20:44,816][102897] Updated weights for policy 0, policy_version 14300 (0.0009) +[2023-10-08 12:20:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 29294592. Throughput: 0: 1782.6, 1: 1802.7. Samples: 7336918. Policy #0 lag: (min: 31.0, avg: 37.2, max: 63.0) +[2023-10-08 12:20:46,876][101941] Avg episode reward: [(0, '6.120'), (1, '5.840')] +[2023-10-08 12:20:47,053][102898] Updated weights for policy 1, policy_version 14310 (0.0008) +[2023-10-08 12:20:47,432][102898] Updated weights for policy 1, policy_version 14320 (0.0007) +[2023-10-08 12:20:47,793][102898] Updated weights for policy 1, policy_version 14330 (0.0007) +[2023-10-08 12:20:48,655][102897] Updated weights for policy 0, policy_version 14310 (0.0008) +[2023-10-08 12:20:49,018][102897] Updated weights for policy 0, policy_version 14320 (0.0010) +[2023-10-08 12:20:49,393][102897] Updated weights for policy 0, policy_version 14330 (0.0008) +[2023-10-08 12:20:51,690][102898] Updated weights for policy 1, policy_version 14340 (0.0008) +[2023-10-08 12:20:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 29360128. Throughput: 0: 1786.1, 1: 1792.8. Samples: 7347020. Policy #0 lag: (min: 31.0, avg: 37.2, max: 63.0) +[2023-10-08 12:20:51,875][101941] Avg episode reward: [(0, '5.650'), (1, '6.150')] +[2023-10-08 12:20:52,050][102898] Updated weights for policy 1, policy_version 14350 (0.0007) +[2023-10-08 12:20:52,418][102898] Updated weights for policy 1, policy_version 14360 (0.0007) +[2023-10-08 12:20:53,209][102897] Updated weights for policy 0, policy_version 14340 (0.0008) +[2023-10-08 12:20:53,584][102897] Updated weights for policy 0, policy_version 14350 (0.0007) +[2023-10-08 12:20:53,950][102897] Updated weights for policy 0, policy_version 14360 (0.0008) +[2023-10-08 12:20:56,032][102898] Updated weights for policy 1, policy_version 14370 (0.0008) +[2023-10-08 12:20:56,395][102898] Updated weights for policy 1, policy_version 14380 (0.0009) +[2023-10-08 12:20:56,755][102898] Updated weights for policy 1, policy_version 14390 (0.0007) +[2023-10-08 12:20:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 29425664. Throughput: 0: 1773.3, 1: 1799.9. Samples: 7369044. Policy #0 lag: (min: 31.0, avg: 37.2, max: 63.0) +[2023-10-08 12:20:56,875][101941] Avg episode reward: [(0, '6.480'), (1, '6.550')] +[2023-10-08 12:20:57,116][102898] Updated weights for policy 1, policy_version 14400 (0.0007) +[2023-10-08 12:20:57,755][102897] Updated weights for policy 0, policy_version 14370 (0.0008) +[2023-10-08 12:20:58,137][102897] Updated weights for policy 0, policy_version 14380 (0.0008) +[2023-10-08 12:20:58,506][102897] Updated weights for policy 0, policy_version 14390 (0.0007) +[2023-10-08 12:20:58,877][102897] Updated weights for policy 0, policy_version 14400 (0.0009) +[2023-10-08 12:21:00,936][102898] Updated weights for policy 1, policy_version 14410 (0.0007) +[2023-10-08 12:21:01,300][102898] Updated weights for policy 1, policy_version 14420 (0.0008) +[2023-10-08 12:21:01,673][102898] Updated weights for policy 1, policy_version 14430 (0.0007) +[2023-10-08 12:21:01,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 29523968. Throughput: 0: 1780.7, 1: 1798.8. Samples: 7390516. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 12:21:01,876][101941] Avg episode reward: [(0, '6.350'), (1, '6.240')] +[2023-10-08 12:21:02,598][102897] Updated weights for policy 0, policy_version 14410 (0.0007) +[2023-10-08 12:21:02,969][102897] Updated weights for policy 0, policy_version 14420 (0.0007) +[2023-10-08 12:21:03,343][102897] Updated weights for policy 0, policy_version 14430 (0.0009) +[2023-10-08 12:21:05,398][102898] Updated weights for policy 1, policy_version 14440 (0.0008) +[2023-10-08 12:21:05,762][102898] Updated weights for policy 1, policy_version 14450 (0.0011) +[2023-10-08 12:21:06,118][102898] Updated weights for policy 1, policy_version 14460 (0.0009) +[2023-10-08 12:21:06,866][102897] Updated weights for policy 0, policy_version 14440 (0.0008) +[2023-10-08 12:21:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 29589504. Throughput: 0: 1780.9, 1: 1794.9. Samples: 7401430. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 12:21:06,875][101941] Avg episode reward: [(0, '6.650'), (1, '5.810')] +[2023-10-08 12:21:07,237][102897] Updated weights for policy 0, policy_version 14450 (0.0008) +[2023-10-08 12:21:07,614][102897] Updated weights for policy 0, policy_version 14460 (0.0008) +[2023-10-08 12:21:09,849][102898] Updated weights for policy 1, policy_version 14470 (0.0008) +[2023-10-08 12:21:10,217][102898] Updated weights for policy 1, policy_version 14480 (0.0009) +[2023-10-08 12:21:10,580][102898] Updated weights for policy 1, policy_version 14490 (0.0011) +[2023-10-08 12:21:11,465][102897] Updated weights for policy 0, policy_version 14470 (0.0007) +[2023-10-08 12:21:11,841][102897] Updated weights for policy 0, policy_version 14480 (0.0009) +[2023-10-08 12:21:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 29655040. Throughput: 0: 1788.3, 1: 1807.5. Samples: 7423132. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 12:21:11,876][101941] Avg episode reward: [(0, '6.010'), (1, '5.730')] +[2023-10-08 12:21:12,214][102897] Updated weights for policy 0, policy_version 14490 (0.0010) +[2023-10-08 12:21:14,419][102898] Updated weights for policy 1, policy_version 14500 (0.0007) +[2023-10-08 12:21:14,788][102898] Updated weights for policy 1, policy_version 14510 (0.0007) +[2023-10-08 12:21:15,158][102898] Updated weights for policy 1, policy_version 14520 (0.0007) +[2023-10-08 12:21:15,978][102897] Updated weights for policy 0, policy_version 14500 (0.0009) +[2023-10-08 12:21:16,346][102897] Updated weights for policy 0, policy_version 14510 (0.0009) +[2023-10-08 12:21:16,729][102897] Updated weights for policy 0, policy_version 14520 (0.0010) +[2023-10-08 12:21:16,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 29720576. Throughput: 0: 1803.2, 1: 1792.8. Samples: 7444190. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:21:16,876][101941] Avg episode reward: [(0, '5.840'), (1, '5.550')] +[2023-10-08 12:21:19,034][102898] Updated weights for policy 1, policy_version 14530 (0.0009) +[2023-10-08 12:21:19,452][102898] Updated weights for policy 1, policy_version 14540 (0.0010) +[2023-10-08 12:21:19,814][102898] Updated weights for policy 1, policy_version 14550 (0.0007) +[2023-10-08 12:21:20,183][102898] Updated weights for policy 1, policy_version 14560 (0.0008) +[2023-10-08 12:21:20,551][102897] Updated weights for policy 0, policy_version 14530 (0.0011) +[2023-10-08 12:21:20,927][102897] Updated weights for policy 0, policy_version 14540 (0.0009) +[2023-10-08 12:21:21,291][102897] Updated weights for policy 0, policy_version 14550 (0.0008) +[2023-10-08 12:21:21,668][102897] Updated weights for policy 0, policy_version 14560 (0.0010) +[2023-10-08 12:21:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 29818880. Throughput: 0: 1787.2, 1: 1811.1. Samples: 7454986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:21:21,875][101941] Avg episode reward: [(0, '6.250'), (1, '5.610')] +[2023-10-08 12:21:23,802][102898] Updated weights for policy 1, policy_version 14570 (0.0009) +[2023-10-08 12:21:24,168][102898] Updated weights for policy 1, policy_version 14580 (0.0007) +[2023-10-08 12:21:24,533][102898] Updated weights for policy 1, policy_version 14590 (0.0008) +[2023-10-08 12:21:25,494][102897] Updated weights for policy 0, policy_version 14570 (0.0008) +[2023-10-08 12:21:25,860][102897] Updated weights for policy 0, policy_version 14580 (0.0009) +[2023-10-08 12:21:26,237][102897] Updated weights for policy 0, policy_version 14590 (0.0009) +[2023-10-08 12:21:26,875][101941] Fps is (10 sec: 16384.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 29884416. Throughput: 0: 1800.4, 1: 1785.3. Samples: 7476066. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:21:26,875][101941] Avg episode reward: [(0, '6.290'), (1, '5.930')] +[2023-10-08 12:21:28,396][102898] Updated weights for policy 1, policy_version 14600 (0.0008) +[2023-10-08 12:21:28,763][102898] Updated weights for policy 1, policy_version 14610 (0.0008) +[2023-10-08 12:21:29,125][102898] Updated weights for policy 1, policy_version 14620 (0.0008) +[2023-10-08 12:21:30,123][102897] Updated weights for policy 0, policy_version 14600 (0.0007) +[2023-10-08 12:21:30,508][102897] Updated weights for policy 0, policy_version 14610 (0.0009) +[2023-10-08 12:21:30,882][102897] Updated weights for policy 0, policy_version 14620 (0.0009) +[2023-10-08 12:21:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 29949952. Throughput: 0: 1777.0, 1: 1782.5. Samples: 7497096. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:21:31,875][101941] Avg episode reward: [(0, '5.890'), (1, '6.920')] +[2023-10-08 12:21:32,907][102898] Updated weights for policy 1, policy_version 14630 (0.0007) +[2023-10-08 12:21:33,270][102898] Updated weights for policy 1, policy_version 14640 (0.0008) +[2023-10-08 12:21:33,633][102898] Updated weights for policy 1, policy_version 14650 (0.0007) +[2023-10-08 12:21:34,543][102897] Updated weights for policy 0, policy_version 14630 (0.0007) +[2023-10-08 12:21:34,913][102897] Updated weights for policy 0, policy_version 14640 (0.0008) +[2023-10-08 12:21:35,288][102897] Updated weights for policy 0, policy_version 14650 (0.0007) +[2023-10-08 12:21:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 30015488. Throughput: 0: 1805.5, 1: 1780.3. Samples: 7508378. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:21:36,876][101941] Avg episode reward: [(0, '6.070'), (1, '6.410')] +[2023-10-08 12:21:37,317][102898] Updated weights for policy 1, policy_version 14660 (0.0008) +[2023-10-08 12:21:37,695][102898] Updated weights for policy 1, policy_version 14670 (0.0009) +[2023-10-08 12:21:38,060][102898] Updated weights for policy 1, policy_version 14680 (0.0011) +[2023-10-08 12:21:39,069][102897] Updated weights for policy 0, policy_version 14660 (0.0007) +[2023-10-08 12:21:39,448][102897] Updated weights for policy 0, policy_version 14670 (0.0008) +[2023-10-08 12:21:39,813][102897] Updated weights for policy 0, policy_version 14680 (0.0007) +[2023-10-08 12:21:41,717][102898] Updated weights for policy 1, policy_version 14690 (0.0008) +[2023-10-08 12:21:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 30081024. Throughput: 0: 1788.7, 1: 1782.7. Samples: 7529756. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 12:21:41,876][101941] Avg episode reward: [(0, '6.800'), (1, '5.600')] +[2023-10-08 12:21:42,090][102898] Updated weights for policy 1, policy_version 14700 (0.0010) +[2023-10-08 12:21:42,467][102898] Updated weights for policy 1, policy_version 14710 (0.0011) +[2023-10-08 12:21:42,834][102898] Updated weights for policy 1, policy_version 14720 (0.0008) +[2023-10-08 12:21:43,632][102897] Updated weights for policy 0, policy_version 14690 (0.0008) +[2023-10-08 12:21:44,012][102897] Updated weights for policy 0, policy_version 14700 (0.0008) +[2023-10-08 12:21:44,385][102897] Updated weights for policy 0, policy_version 14710 (0.0010) +[2023-10-08 12:21:44,751][102897] Updated weights for policy 0, policy_version 14720 (0.0008) +[2023-10-08 12:21:46,571][102898] Updated weights for policy 1, policy_version 14730 (0.0009) +[2023-10-08 12:21:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 30146560. Throughput: 0: 1777.6, 1: 1806.5. Samples: 7551804. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 12:21:46,876][101941] Avg episode reward: [(0, '7.110'), (1, '5.570')] +[2023-10-08 12:21:46,887][102634] Saving new best policy, reward=7.110! +[2023-10-08 12:21:46,947][102898] Updated weights for policy 1, policy_version 14740 (0.0008) +[2023-10-08 12:21:47,314][102898] Updated weights for policy 1, policy_version 14750 (0.0007) +[2023-10-08 12:21:48,476][102897] Updated weights for policy 0, policy_version 14730 (0.0007) +[2023-10-08 12:21:48,843][102897] Updated weights for policy 0, policy_version 14740 (0.0007) +[2023-10-08 12:21:49,224][102897] Updated weights for policy 0, policy_version 14750 (0.0007) +[2023-10-08 12:21:51,021][102898] Updated weights for policy 1, policy_version 14760 (0.0009) +[2023-10-08 12:21:51,392][102898] Updated weights for policy 1, policy_version 14770 (0.0008) +[2023-10-08 12:21:51,749][102898] Updated weights for policy 1, policy_version 14780 (0.0007) +[2023-10-08 12:21:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 30212096. Throughput: 0: 1781.2, 1: 1782.7. Samples: 7561808. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 12:21:51,876][101941] Avg episode reward: [(0, '6.670'), (1, '5.720')] +[2023-10-08 12:21:53,009][102897] Updated weights for policy 0, policy_version 14760 (0.0010) +[2023-10-08 12:21:53,383][102897] Updated weights for policy 0, policy_version 14770 (0.0010) +[2023-10-08 12:21:53,755][102897] Updated weights for policy 0, policy_version 14780 (0.0008) +[2023-10-08 12:21:55,489][102898] Updated weights for policy 1, policy_version 14790 (0.0008) +[2023-10-08 12:21:55,858][102898] Updated weights for policy 1, policy_version 14800 (0.0009) +[2023-10-08 12:21:56,235][102898] Updated weights for policy 1, policy_version 14810 (0.0007) +[2023-10-08 12:21:56,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 30310400. Throughput: 0: 1771.8, 1: 1805.1. Samples: 7584094. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:21:56,876][101941] Avg episode reward: [(0, '6.640'), (1, '6.060')] +[2023-10-08 12:21:57,478][102897] Updated weights for policy 0, policy_version 14790 (0.0008) +[2023-10-08 12:21:57,856][102897] Updated weights for policy 0, policy_version 14800 (0.0009) +[2023-10-08 12:21:58,230][102897] Updated weights for policy 0, policy_version 14810 (0.0008) +[2023-10-08 12:21:59,879][102898] Updated weights for policy 1, policy_version 14820 (0.0010) +[2023-10-08 12:22:00,242][102898] Updated weights for policy 1, policy_version 14830 (0.0008) +[2023-10-08 12:22:00,610][102898] Updated weights for policy 1, policy_version 14840 (0.0007) +[2023-10-08 12:22:01,855][102897] Updated weights for policy 0, policy_version 14820 (0.0008) +[2023-10-08 12:22:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 30375936. Throughput: 0: 1795.6, 1: 1791.0. Samples: 7605584. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:22:01,876][101941] Avg episode reward: [(0, '5.900'), (1, '6.430')] +[2023-10-08 12:22:02,237][102897] Updated weights for policy 0, policy_version 14830 (0.0009) +[2023-10-08 12:22:02,604][102897] Updated weights for policy 0, policy_version 14840 (0.0010) +[2023-10-08 12:22:04,449][102898] Updated weights for policy 1, policy_version 14850 (0.0010) +[2023-10-08 12:22:04,849][102898] Updated weights for policy 1, policy_version 14860 (0.0007) +[2023-10-08 12:22:05,223][102898] Updated weights for policy 1, policy_version 14870 (0.0007) +[2023-10-08 12:22:05,588][102898] Updated weights for policy 1, policy_version 14880 (0.0008) +[2023-10-08 12:22:06,436][102897] Updated weights for policy 0, policy_version 14850 (0.0010) +[2023-10-08 12:22:06,810][102897] Updated weights for policy 0, policy_version 14860 (0.0010) +[2023-10-08 12:22:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 30441472. Throughput: 0: 1780.9, 1: 1807.5. Samples: 7616468. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:22:06,876][101941] Avg episode reward: [(0, '5.760'), (1, '6.320')] +[2023-10-08 12:22:07,186][102897] Updated weights for policy 0, policy_version 14870 (0.0007) +[2023-10-08 12:22:07,560][102897] Updated weights for policy 0, policy_version 14880 (0.0009) +[2023-10-08 12:22:09,256][102898] Updated weights for policy 1, policy_version 14890 (0.0010) +[2023-10-08 12:22:09,622][102898] Updated weights for policy 1, policy_version 14900 (0.0008) +[2023-10-08 12:22:09,996][102898] Updated weights for policy 1, policy_version 14910 (0.0008) +[2023-10-08 12:22:11,308][102897] Updated weights for policy 0, policy_version 14890 (0.0008) +[2023-10-08 12:22:11,682][102897] Updated weights for policy 0, policy_version 14900 (0.0008) +[2023-10-08 12:22:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 30507008. Throughput: 0: 1793.0, 1: 1805.0. Samples: 7637974. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:22:11,876][101941] Avg episode reward: [(0, '6.020'), (1, '5.910')] +[2023-10-08 12:22:12,052][102897] Updated weights for policy 0, policy_version 14910 (0.0010) +[2023-10-08 12:22:13,756][102898] Updated weights for policy 1, policy_version 14920 (0.0010) +[2023-10-08 12:22:14,123][102898] Updated weights for policy 1, policy_version 14930 (0.0011) +[2023-10-08 12:22:14,496][102898] Updated weights for policy 1, policy_version 14940 (0.0010) +[2023-10-08 12:22:15,770][102897] Updated weights for policy 0, policy_version 14920 (0.0009) +[2023-10-08 12:22:16,138][102897] Updated weights for policy 0, policy_version 14930 (0.0010) +[2023-10-08 12:22:16,515][102897] Updated weights for policy 0, policy_version 14940 (0.0008) +[2023-10-08 12:22:16,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 30605312. Throughput: 0: 1800.6, 1: 1810.2. Samples: 7659580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:22:16,875][101941] Avg episode reward: [(0, '6.920'), (1, '6.040')] +[2023-10-08 12:22:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000014944_15302656.pth... +[2023-10-08 12:22:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000014944_15302656.pth... +[2023-10-08 12:22:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000013248_13565952.pth +[2023-10-08 12:22:16,928][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000013280_13598720.pth +[2023-10-08 12:22:17,856][102898] Updated weights for policy 1, policy_version 14950 (0.0007) +[2023-10-08 12:22:18,230][102898] Updated weights for policy 1, policy_version 14960 (0.0009) +[2023-10-08 12:22:18,591][102898] Updated weights for policy 1, policy_version 14970 (0.0007) +[2023-10-08 12:22:20,233][102897] Updated weights for policy 0, policy_version 14950 (0.0008) +[2023-10-08 12:22:20,610][102897] Updated weights for policy 0, policy_version 14960 (0.0008) +[2023-10-08 12:22:20,989][102897] Updated weights for policy 0, policy_version 14970 (0.0008) +[2023-10-08 12:22:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 30670848. Throughput: 0: 1791.8, 1: 1814.3. Samples: 7670652. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 12:22:21,876][101941] Avg episode reward: [(0, '6.360'), (1, '6.210')] +[2023-10-08 12:22:22,316][102898] Updated weights for policy 1, policy_version 14980 (0.0010) +[2023-10-08 12:22:22,682][102898] Updated weights for policy 1, policy_version 14990 (0.0011) +[2023-10-08 12:22:23,050][102898] Updated weights for policy 1, policy_version 15000 (0.0010) +[2023-10-08 12:22:24,749][102897] Updated weights for policy 0, policy_version 14980 (0.0008) +[2023-10-08 12:22:25,122][102897] Updated weights for policy 0, policy_version 14990 (0.0007) +[2023-10-08 12:22:25,499][102897] Updated weights for policy 0, policy_version 15000 (0.0008) +[2023-10-08 12:22:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 30736384. Throughput: 0: 1797.7, 1: 1810.9. Samples: 7692144. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 12:22:26,875][101941] Avg episode reward: [(0, '5.610'), (1, '5.980')] +[2023-10-08 12:22:26,962][102898] Updated weights for policy 1, policy_version 15010 (0.0010) +[2023-10-08 12:22:27,319][102898] Updated weights for policy 1, policy_version 15020 (0.0008) +[2023-10-08 12:22:27,691][102898] Updated weights for policy 1, policy_version 15030 (0.0008) +[2023-10-08 12:22:28,055][102898] Updated weights for policy 1, policy_version 15040 (0.0008) +[2023-10-08 12:22:29,180][102897] Updated weights for policy 0, policy_version 15010 (0.0009) +[2023-10-08 12:22:29,554][102897] Updated weights for policy 0, policy_version 15020 (0.0007) +[2023-10-08 12:22:29,926][102897] Updated weights for policy 0, policy_version 15030 (0.0007) +[2023-10-08 12:22:30,291][102897] Updated weights for policy 0, policy_version 15040 (0.0008) +[2023-10-08 12:22:31,609][102898] Updated weights for policy 1, policy_version 15050 (0.0010) +[2023-10-08 12:22:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 30801920. Throughput: 0: 1789.5, 1: 1813.4. Samples: 7713936. Policy #0 lag: (min: 5.0, avg: 5.0, max: 5.0) +[2023-10-08 12:22:31,876][101941] Avg episode reward: [(0, '5.500'), (1, '5.170')] +[2023-10-08 12:22:31,971][102898] Updated weights for policy 1, policy_version 15060 (0.0007) +[2023-10-08 12:22:32,342][102898] Updated weights for policy 1, policy_version 15070 (0.0008) +[2023-10-08 12:22:34,108][102897] Updated weights for policy 0, policy_version 15050 (0.0009) +[2023-10-08 12:22:34,482][102897] Updated weights for policy 0, policy_version 15060 (0.0009) +[2023-10-08 12:22:34,870][102897] Updated weights for policy 0, policy_version 15070 (0.0008) +[2023-10-08 12:22:36,150][102898] Updated weights for policy 1, policy_version 15080 (0.0007) +[2023-10-08 12:22:36,524][102898] Updated weights for policy 1, policy_version 15090 (0.0007) +[2023-10-08 12:22:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 30867456. Throughput: 0: 1802.9, 1: 1815.2. Samples: 7724626. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:22:36,876][101941] Avg episode reward: [(0, '5.880'), (1, '5.890')] +[2023-10-08 12:22:36,895][102898] Updated weights for policy 1, policy_version 15100 (0.0007) +[2023-10-08 12:22:38,704][102897] Updated weights for policy 0, policy_version 15080 (0.0009) +[2023-10-08 12:22:39,082][102897] Updated weights for policy 0, policy_version 15090 (0.0007) +[2023-10-08 12:22:39,448][102897] Updated weights for policy 0, policy_version 15100 (0.0007) +[2023-10-08 12:22:40,693][102898] Updated weights for policy 1, policy_version 15110 (0.0007) +[2023-10-08 12:22:41,056][102898] Updated weights for policy 1, policy_version 15120 (0.0008) +[2023-10-08 12:22:41,433][102898] Updated weights for policy 1, policy_version 15130 (0.0008) +[2023-10-08 12:22:41,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 30965760. Throughput: 0: 1791.6, 1: 1810.9. Samples: 7746210. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:22:41,875][101941] Avg episode reward: [(0, '6.240'), (1, '6.190')] +[2023-10-08 12:22:43,152][102897] Updated weights for policy 0, policy_version 15110 (0.0008) +[2023-10-08 12:22:43,532][102897] Updated weights for policy 0, policy_version 15120 (0.0009) +[2023-10-08 12:22:43,907][102897] Updated weights for policy 0, policy_version 15130 (0.0009) +[2023-10-08 12:22:45,348][102898] Updated weights for policy 1, policy_version 15140 (0.0008) +[2023-10-08 12:22:45,718][102898] Updated weights for policy 1, policy_version 15150 (0.0008) +[2023-10-08 12:22:46,079][102898] Updated weights for policy 1, policy_version 15160 (0.0008) +[2023-10-08 12:22:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 31031296. Throughput: 0: 1783.3, 1: 1804.0. Samples: 7767014. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:22:46,876][101941] Avg episode reward: [(0, '6.390'), (1, '5.940')] +[2023-10-08 12:22:47,716][102897] Updated weights for policy 0, policy_version 15140 (0.0008) +[2023-10-08 12:22:48,104][102897] Updated weights for policy 0, policy_version 15150 (0.0008) +[2023-10-08 12:22:48,492][102897] Updated weights for policy 0, policy_version 15160 (0.0009) +[2023-10-08 12:22:49,774][102898] Updated weights for policy 1, policy_version 15170 (0.0010) +[2023-10-08 12:22:50,181][102898] Updated weights for policy 1, policy_version 15180 (0.0008) +[2023-10-08 12:22:50,546][102898] Updated weights for policy 1, policy_version 15190 (0.0010) +[2023-10-08 12:22:50,915][102898] Updated weights for policy 1, policy_version 15200 (0.0007) +[2023-10-08 12:22:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 31096832. Throughput: 0: 1784.7, 1: 1807.0. Samples: 7778094. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:22:51,875][101941] Avg episode reward: [(0, '6.080'), (1, '5.910')] +[2023-10-08 12:22:52,211][102897] Updated weights for policy 0, policy_version 15170 (0.0008) +[2023-10-08 12:22:52,579][102897] Updated weights for policy 0, policy_version 15180 (0.0007) +[2023-10-08 12:22:52,957][102897] Updated weights for policy 0, policy_version 15190 (0.0009) +[2023-10-08 12:22:53,329][102897] Updated weights for policy 0, policy_version 15200 (0.0008) +[2023-10-08 12:22:54,732][102898] Updated weights for policy 1, policy_version 15210 (0.0010) +[2023-10-08 12:22:55,111][102898] Updated weights for policy 1, policy_version 15220 (0.0008) +[2023-10-08 12:22:55,488][102898] Updated weights for policy 1, policy_version 15230 (0.0009) +[2023-10-08 12:22:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 31162368. Throughput: 0: 1786.1, 1: 1794.1. Samples: 7799082. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:22:56,875][101941] Avg episode reward: [(0, '6.330'), (1, '6.270')] +[2023-10-08 12:22:57,053][102897] Updated weights for policy 0, policy_version 15210 (0.0009) +[2023-10-08 12:22:57,423][102897] Updated weights for policy 0, policy_version 15220 (0.0007) +[2023-10-08 12:22:57,801][102897] Updated weights for policy 0, policy_version 15230 (0.0007) +[2023-10-08 12:22:59,338][102898] Updated weights for policy 1, policy_version 15240 (0.0009) +[2023-10-08 12:22:59,698][102898] Updated weights for policy 1, policy_version 15250 (0.0007) +[2023-10-08 12:23:00,073][102898] Updated weights for policy 1, policy_version 15260 (0.0007) +[2023-10-08 12:23:01,558][102897] Updated weights for policy 0, policy_version 15240 (0.0007) +[2023-10-08 12:23:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 31227904. Throughput: 0: 1803.9, 1: 1784.2. Samples: 7821042. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:23:01,875][101941] Avg episode reward: [(0, '5.740'), (1, '6.340')] +[2023-10-08 12:23:01,920][102897] Updated weights for policy 0, policy_version 15250 (0.0008) +[2023-10-08 12:23:02,301][102897] Updated weights for policy 0, policy_version 15260 (0.0009) +[2023-10-08 12:23:03,807][102898] Updated weights for policy 1, policy_version 15270 (0.0010) +[2023-10-08 12:23:04,181][102898] Updated weights for policy 1, policy_version 15280 (0.0010) +[2023-10-08 12:23:04,550][102898] Updated weights for policy 1, policy_version 15290 (0.0008) +[2023-10-08 12:23:05,938][102897] Updated weights for policy 0, policy_version 15270 (0.0009) +[2023-10-08 12:23:06,313][102897] Updated weights for policy 0, policy_version 15280 (0.0009) +[2023-10-08 12:23:06,702][102897] Updated weights for policy 0, policy_version 15290 (0.0011) +[2023-10-08 12:23:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 31293440. Throughput: 0: 1786.1, 1: 1790.1. Samples: 7831580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:23:06,876][101941] Avg episode reward: [(0, '6.120'), (1, '6.120')] +[2023-10-08 12:23:08,269][102898] Updated weights for policy 1, policy_version 15300 (0.0010) +[2023-10-08 12:23:08,641][102898] Updated weights for policy 1, policy_version 15310 (0.0009) +[2023-10-08 12:23:09,013][102898] Updated weights for policy 1, policy_version 15320 (0.0009) +[2023-10-08 12:23:10,403][102897] Updated weights for policy 0, policy_version 15300 (0.0009) +[2023-10-08 12:23:10,781][102897] Updated weights for policy 0, policy_version 15310 (0.0009) +[2023-10-08 12:23:11,153][102897] Updated weights for policy 0, policy_version 15320 (0.0008) +[2023-10-08 12:23:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 31391744. Throughput: 0: 1804.6, 1: 1778.5. Samples: 7853384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:23:11,876][101941] Avg episode reward: [(0, '5.960'), (1, '5.950')] +[2023-10-08 12:23:12,816][102898] Updated weights for policy 1, policy_version 15330 (0.0008) +[2023-10-08 12:23:13,178][102898] Updated weights for policy 1, policy_version 15340 (0.0010) +[2023-10-08 12:23:13,550][102898] Updated weights for policy 1, policy_version 15350 (0.0007) +[2023-10-08 12:23:13,913][102898] Updated weights for policy 1, policy_version 15360 (0.0009) +[2023-10-08 12:23:15,116][102897] Updated weights for policy 0, policy_version 15330 (0.0008) +[2023-10-08 12:23:15,483][102897] Updated weights for policy 0, policy_version 15340 (0.0007) +[2023-10-08 12:23:15,857][102897] Updated weights for policy 0, policy_version 15350 (0.0008) +[2023-10-08 12:23:16,227][102897] Updated weights for policy 0, policy_version 15360 (0.0008) +[2023-10-08 12:23:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 31457280. Throughput: 0: 1785.6, 1: 1779.4. Samples: 7874360. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 12:23:16,875][101941] Avg episode reward: [(0, '6.090'), (1, '5.990')] +[2023-10-08 12:23:17,743][102898] Updated weights for policy 1, policy_version 15370 (0.0008) +[2023-10-08 12:23:18,106][102898] Updated weights for policy 1, policy_version 15380 (0.0011) +[2023-10-08 12:23:18,472][102898] Updated weights for policy 1, policy_version 15390 (0.0010) +[2023-10-08 12:23:19,872][102897] Updated weights for policy 0, policy_version 15370 (0.0008) +[2023-10-08 12:23:20,248][102897] Updated weights for policy 0, policy_version 15380 (0.0010) +[2023-10-08 12:23:20,622][102897] Updated weights for policy 0, policy_version 15390 (0.0011) +[2023-10-08 12:23:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 31522816. Throughput: 0: 1801.6, 1: 1770.2. Samples: 7885360. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 12:23:21,876][101941] Avg episode reward: [(0, '6.220'), (1, '6.300')] +[2023-10-08 12:23:22,408][102898] Updated weights for policy 1, policy_version 15400 (0.0008) +[2023-10-08 12:23:22,781][102898] Updated weights for policy 1, policy_version 15410 (0.0008) +[2023-10-08 12:23:23,145][102898] Updated weights for policy 1, policy_version 15420 (0.0008) +[2023-10-08 12:23:24,452][102897] Updated weights for policy 0, policy_version 15400 (0.0008) +[2023-10-08 12:23:24,813][102897] Updated weights for policy 0, policy_version 15410 (0.0010) +[2023-10-08 12:23:25,189][102897] Updated weights for policy 0, policy_version 15420 (0.0008) +[2023-10-08 12:23:26,792][102898] Updated weights for policy 1, policy_version 15430 (0.0009) +[2023-10-08 12:23:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 31588352. Throughput: 0: 1781.5, 1: 1774.8. Samples: 7906240. Policy #0 lag: (min: 31.0, avg: 31.7, max: 48.0) +[2023-10-08 12:23:26,876][101941] Avg episode reward: [(0, '6.650'), (1, '5.980')] +[2023-10-08 12:23:27,158][102898] Updated weights for policy 1, policy_version 15440 (0.0010) +[2023-10-08 12:23:27,532][102898] Updated weights for policy 1, policy_version 15450 (0.0010) +[2023-10-08 12:23:28,806][102897] Updated weights for policy 0, policy_version 15430 (0.0007) +[2023-10-08 12:23:29,179][102897] Updated weights for policy 0, policy_version 15440 (0.0008) +[2023-10-08 12:23:29,553][102897] Updated weights for policy 0, policy_version 15450 (0.0009) +[2023-10-08 12:23:31,324][102898] Updated weights for policy 1, policy_version 15460 (0.0008) +[2023-10-08 12:23:31,688][102898] Updated weights for policy 1, policy_version 15470 (0.0007) +[2023-10-08 12:23:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 31653888. Throughput: 0: 1779.9, 1: 1797.8. Samples: 7928012. Policy #0 lag: (min: 30.0, avg: 30.3, max: 42.0) +[2023-10-08 12:23:31,876][101941] Avg episode reward: [(0, '6.290'), (1, '6.400')] +[2023-10-08 12:23:32,064][102898] Updated weights for policy 1, policy_version 15480 (0.0008) +[2023-10-08 12:23:33,531][102897] Updated weights for policy 0, policy_version 15460 (0.0008) +[2023-10-08 12:23:33,918][102897] Updated weights for policy 0, policy_version 15470 (0.0008) +[2023-10-08 12:23:34,294][102897] Updated weights for policy 0, policy_version 15480 (0.0007) +[2023-10-08 12:23:35,904][102898] Updated weights for policy 1, policy_version 15490 (0.0007) +[2023-10-08 12:23:36,297][102898] Updated weights for policy 1, policy_version 15500 (0.0007) +[2023-10-08 12:23:36,656][102898] Updated weights for policy 1, policy_version 15510 (0.0007) +[2023-10-08 12:23:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 31719424. Throughput: 0: 1786.8, 1: 1774.5. Samples: 7938356. Policy #0 lag: (min: 30.0, avg: 30.3, max: 42.0) +[2023-10-08 12:23:36,876][101941] Avg episode reward: [(0, '5.520'), (1, '6.740')] +[2023-10-08 12:23:37,028][102898] Updated weights for policy 1, policy_version 15520 (0.0009) +[2023-10-08 12:23:38,004][102897] Updated weights for policy 0, policy_version 15490 (0.0008) +[2023-10-08 12:23:38,375][102897] Updated weights for policy 0, policy_version 15500 (0.0010) +[2023-10-08 12:23:38,742][102897] Updated weights for policy 0, policy_version 15510 (0.0008) +[2023-10-08 12:23:39,112][102897] Updated weights for policy 0, policy_version 15520 (0.0008) +[2023-10-08 12:23:40,830][102898] Updated weights for policy 1, policy_version 15530 (0.0007) +[2023-10-08 12:23:41,196][102898] Updated weights for policy 1, policy_version 15540 (0.0009) +[2023-10-08 12:23:41,555][102898] Updated weights for policy 1, policy_version 15550 (0.0008) +[2023-10-08 12:23:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 31817728. Throughput: 0: 1773.9, 1: 1803.4. Samples: 7960062. Policy #0 lag: (min: 30.0, avg: 30.3, max: 42.0) +[2023-10-08 12:23:41,876][101941] Avg episode reward: [(0, '5.810'), (1, '6.190')] +[2023-10-08 12:23:42,939][102897] Updated weights for policy 0, policy_version 15530 (0.0008) +[2023-10-08 12:23:43,308][102897] Updated weights for policy 0, policy_version 15540 (0.0008) +[2023-10-08 12:23:43,673][102897] Updated weights for policy 0, policy_version 15550 (0.0009) +[2023-10-08 12:23:45,133][102898] Updated weights for policy 1, policy_version 15560 (0.0008) +[2023-10-08 12:23:45,491][102898] Updated weights for policy 1, policy_version 15570 (0.0009) +[2023-10-08 12:23:45,855][102898] Updated weights for policy 1, policy_version 15580 (0.0008) +[2023-10-08 12:23:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 31883264. Throughput: 0: 1781.5, 1: 1777.4. Samples: 7981196. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:23:46,876][101941] Avg episode reward: [(0, '5.810'), (1, '6.040')] +[2023-10-08 12:23:47,504][102897] Updated weights for policy 0, policy_version 15560 (0.0008) +[2023-10-08 12:23:47,878][102897] Updated weights for policy 0, policy_version 15570 (0.0008) +[2023-10-08 12:23:48,255][102897] Updated weights for policy 0, policy_version 15580 (0.0010) +[2023-10-08 12:23:49,706][102898] Updated weights for policy 1, policy_version 15590 (0.0009) +[2023-10-08 12:23:50,072][102898] Updated weights for policy 1, policy_version 15600 (0.0009) +[2023-10-08 12:23:50,448][102898] Updated weights for policy 1, policy_version 15610 (0.0010) +[2023-10-08 12:23:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 31948800. Throughput: 0: 1770.5, 1: 1802.7. Samples: 7992374. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:23:51,875][101941] Avg episode reward: [(0, '6.170'), (1, '6.370')] +[2023-10-08 12:23:52,093][102897] Updated weights for policy 0, policy_version 15590 (0.0008) +[2023-10-08 12:23:52,470][102897] Updated weights for policy 0, policy_version 15600 (0.0007) +[2023-10-08 12:23:52,844][102897] Updated weights for policy 0, policy_version 15610 (0.0007) +[2023-10-08 12:23:54,308][102898] Updated weights for policy 1, policy_version 15620 (0.0010) +[2023-10-08 12:23:54,688][102898] Updated weights for policy 1, policy_version 15630 (0.0010) +[2023-10-08 12:23:55,055][102898] Updated weights for policy 1, policy_version 15640 (0.0010) +[2023-10-08 12:23:56,557][102897] Updated weights for policy 0, policy_version 15620 (0.0007) +[2023-10-08 12:23:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 32014336. Throughput: 0: 1776.3, 1: 1774.3. Samples: 8013164. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:23:56,876][101941] Avg episode reward: [(0, '6.550'), (1, '5.930')] +[2023-10-08 12:23:56,929][102897] Updated weights for policy 0, policy_version 15630 (0.0007) +[2023-10-08 12:23:57,307][102897] Updated weights for policy 0, policy_version 15640 (0.0008) +[2023-10-08 12:23:58,753][102898] Updated weights for policy 1, policy_version 15650 (0.0010) +[2023-10-08 12:23:59,116][102898] Updated weights for policy 1, policy_version 15660 (0.0010) +[2023-10-08 12:23:59,491][102898] Updated weights for policy 1, policy_version 15670 (0.0008) +[2023-10-08 12:23:59,861][102898] Updated weights for policy 1, policy_version 15680 (0.0007) +[2023-10-08 12:24:01,110][102897] Updated weights for policy 0, policy_version 15650 (0.0009) +[2023-10-08 12:24:01,484][102897] Updated weights for policy 0, policy_version 15660 (0.0009) +[2023-10-08 12:24:01,865][102897] Updated weights for policy 0, policy_version 15670 (0.0008) +[2023-10-08 12:24:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 32079872. Throughput: 0: 1797.4, 1: 1773.4. Samples: 8035044. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 12:24:01,876][101941] Avg episode reward: [(0, '6.690'), (1, '5.870')] +[2023-10-08 12:24:02,243][102897] Updated weights for policy 0, policy_version 15680 (0.0009) +[2023-10-08 12:24:03,761][102898] Updated weights for policy 1, policy_version 15690 (0.0007) +[2023-10-08 12:24:04,121][102898] Updated weights for policy 1, policy_version 15700 (0.0008) +[2023-10-08 12:24:04,491][102898] Updated weights for policy 1, policy_version 15710 (0.0010) +[2023-10-08 12:24:06,087][102897] Updated weights for policy 0, policy_version 15690 (0.0008) +[2023-10-08 12:24:06,456][102897] Updated weights for policy 0, policy_version 15700 (0.0007) +[2023-10-08 12:24:06,831][102897] Updated weights for policy 0, policy_version 15710 (0.0007) +[2023-10-08 12:24:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 32145408. Throughput: 0: 1774.5, 1: 1779.9. Samples: 8045308. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 12:24:06,876][101941] Avg episode reward: [(0, '6.350'), (1, '5.810')] +[2023-10-08 12:24:08,312][102898] Updated weights for policy 1, policy_version 15720 (0.0009) +[2023-10-08 12:24:08,694][102898] Updated weights for policy 1, policy_version 15730 (0.0009) +[2023-10-08 12:24:09,060][102898] Updated weights for policy 1, policy_version 15740 (0.0008) +[2023-10-08 12:24:10,519][102897] Updated weights for policy 0, policy_version 15720 (0.0009) +[2023-10-08 12:24:10,893][102897] Updated weights for policy 0, policy_version 15730 (0.0010) +[2023-10-08 12:24:11,275][102897] Updated weights for policy 0, policy_version 15740 (0.0010) +[2023-10-08 12:24:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 32243712. Throughput: 0: 1801.5, 1: 1771.6. Samples: 8067028. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:11,876][101941] Avg episode reward: [(0, '5.920'), (1, '5.650')] +[2023-10-08 12:24:12,800][102898] Updated weights for policy 1, policy_version 15750 (0.0008) +[2023-10-08 12:24:13,164][102898] Updated weights for policy 1, policy_version 15760 (0.0009) +[2023-10-08 12:24:13,536][102898] Updated weights for policy 1, policy_version 15770 (0.0008) +[2023-10-08 12:24:14,997][102897] Updated weights for policy 0, policy_version 15750 (0.0010) +[2023-10-08 12:24:15,373][102897] Updated weights for policy 0, policy_version 15760 (0.0010) +[2023-10-08 12:24:15,747][102897] Updated weights for policy 0, policy_version 15770 (0.0010) +[2023-10-08 12:24:16,875][101941] Fps is (10 sec: 16383.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 32309248. Throughput: 0: 1778.6, 1: 1787.4. Samples: 8088480. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:16,876][101941] Avg episode reward: [(0, '6.270'), (1, '5.850')] +[2023-10-08 12:24:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000015776_16154624.pth... +[2023-10-08 12:24:16,890][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000015776_16154624.pth... +[2023-10-08 12:24:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000014112_14450688.pth +[2023-10-08 12:24:16,932][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000014112_14450688.pth +[2023-10-08 12:24:17,349][102898] Updated weights for policy 1, policy_version 15780 (0.0009) +[2023-10-08 12:24:17,709][102898] Updated weights for policy 1, policy_version 15790 (0.0007) +[2023-10-08 12:24:18,075][102898] Updated weights for policy 1, policy_version 15800 (0.0008) +[2023-10-08 12:24:19,619][102897] Updated weights for policy 0, policy_version 15780 (0.0009) +[2023-10-08 12:24:20,018][102897] Updated weights for policy 0, policy_version 15790 (0.0010) +[2023-10-08 12:24:20,390][102897] Updated weights for policy 0, policy_version 15800 (0.0011) +[2023-10-08 12:24:21,751][102898] Updated weights for policy 1, policy_version 15810 (0.0008) +[2023-10-08 12:24:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 32374784. Throughput: 0: 1807.4, 1: 1774.8. Samples: 8099554. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:21,876][101941] Avg episode reward: [(0, '5.990'), (1, '6.080')] +[2023-10-08 12:24:22,130][102898] Updated weights for policy 1, policy_version 15820 (0.0007) +[2023-10-08 12:24:22,504][102898] Updated weights for policy 1, policy_version 15830 (0.0010) +[2023-10-08 12:24:22,868][102898] Updated weights for policy 1, policy_version 15840 (0.0008) +[2023-10-08 12:24:24,066][102897] Updated weights for policy 0, policy_version 15810 (0.0010) +[2023-10-08 12:24:24,429][102897] Updated weights for policy 0, policy_version 15820 (0.0009) +[2023-10-08 12:24:24,809][102897] Updated weights for policy 0, policy_version 15830 (0.0010) +[2023-10-08 12:24:25,191][102897] Updated weights for policy 0, policy_version 15840 (0.0007) +[2023-10-08 12:24:26,601][102898] Updated weights for policy 1, policy_version 15850 (0.0009) +[2023-10-08 12:24:26,875][101941] Fps is (10 sec: 13107.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 32440320. Throughput: 0: 1778.8, 1: 1780.1. Samples: 8120212. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:26,876][101941] Avg episode reward: [(0, '5.770'), (1, '6.370')] +[2023-10-08 12:24:26,973][102898] Updated weights for policy 1, policy_version 15860 (0.0007) +[2023-10-08 12:24:27,336][102898] Updated weights for policy 1, policy_version 15870 (0.0007) +[2023-10-08 12:24:28,754][102897] Updated weights for policy 0, policy_version 15850 (0.0007) +[2023-10-08 12:24:29,129][102897] Updated weights for policy 0, policy_version 15860 (0.0010) +[2023-10-08 12:24:29,503][102897] Updated weights for policy 0, policy_version 15870 (0.0008) +[2023-10-08 12:24:30,990][102898] Updated weights for policy 1, policy_version 15880 (0.0007) +[2023-10-08 12:24:31,354][102898] Updated weights for policy 1, policy_version 15890 (0.0007) +[2023-10-08 12:24:31,714][102898] Updated weights for policy 1, policy_version 15900 (0.0010) +[2023-10-08 12:24:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 32538624. Throughput: 0: 1777.3, 1: 1793.3. Samples: 8141874. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:31,875][101941] Avg episode reward: [(0, '5.820'), (1, '6.670')] +[2023-10-08 12:24:33,330][102897] Updated weights for policy 0, policy_version 15880 (0.0008) +[2023-10-08 12:24:33,697][102897] Updated weights for policy 0, policy_version 15890 (0.0007) +[2023-10-08 12:24:34,076][102897] Updated weights for policy 0, policy_version 15900 (0.0008) +[2023-10-08 12:24:35,644][102898] Updated weights for policy 1, policy_version 15910 (0.0009) +[2023-10-08 12:24:36,011][102898] Updated weights for policy 1, policy_version 15920 (0.0009) +[2023-10-08 12:24:36,363][102898] Updated weights for policy 1, policy_version 15930 (0.0009) +[2023-10-08 12:24:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 32604160. Throughput: 0: 1778.1, 1: 1776.0. Samples: 8152308. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:36,875][101941] Avg episode reward: [(0, '6.790'), (1, '6.510')] +[2023-10-08 12:24:37,770][102897] Updated weights for policy 0, policy_version 15910 (0.0009) +[2023-10-08 12:24:38,131][102897] Updated weights for policy 0, policy_version 15920 (0.0007) +[2023-10-08 12:24:38,512][102897] Updated weights for policy 0, policy_version 15930 (0.0010) +[2023-10-08 12:24:40,241][102898] Updated weights for policy 1, policy_version 15940 (0.0010) +[2023-10-08 12:24:40,609][102898] Updated weights for policy 1, policy_version 15950 (0.0007) +[2023-10-08 12:24:40,978][102898] Updated weights for policy 1, policy_version 15960 (0.0009) +[2023-10-08 12:24:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 32669696. Throughput: 0: 1776.3, 1: 1800.5. Samples: 8174120. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:41,876][101941] Avg episode reward: [(0, '6.700'), (1, '6.460')] +[2023-10-08 12:24:42,341][102897] Updated weights for policy 0, policy_version 15940 (0.0007) +[2023-10-08 12:24:42,717][102897] Updated weights for policy 0, policy_version 15950 (0.0008) +[2023-10-08 12:24:43,097][102897] Updated weights for policy 0, policy_version 15960 (0.0011) +[2023-10-08 12:24:44,737][102898] Updated weights for policy 1, policy_version 15970 (0.0007) +[2023-10-08 12:24:45,102][102898] Updated weights for policy 1, policy_version 15980 (0.0008) +[2023-10-08 12:24:45,473][102898] Updated weights for policy 1, policy_version 15990 (0.0008) +[2023-10-08 12:24:45,842][102898] Updated weights for policy 1, policy_version 16000 (0.0009) +[2023-10-08 12:24:46,723][102897] Updated weights for policy 0, policy_version 15970 (0.0009) +[2023-10-08 12:24:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 32735232. Throughput: 0: 1787.9, 1: 1778.4. Samples: 8195528. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:46,875][101941] Avg episode reward: [(0, '6.370'), (1, '6.020')] +[2023-10-08 12:24:47,108][102897] Updated weights for policy 0, policy_version 15980 (0.0010) +[2023-10-08 12:24:47,485][102897] Updated weights for policy 0, policy_version 15990 (0.0009) +[2023-10-08 12:24:47,854][102897] Updated weights for policy 0, policy_version 16000 (0.0008) +[2023-10-08 12:24:49,658][102898] Updated weights for policy 1, policy_version 16010 (0.0010) +[2023-10-08 12:24:50,021][102898] Updated weights for policy 1, policy_version 16020 (0.0011) +[2023-10-08 12:24:50,388][102898] Updated weights for policy 1, policy_version 16030 (0.0010) +[2023-10-08 12:24:51,801][102897] Updated weights for policy 0, policy_version 16010 (0.0010) +[2023-10-08 12:24:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 32800768. Throughput: 0: 1774.1, 1: 1803.4. Samples: 8206294. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:24:51,875][101941] Avg episode reward: [(0, '6.220'), (1, '6.480')] +[2023-10-08 12:24:52,164][102897] Updated weights for policy 0, policy_version 16020 (0.0010) +[2023-10-08 12:24:52,547][102897] Updated weights for policy 0, policy_version 16030 (0.0010) +[2023-10-08 12:24:54,111][102898] Updated weights for policy 1, policy_version 16040 (0.0009) +[2023-10-08 12:24:54,473][102898] Updated weights for policy 1, policy_version 16050 (0.0009) +[2023-10-08 12:24:54,843][102898] Updated weights for policy 1, policy_version 16060 (0.0009) +[2023-10-08 12:24:56,437][102897] Updated weights for policy 0, policy_version 16040 (0.0009) +[2023-10-08 12:24:56,804][102897] Updated weights for policy 0, policy_version 16050 (0.0008) +[2023-10-08 12:24:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 32866304. Throughput: 0: 1779.2, 1: 1783.5. Samples: 8227348. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:24:56,876][101941] Avg episode reward: [(0, '6.610'), (1, '6.810')] +[2023-10-08 12:24:57,174][102897] Updated weights for policy 0, policy_version 16060 (0.0010) +[2023-10-08 12:24:58,499][102898] Updated weights for policy 1, policy_version 16070 (0.0007) +[2023-10-08 12:24:58,868][102898] Updated weights for policy 1, policy_version 16080 (0.0008) +[2023-10-08 12:24:59,227][102898] Updated weights for policy 1, policy_version 16090 (0.0008) +[2023-10-08 12:25:00,833][102897] Updated weights for policy 0, policy_version 16070 (0.0007) +[2023-10-08 12:25:01,210][102897] Updated weights for policy 0, policy_version 16080 (0.0007) +[2023-10-08 12:25:01,576][102897] Updated weights for policy 0, policy_version 16090 (0.0008) +[2023-10-08 12:25:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 32964608. Throughput: 0: 1787.9, 1: 1785.6. Samples: 8249284. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 12:25:01,876][101941] Avg episode reward: [(0, '6.350'), (1, '6.960')] +[2023-10-08 12:25:02,985][102898] Updated weights for policy 1, policy_version 16100 (0.0008) +[2023-10-08 12:25:03,348][102898] Updated weights for policy 1, policy_version 16110 (0.0010) +[2023-10-08 12:25:03,716][102898] Updated weights for policy 1, policy_version 16120 (0.0009) +[2023-10-08 12:25:05,421][102897] Updated weights for policy 0, policy_version 16100 (0.0010) +[2023-10-08 12:25:05,815][102897] Updated weights for policy 0, policy_version 16110 (0.0007) +[2023-10-08 12:25:06,180][102897] Updated weights for policy 0, policy_version 16120 (0.0008) +[2023-10-08 12:25:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 33030144. Throughput: 0: 1773.0, 1: 1789.8. Samples: 8259878. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 12:25:06,876][101941] Avg episode reward: [(0, '6.000'), (1, '6.990')] +[2023-10-08 12:25:07,462][102898] Updated weights for policy 1, policy_version 16130 (0.0008) +[2023-10-08 12:25:07,860][102898] Updated weights for policy 1, policy_version 16140 (0.0010) +[2023-10-08 12:25:08,227][102898] Updated weights for policy 1, policy_version 16150 (0.0010) +[2023-10-08 12:25:08,595][102898] Updated weights for policy 1, policy_version 16160 (0.0009) +[2023-10-08 12:25:10,103][102897] Updated weights for policy 0, policy_version 16130 (0.0009) +[2023-10-08 12:25:10,474][102897] Updated weights for policy 0, policy_version 16140 (0.0008) +[2023-10-08 12:25:10,849][102897] Updated weights for policy 0, policy_version 16150 (0.0007) +[2023-10-08 12:25:11,230][102897] Updated weights for policy 0, policy_version 16160 (0.0007) +[2023-10-08 12:25:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 33095680. Throughput: 0: 1796.0, 1: 1785.6. Samples: 8281380. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 12:25:11,875][101941] Avg episode reward: [(0, '6.600'), (1, '6.520')] +[2023-10-08 12:25:12,495][102898] Updated weights for policy 1, policy_version 16170 (0.0007) +[2023-10-08 12:25:12,857][102898] Updated weights for policy 1, policy_version 16180 (0.0007) +[2023-10-08 12:25:13,227][102898] Updated weights for policy 1, policy_version 16190 (0.0007) +[2023-10-08 12:25:14,987][102897] Updated weights for policy 0, policy_version 16170 (0.0007) +[2023-10-08 12:25:15,351][102897] Updated weights for policy 0, policy_version 16180 (0.0009) +[2023-10-08 12:25:15,729][102897] Updated weights for policy 0, policy_version 16190 (0.0009) +[2023-10-08 12:25:16,798][102898] Updated weights for policy 1, policy_version 16200 (0.0009) +[2023-10-08 12:25:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 33161216. Throughput: 0: 1775.8, 1: 1808.8. Samples: 8303182. Policy #0 lag: (min: 31.0, avg: 32.7, max: 59.0) +[2023-10-08 12:25:16,875][101941] Avg episode reward: [(0, '6.890'), (1, '6.370')] +[2023-10-08 12:25:17,159][102898] Updated weights for policy 1, policy_version 16210 (0.0008) +[2023-10-08 12:25:17,532][102898] Updated weights for policy 1, policy_version 16220 (0.0008) +[2023-10-08 12:25:19,364][102897] Updated weights for policy 0, policy_version 16200 (0.0010) +[2023-10-08 12:25:19,746][102897] Updated weights for policy 0, policy_version 16210 (0.0007) +[2023-10-08 12:25:20,125][102897] Updated weights for policy 0, policy_version 16220 (0.0010) +[2023-10-08 12:25:21,370][102898] Updated weights for policy 1, policy_version 16230 (0.0007) +[2023-10-08 12:25:21,743][102898] Updated weights for policy 1, policy_version 16240 (0.0007) +[2023-10-08 12:25:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 33226752. Throughput: 0: 1808.6, 1: 1790.2. Samples: 8314256. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:25:21,876][101941] Avg episode reward: [(0, '6.730'), (1, '6.300')] +[2023-10-08 12:25:22,106][102898] Updated weights for policy 1, policy_version 16250 (0.0009) +[2023-10-08 12:25:23,835][102897] Updated weights for policy 0, policy_version 16230 (0.0009) +[2023-10-08 12:25:24,209][102897] Updated weights for policy 0, policy_version 16240 (0.0009) +[2023-10-08 12:25:24,590][102897] Updated weights for policy 0, policy_version 16250 (0.0007) +[2023-10-08 12:25:25,956][102898] Updated weights for policy 1, policy_version 16260 (0.0008) +[2023-10-08 12:25:26,324][102898] Updated weights for policy 1, policy_version 16270 (0.0009) +[2023-10-08 12:25:26,692][102898] Updated weights for policy 1, policy_version 16280 (0.0009) +[2023-10-08 12:25:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 33292288. Throughput: 0: 1780.5, 1: 1800.2. Samples: 8335252. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:25:26,875][101941] Avg episode reward: [(0, '6.390'), (1, '6.580')] +[2023-10-08 12:25:28,202][102897] Updated weights for policy 0, policy_version 16260 (0.0009) +[2023-10-08 12:25:28,572][102897] Updated weights for policy 0, policy_version 16270 (0.0010) +[2023-10-08 12:25:28,935][102897] Updated weights for policy 0, policy_version 16280 (0.0011) +[2023-10-08 12:25:30,426][102898] Updated weights for policy 1, policy_version 16290 (0.0011) +[2023-10-08 12:25:30,794][102898] Updated weights for policy 1, policy_version 16300 (0.0009) +[2023-10-08 12:25:31,162][102898] Updated weights for policy 1, policy_version 16310 (0.0007) +[2023-10-08 12:25:31,537][102898] Updated weights for policy 1, policy_version 16320 (0.0009) +[2023-10-08 12:25:31,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 33390592. Throughput: 0: 1780.1, 1: 1793.7. Samples: 8356350. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:25:31,876][101941] Avg episode reward: [(0, '5.800'), (1, '6.420')] +[2023-10-08 12:25:32,653][102897] Updated weights for policy 0, policy_version 16290 (0.0009) +[2023-10-08 12:25:33,033][102897] Updated weights for policy 0, policy_version 16300 (0.0008) +[2023-10-08 12:25:33,399][102897] Updated weights for policy 0, policy_version 16310 (0.0010) +[2023-10-08 12:25:33,773][102897] Updated weights for policy 0, policy_version 16320 (0.0010) +[2023-10-08 12:25:35,438][102898] Updated weights for policy 1, policy_version 16330 (0.0008) +[2023-10-08 12:25:35,808][102898] Updated weights for policy 1, policy_version 16340 (0.0011) +[2023-10-08 12:25:36,179][102898] Updated weights for policy 1, policy_version 16350 (0.0007) +[2023-10-08 12:25:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 33456128. Throughput: 0: 1784.0, 1: 1792.5. Samples: 8367236. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:25:36,876][101941] Avg episode reward: [(0, '6.090'), (1, '5.560')] +[2023-10-08 12:25:37,594][102897] Updated weights for policy 0, policy_version 16330 (0.0009) +[2023-10-08 12:25:37,963][102897] Updated weights for policy 0, policy_version 16340 (0.0008) +[2023-10-08 12:25:38,350][102897] Updated weights for policy 0, policy_version 16350 (0.0008) +[2023-10-08 12:25:39,832][102898] Updated weights for policy 1, policy_version 16360 (0.0009) +[2023-10-08 12:25:40,197][102898] Updated weights for policy 1, policy_version 16370 (0.0008) +[2023-10-08 12:25:40,561][102898] Updated weights for policy 1, policy_version 16380 (0.0008) +[2023-10-08 12:25:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 33521664. Throughput: 0: 1787.2, 1: 1796.6. Samples: 8388620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:25:41,875][101941] Avg episode reward: [(0, '6.010'), (1, '5.910')] +[2023-10-08 12:25:42,145][102897] Updated weights for policy 0, policy_version 16360 (0.0008) +[2023-10-08 12:25:42,518][102897] Updated weights for policy 0, policy_version 16370 (0.0008) +[2023-10-08 12:25:42,897][102897] Updated weights for policy 0, policy_version 16380 (0.0007) +[2023-10-08 12:25:44,319][102898] Updated weights for policy 1, policy_version 16390 (0.0008) +[2023-10-08 12:25:44,696][102898] Updated weights for policy 1, policy_version 16400 (0.0008) +[2023-10-08 12:25:45,059][102898] Updated weights for policy 1, policy_version 16410 (0.0009) +[2023-10-08 12:25:46,570][102897] Updated weights for policy 0, policy_version 16390 (0.0007) +[2023-10-08 12:25:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 33587200. Throughput: 0: 1807.9, 1: 1777.7. Samples: 8410638. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:25:46,876][101941] Avg episode reward: [(0, '6.700'), (1, '5.850')] +[2023-10-08 12:25:46,939][102897] Updated weights for policy 0, policy_version 16400 (0.0008) +[2023-10-08 12:25:47,316][102897] Updated weights for policy 0, policy_version 16410 (0.0009) +[2023-10-08 12:25:48,857][102898] Updated weights for policy 1, policy_version 16420 (0.0008) +[2023-10-08 12:25:49,228][102898] Updated weights for policy 1, policy_version 16430 (0.0007) +[2023-10-08 12:25:49,594][102898] Updated weights for policy 1, policy_version 16440 (0.0007) +[2023-10-08 12:25:51,203][102897] Updated weights for policy 0, policy_version 16420 (0.0010) +[2023-10-08 12:25:51,571][102897] Updated weights for policy 0, policy_version 16430 (0.0008) +[2023-10-08 12:25:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 33652736. Throughput: 0: 1791.6, 1: 1787.5. Samples: 8420938. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:25:51,876][101941] Avg episode reward: [(0, '6.220'), (1, '5.840')] +[2023-10-08 12:25:51,944][102897] Updated weights for policy 0, policy_version 16440 (0.0007) +[2023-10-08 12:25:53,440][102898] Updated weights for policy 1, policy_version 16450 (0.0009) +[2023-10-08 12:25:53,814][102898] Updated weights for policy 1, policy_version 16460 (0.0010) +[2023-10-08 12:25:54,177][102898] Updated weights for policy 1, policy_version 16470 (0.0008) +[2023-10-08 12:25:54,547][102898] Updated weights for policy 1, policy_version 16480 (0.0007) +[2023-10-08 12:25:55,666][102897] Updated weights for policy 0, policy_version 16450 (0.0007) +[2023-10-08 12:25:56,052][102897] Updated weights for policy 0, policy_version 16460 (0.0009) +[2023-10-08 12:25:56,428][102897] Updated weights for policy 0, policy_version 16470 (0.0008) +[2023-10-08 12:25:56,795][102897] Updated weights for policy 0, policy_version 16480 (0.0009) +[2023-10-08 12:25:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 33751040. Throughput: 0: 1805.4, 1: 1775.1. Samples: 8442502. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:25:56,876][101941] Avg episode reward: [(0, '5.700'), (1, '5.570')] +[2023-10-08 12:25:58,353][102898] Updated weights for policy 1, policy_version 16490 (0.0008) +[2023-10-08 12:25:58,731][102898] Updated weights for policy 1, policy_version 16500 (0.0010) +[2023-10-08 12:25:59,099][102898] Updated weights for policy 1, policy_version 16510 (0.0007) +[2023-10-08 12:26:00,490][102897] Updated weights for policy 0, policy_version 16490 (0.0007) +[2023-10-08 12:26:00,867][102897] Updated weights for policy 0, policy_version 16500 (0.0008) +[2023-10-08 12:26:01,231][102897] Updated weights for policy 0, policy_version 16510 (0.0008) +[2023-10-08 12:26:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 33816576. Throughput: 0: 1788.5, 1: 1770.9. Samples: 8463354. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 12:26:01,875][101941] Avg episode reward: [(0, '6.150'), (1, '6.180')] +[2023-10-08 12:26:02,939][102898] Updated weights for policy 1, policy_version 16520 (0.0010) +[2023-10-08 12:26:03,308][102898] Updated weights for policy 1, policy_version 16530 (0.0007) +[2023-10-08 12:26:03,664][102898] Updated weights for policy 1, policy_version 16540 (0.0007) +[2023-10-08 12:26:04,888][102897] Updated weights for policy 0, policy_version 16520 (0.0010) +[2023-10-08 12:26:05,261][102897] Updated weights for policy 0, policy_version 16530 (0.0010) +[2023-10-08 12:26:05,640][102897] Updated weights for policy 0, policy_version 16540 (0.0010) +[2023-10-08 12:26:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 33882112. Throughput: 0: 1793.9, 1: 1770.3. Samples: 8474646. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 12:26:06,876][101941] Avg episode reward: [(0, '6.370'), (1, '6.570')] +[2023-10-08 12:26:07,296][102898] Updated weights for policy 1, policy_version 16550 (0.0007) +[2023-10-08 12:26:07,659][102898] Updated weights for policy 1, policy_version 16560 (0.0007) +[2023-10-08 12:26:08,024][102898] Updated weights for policy 1, policy_version 16570 (0.0007) +[2023-10-08 12:26:09,484][102897] Updated weights for policy 0, policy_version 16550 (0.0008) +[2023-10-08 12:26:09,863][102897] Updated weights for policy 0, policy_version 16560 (0.0007) +[2023-10-08 12:26:10,245][102897] Updated weights for policy 0, policy_version 16570 (0.0008) +[2023-10-08 12:26:11,725][102898] Updated weights for policy 1, policy_version 16580 (0.0009) +[2023-10-08 12:26:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 33947648. Throughput: 0: 1793.7, 1: 1781.0. Samples: 8496112. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 12:26:11,876][101941] Avg episode reward: [(0, '5.650'), (1, '6.680')] +[2023-10-08 12:26:12,084][102898] Updated weights for policy 1, policy_version 16590 (0.0008) +[2023-10-08 12:26:12,456][102898] Updated weights for policy 1, policy_version 16600 (0.0008) +[2023-10-08 12:26:13,885][102897] Updated weights for policy 0, policy_version 16580 (0.0009) +[2023-10-08 12:26:14,247][102897] Updated weights for policy 0, policy_version 16590 (0.0011) +[2023-10-08 12:26:14,618][102897] Updated weights for policy 0, policy_version 16600 (0.0010) +[2023-10-08 12:26:16,158][102898] Updated weights for policy 1, policy_version 16610 (0.0008) +[2023-10-08 12:26:16,534][102898] Updated weights for policy 1, policy_version 16620 (0.0007) +[2023-10-08 12:26:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 34013184. Throughput: 0: 1791.6, 1: 1802.0. Samples: 8518062. Policy #0 lag: (min: 31.0, avg: 44.0, max: 63.0) +[2023-10-08 12:26:16,876][101941] Avg episode reward: [(0, '5.650'), (1, '6.660')] +[2023-10-08 12:26:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000016608_17006592.pth... +[2023-10-08 12:26:16,904][102898] Updated weights for policy 1, policy_version 16630 (0.0009) +[2023-10-08 12:26:16,914][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000014944_15302656.pth +[2023-10-08 12:26:16,918][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000016608_17006592.pth +[2023-10-08 12:26:17,271][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000016640_17039360.pth... +[2023-10-08 12:26:17,276][102898] Updated weights for policy 1, policy_version 16640 (0.0009) +[2023-10-08 12:26:17,299][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000014944_15302656.pth +[2023-10-08 12:26:17,303][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000016640_17039360.pth +[2023-10-08 12:26:18,393][102897] Updated weights for policy 0, policy_version 16610 (0.0008) +[2023-10-08 12:26:18,762][102897] Updated weights for policy 0, policy_version 16620 (0.0007) +[2023-10-08 12:26:19,135][102897] Updated weights for policy 0, policy_version 16630 (0.0007) +[2023-10-08 12:26:19,501][102897] Updated weights for policy 0, policy_version 16640 (0.0009) +[2023-10-08 12:26:21,016][102898] Updated weights for policy 1, policy_version 16650 (0.0008) +[2023-10-08 12:26:21,377][102898] Updated weights for policy 1, policy_version 16660 (0.0010) +[2023-10-08 12:26:21,750][102898] Updated weights for policy 1, policy_version 16670 (0.0010) +[2023-10-08 12:26:21,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 34111488. Throughput: 0: 1800.8, 1: 1785.6. Samples: 8528624. Policy #0 lag: (min: 31.0, avg: 44.0, max: 63.0) +[2023-10-08 12:26:21,876][101941] Avg episode reward: [(0, '6.130'), (1, '6.730')] +[2023-10-08 12:26:23,259][102897] Updated weights for policy 0, policy_version 16650 (0.0011) +[2023-10-08 12:26:23,643][102897] Updated weights for policy 0, policy_version 16660 (0.0010) +[2023-10-08 12:26:24,014][102897] Updated weights for policy 0, policy_version 16670 (0.0011) +[2023-10-08 12:26:25,479][102898] Updated weights for policy 1, policy_version 16680 (0.0009) +[2023-10-08 12:26:25,847][102898] Updated weights for policy 1, policy_version 16690 (0.0007) +[2023-10-08 12:26:26,218][102898] Updated weights for policy 1, policy_version 16700 (0.0008) +[2023-10-08 12:26:26,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 34177024. Throughput: 0: 1796.4, 1: 1802.0. Samples: 8550550. Policy #0 lag: (min: 31.0, avg: 44.0, max: 63.0) +[2023-10-08 12:26:26,876][101941] Avg episode reward: [(0, '6.780'), (1, '6.180')] +[2023-10-08 12:26:27,670][102897] Updated weights for policy 0, policy_version 16680 (0.0008) +[2023-10-08 12:26:28,046][102897] Updated weights for policy 0, policy_version 16690 (0.0009) +[2023-10-08 12:26:28,428][102897] Updated weights for policy 0, policy_version 16700 (0.0007) +[2023-10-08 12:26:29,992][102898] Updated weights for policy 1, policy_version 16710 (0.0007) +[2023-10-08 12:26:30,362][102898] Updated weights for policy 1, policy_version 16720 (0.0008) +[2023-10-08 12:26:30,720][102898] Updated weights for policy 1, policy_version 16730 (0.0009) +[2023-10-08 12:26:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 34242560. Throughput: 0: 1799.3, 1: 1792.1. Samples: 8572250. Policy #0 lag: (min: 22.0, avg: 23.3, max: 46.0) +[2023-10-08 12:26:31,876][101941] Avg episode reward: [(0, '6.070'), (1, '6.320')] +[2023-10-08 12:26:32,036][102897] Updated weights for policy 0, policy_version 16710 (0.0007) +[2023-10-08 12:26:32,406][102897] Updated weights for policy 0, policy_version 16720 (0.0008) +[2023-10-08 12:26:32,788][102897] Updated weights for policy 0, policy_version 16730 (0.0009) +[2023-10-08 12:26:34,487][102898] Updated weights for policy 1, policy_version 16740 (0.0008) +[2023-10-08 12:26:34,846][102898] Updated weights for policy 1, policy_version 16750 (0.0009) +[2023-10-08 12:26:35,210][102898] Updated weights for policy 1, policy_version 16760 (0.0010) +[2023-10-08 12:26:36,513][102897] Updated weights for policy 0, policy_version 16740 (0.0010) +[2023-10-08 12:26:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 34308096. Throughput: 0: 1801.1, 1: 1810.9. Samples: 8583476. Policy #0 lag: (min: 22.0, avg: 23.3, max: 46.0) +[2023-10-08 12:26:36,876][101941] Avg episode reward: [(0, '5.970'), (1, '6.050')] +[2023-10-08 12:26:36,899][102897] Updated weights for policy 0, policy_version 16750 (0.0010) +[2023-10-08 12:26:37,276][102897] Updated weights for policy 0, policy_version 16760 (0.0009) +[2023-10-08 12:26:38,836][102898] Updated weights for policy 1, policy_version 16770 (0.0009) +[2023-10-08 12:26:39,198][102898] Updated weights for policy 1, policy_version 16780 (0.0008) +[2023-10-08 12:26:39,566][102898] Updated weights for policy 1, policy_version 16790 (0.0009) +[2023-10-08 12:26:39,943][102898] Updated weights for policy 1, policy_version 16800 (0.0008) +[2023-10-08 12:26:40,940][102897] Updated weights for policy 0, policy_version 16770 (0.0009) +[2023-10-08 12:26:41,314][102897] Updated weights for policy 0, policy_version 16780 (0.0008) +[2023-10-08 12:26:41,689][102897] Updated weights for policy 0, policy_version 16790 (0.0007) +[2023-10-08 12:26:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 34373632. Throughput: 0: 1801.7, 1: 1798.8. Samples: 8604522. Policy #0 lag: (min: 22.0, avg: 23.3, max: 46.0) +[2023-10-08 12:26:41,876][101941] Avg episode reward: [(0, '6.060'), (1, '5.870')] +[2023-10-08 12:26:42,062][102897] Updated weights for policy 0, policy_version 16800 (0.0007) +[2023-10-08 12:26:44,026][102898] Updated weights for policy 1, policy_version 16810 (0.0007) +[2023-10-08 12:26:44,384][102898] Updated weights for policy 1, policy_version 16820 (0.0008) +[2023-10-08 12:26:44,751][102898] Updated weights for policy 1, policy_version 16830 (0.0009) +[2023-10-08 12:26:45,869][102897] Updated weights for policy 0, policy_version 16810 (0.0008) +[2023-10-08 12:26:46,245][102897] Updated weights for policy 0, policy_version 16820 (0.0007) +[2023-10-08 12:26:46,620][102897] Updated weights for policy 0, policy_version 16830 (0.0007) +[2023-10-08 12:26:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 34471936. Throughput: 0: 1813.1, 1: 1792.2. Samples: 8625592. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:26:46,876][101941] Avg episode reward: [(0, '6.150'), (1, '6.100')] +[2023-10-08 12:26:48,424][102898] Updated weights for policy 1, policy_version 16840 (0.0009) +[2023-10-08 12:26:48,790][102898] Updated weights for policy 1, policy_version 16850 (0.0010) +[2023-10-08 12:26:49,166][102898] Updated weights for policy 1, policy_version 16860 (0.0007) +[2023-10-08 12:26:50,143][102897] Updated weights for policy 0, policy_version 16840 (0.0009) +[2023-10-08 12:26:50,512][102897] Updated weights for policy 0, policy_version 16850 (0.0009) +[2023-10-08 12:26:50,881][102897] Updated weights for policy 0, policy_version 16860 (0.0009) +[2023-10-08 12:26:51,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 34537472. Throughput: 0: 1804.8, 1: 1792.7. Samples: 8636532. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:26:51,875][101941] Avg episode reward: [(0, '6.080'), (1, '6.540')] +[2023-10-08 12:26:53,021][102898] Updated weights for policy 1, policy_version 16870 (0.0009) +[2023-10-08 12:26:53,386][102898] Updated weights for policy 1, policy_version 16880 (0.0008) +[2023-10-08 12:26:53,749][102898] Updated weights for policy 1, policy_version 16890 (0.0007) +[2023-10-08 12:26:54,799][102897] Updated weights for policy 0, policy_version 16870 (0.0008) +[2023-10-08 12:26:55,175][102897] Updated weights for policy 0, policy_version 16880 (0.0009) +[2023-10-08 12:26:55,551][102897] Updated weights for policy 0, policy_version 16890 (0.0008) +[2023-10-08 12:26:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 34603008. Throughput: 0: 1807.7, 1: 1782.6. Samples: 8657672. Policy #0 lag: (min: 31.0, avg: 35.6, max: 63.0) +[2023-10-08 12:26:56,875][101941] Avg episode reward: [(0, '6.510'), (1, '6.640')] +[2023-10-08 12:26:57,442][102898] Updated weights for policy 1, policy_version 16900 (0.0008) +[2023-10-08 12:26:57,808][102898] Updated weights for policy 1, policy_version 16910 (0.0008) +[2023-10-08 12:26:58,177][102898] Updated weights for policy 1, policy_version 16920 (0.0008) +[2023-10-08 12:26:59,194][102897] Updated weights for policy 0, policy_version 16900 (0.0008) +[2023-10-08 12:26:59,565][102897] Updated weights for policy 0, policy_version 16910 (0.0009) +[2023-10-08 12:26:59,940][102897] Updated weights for policy 0, policy_version 16920 (0.0008) +[2023-10-08 12:27:01,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 34668544. Throughput: 0: 1798.0, 1: 1791.9. Samples: 8679608. Policy #0 lag: (min: 31.0, avg: 35.6, max: 63.0) +[2023-10-08 12:27:01,876][101941] Avg episode reward: [(0, '6.180'), (1, '6.840')] +[2023-10-08 12:27:01,893][102898] Updated weights for policy 1, policy_version 16930 (0.0007) +[2023-10-08 12:27:02,256][102898] Updated weights for policy 1, policy_version 16940 (0.0007) +[2023-10-08 12:27:02,620][102898] Updated weights for policy 1, policy_version 16950 (0.0007) +[2023-10-08 12:27:02,989][102898] Updated weights for policy 1, policy_version 16960 (0.0007) +[2023-10-08 12:27:03,725][102897] Updated weights for policy 0, policy_version 16930 (0.0008) +[2023-10-08 12:27:04,102][102897] Updated weights for policy 0, policy_version 16940 (0.0008) +[2023-10-08 12:27:04,483][102897] Updated weights for policy 0, policy_version 16950 (0.0008) +[2023-10-08 12:27:04,847][102897] Updated weights for policy 0, policy_version 16960 (0.0008) +[2023-10-08 12:27:06,763][102898] Updated weights for policy 1, policy_version 16970 (0.0009) +[2023-10-08 12:27:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 34734080. Throughput: 0: 1803.2, 1: 1785.4. Samples: 8690112. Policy #0 lag: (min: 31.0, avg: 35.6, max: 63.0) +[2023-10-08 12:27:06,876][101941] Avg episode reward: [(0, '5.200'), (1, '6.640')] +[2023-10-08 12:27:07,136][102898] Updated weights for policy 1, policy_version 16980 (0.0008) +[2023-10-08 12:27:07,516][102898] Updated weights for policy 1, policy_version 16990 (0.0008) +[2023-10-08 12:27:08,650][102897] Updated weights for policy 0, policy_version 16970 (0.0008) +[2023-10-08 12:27:09,027][102897] Updated weights for policy 0, policy_version 16980 (0.0007) +[2023-10-08 12:27:09,393][102897] Updated weights for policy 0, policy_version 16990 (0.0009) +[2023-10-08 12:27:11,293][102898] Updated weights for policy 1, policy_version 17000 (0.0008) +[2023-10-08 12:27:11,660][102898] Updated weights for policy 1, policy_version 17010 (0.0009) +[2023-10-08 12:27:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 34799616. Throughput: 0: 1789.0, 1: 1797.2. Samples: 8711926. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:11,876][101941] Avg episode reward: [(0, '5.270'), (1, '6.440')] +[2023-10-08 12:27:12,024][102898] Updated weights for policy 1, policy_version 17020 (0.0009) +[2023-10-08 12:27:13,280][102897] Updated weights for policy 0, policy_version 17000 (0.0008) +[2023-10-08 12:27:13,652][102897] Updated weights for policy 0, policy_version 17010 (0.0008) +[2023-10-08 12:27:14,015][102897] Updated weights for policy 0, policy_version 17020 (0.0011) +[2023-10-08 12:27:15,776][102898] Updated weights for policy 1, policy_version 17030 (0.0008) +[2023-10-08 12:27:16,147][102898] Updated weights for policy 1, policy_version 17040 (0.0009) +[2023-10-08 12:27:16,510][102898] Updated weights for policy 1, policy_version 17050 (0.0009) +[2023-10-08 12:27:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 34897920. Throughput: 0: 1781.7, 1: 1794.9. Samples: 8733198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:16,876][101941] Avg episode reward: [(0, '5.750'), (1, '6.270')] +[2023-10-08 12:27:17,800][102897] Updated weights for policy 0, policy_version 17030 (0.0009) +[2023-10-08 12:27:18,178][102897] Updated weights for policy 0, policy_version 17040 (0.0008) +[2023-10-08 12:27:18,540][102897] Updated weights for policy 0, policy_version 17050 (0.0008) +[2023-10-08 12:27:20,349][102898] Updated weights for policy 1, policy_version 17060 (0.0007) +[2023-10-08 12:27:20,717][102898] Updated weights for policy 1, policy_version 17070 (0.0007) +[2023-10-08 12:27:21,085][102898] Updated weights for policy 1, policy_version 17080 (0.0008) +[2023-10-08 12:27:21,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 34963456. Throughput: 0: 1776.1, 1: 1787.7. Samples: 8743846. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:21,876][101941] Avg episode reward: [(0, '5.900'), (1, '6.110')] +[2023-10-08 12:27:22,356][102897] Updated weights for policy 0, policy_version 17060 (0.0010) +[2023-10-08 12:27:22,724][102897] Updated weights for policy 0, policy_version 17070 (0.0010) +[2023-10-08 12:27:23,097][102897] Updated weights for policy 0, policy_version 17080 (0.0009) +[2023-10-08 12:27:24,601][102898] Updated weights for policy 1, policy_version 17090 (0.0008) +[2023-10-08 12:27:24,967][102898] Updated weights for policy 1, policy_version 17100 (0.0008) +[2023-10-08 12:27:25,342][102898] Updated weights for policy 1, policy_version 17110 (0.0008) +[2023-10-08 12:27:25,697][102898] Updated weights for policy 1, policy_version 17120 (0.0009) +[2023-10-08 12:27:26,717][102897] Updated weights for policy 0, policy_version 17090 (0.0009) +[2023-10-08 12:27:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35028992. Throughput: 0: 1777.6, 1: 1796.9. Samples: 8765372. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:26,876][101941] Avg episode reward: [(0, '6.020'), (1, '6.230')] +[2023-10-08 12:27:27,077][102897] Updated weights for policy 0, policy_version 17100 (0.0008) +[2023-10-08 12:27:27,456][102897] Updated weights for policy 0, policy_version 17110 (0.0008) +[2023-10-08 12:27:27,830][102897] Updated weights for policy 0, policy_version 17120 (0.0010) +[2023-10-08 12:27:29,666][102898] Updated weights for policy 1, policy_version 17130 (0.0007) +[2023-10-08 12:27:30,031][102898] Updated weights for policy 1, policy_version 17140 (0.0008) +[2023-10-08 12:27:30,403][102898] Updated weights for policy 1, policy_version 17150 (0.0007) +[2023-10-08 12:27:31,501][102897] Updated weights for policy 0, policy_version 17130 (0.0009) +[2023-10-08 12:27:31,875][102897] Updated weights for policy 0, policy_version 17140 (0.0010) +[2023-10-08 12:27:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 35094528. Throughput: 0: 1802.5, 1: 1794.0. Samples: 8787432. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:31,876][101941] Avg episode reward: [(0, '6.060'), (1, '6.810')] +[2023-10-08 12:27:32,259][102897] Updated weights for policy 0, policy_version 17150 (0.0007) +[2023-10-08 12:27:34,010][102898] Updated weights for policy 1, policy_version 17160 (0.0008) +[2023-10-08 12:27:34,376][102898] Updated weights for policy 1, policy_version 17170 (0.0009) +[2023-10-08 12:27:34,743][102898] Updated weights for policy 1, policy_version 17180 (0.0008) +[2023-10-08 12:27:36,121][102897] Updated weights for policy 0, policy_version 17160 (0.0009) +[2023-10-08 12:27:36,502][102897] Updated weights for policy 0, policy_version 17170 (0.0008) +[2023-10-08 12:27:36,865][102897] Updated weights for policy 0, policy_version 17180 (0.0008) +[2023-10-08 12:27:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 35160064. Throughput: 0: 1778.0, 1: 1806.8. Samples: 8797850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:36,875][101941] Avg episode reward: [(0, '5.990'), (1, '6.320')] +[2023-10-08 12:27:38,582][102898] Updated weights for policy 1, policy_version 17190 (0.0008) +[2023-10-08 12:27:38,949][102898] Updated weights for policy 1, policy_version 17200 (0.0009) +[2023-10-08 12:27:39,311][102898] Updated weights for policy 1, policy_version 17210 (0.0007) +[2023-10-08 12:27:40,689][102897] Updated weights for policy 0, policy_version 17190 (0.0010) +[2023-10-08 12:27:41,063][102897] Updated weights for policy 0, policy_version 17200 (0.0009) +[2023-10-08 12:27:41,444][102897] Updated weights for policy 0, policy_version 17210 (0.0008) +[2023-10-08 12:27:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 35258368. Throughput: 0: 1805.2, 1: 1794.9. Samples: 8819678. Policy #0 lag: (min: 3.0, avg: 3.1, max: 9.0) +[2023-10-08 12:27:41,875][101941] Avg episode reward: [(0, '6.030'), (1, '6.100')] +[2023-10-08 12:27:43,029][102898] Updated weights for policy 1, policy_version 17220 (0.0007) +[2023-10-08 12:27:43,391][102898] Updated weights for policy 1, policy_version 17230 (0.0008) +[2023-10-08 12:27:43,770][102898] Updated weights for policy 1, policy_version 17240 (0.0009) +[2023-10-08 12:27:45,164][102897] Updated weights for policy 0, policy_version 17220 (0.0008) +[2023-10-08 12:27:45,539][102897] Updated weights for policy 0, policy_version 17230 (0.0008) +[2023-10-08 12:27:45,903][102897] Updated weights for policy 0, policy_version 17240 (0.0009) +[2023-10-08 12:27:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 35323904. Throughput: 0: 1781.0, 1: 1796.8. Samples: 8840610. Policy #0 lag: (min: 3.0, avg: 3.1, max: 9.0) +[2023-10-08 12:27:46,876][101941] Avg episode reward: [(0, '6.580'), (1, '6.360')] +[2023-10-08 12:27:47,426][102898] Updated weights for policy 1, policy_version 17250 (0.0009) +[2023-10-08 12:27:47,802][102898] Updated weights for policy 1, policy_version 17260 (0.0009) +[2023-10-08 12:27:48,162][102898] Updated weights for policy 1, policy_version 17270 (0.0010) +[2023-10-08 12:27:48,529][102898] Updated weights for policy 1, policy_version 17280 (0.0008) +[2023-10-08 12:27:49,759][102897] Updated weights for policy 0, policy_version 17250 (0.0009) +[2023-10-08 12:27:50,141][102897] Updated weights for policy 0, policy_version 17260 (0.0007) +[2023-10-08 12:27:50,511][102897] Updated weights for policy 0, policy_version 17270 (0.0008) +[2023-10-08 12:27:50,882][102897] Updated weights for policy 0, policy_version 17280 (0.0011) +[2023-10-08 12:27:51,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 35389440. Throughput: 0: 1800.7, 1: 1792.6. Samples: 8851810. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:51,876][101941] Avg episode reward: [(0, '6.070'), (1, '6.350')] +[2023-10-08 12:27:52,328][102898] Updated weights for policy 1, policy_version 17290 (0.0007) +[2023-10-08 12:27:52,702][102898] Updated weights for policy 1, policy_version 17300 (0.0008) +[2023-10-08 12:27:53,069][102898] Updated weights for policy 1, policy_version 17310 (0.0009) +[2023-10-08 12:27:54,530][102897] Updated weights for policy 0, policy_version 17290 (0.0009) +[2023-10-08 12:27:54,890][102897] Updated weights for policy 0, policy_version 17300 (0.0011) +[2023-10-08 12:27:55,262][102897] Updated weights for policy 0, policy_version 17310 (0.0010) +[2023-10-08 12:27:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35454976. Throughput: 0: 1786.0, 1: 1788.5. Samples: 8872776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:27:56,875][101941] Avg episode reward: [(0, '5.740'), (1, '6.170')] +[2023-10-08 12:27:56,878][102898] Updated weights for policy 1, policy_version 17320 (0.0007) +[2023-10-08 12:27:57,244][102898] Updated weights for policy 1, policy_version 17330 (0.0011) +[2023-10-08 12:27:57,627][102898] Updated weights for policy 1, policy_version 17340 (0.0009) +[2023-10-08 12:27:59,102][102897] Updated weights for policy 0, policy_version 17320 (0.0008) +[2023-10-08 12:27:59,481][102897] Updated weights for policy 0, policy_version 17330 (0.0009) +[2023-10-08 12:27:59,854][102897] Updated weights for policy 0, policy_version 17340 (0.0007) +[2023-10-08 12:28:01,368][102898] Updated weights for policy 1, policy_version 17350 (0.0008) +[2023-10-08 12:28:01,740][102898] Updated weights for policy 1, policy_version 17360 (0.0008) +[2023-10-08 12:28:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35520512. Throughput: 0: 1783.1, 1: 1807.2. Samples: 8894762. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:28:01,876][101941] Avg episode reward: [(0, '6.470'), (1, '6.340')] +[2023-10-08 12:28:02,103][102898] Updated weights for policy 1, policy_version 17370 (0.0010) +[2023-10-08 12:28:03,609][102897] Updated weights for policy 0, policy_version 17350 (0.0008) +[2023-10-08 12:28:03,986][102897] Updated weights for policy 0, policy_version 17360 (0.0010) +[2023-10-08 12:28:04,360][102897] Updated weights for policy 0, policy_version 17370 (0.0011) +[2023-10-08 12:28:05,868][102898] Updated weights for policy 1, policy_version 17380 (0.0009) +[2023-10-08 12:28:06,239][102898] Updated weights for policy 1, policy_version 17390 (0.0010) +[2023-10-08 12:28:06,603][102898] Updated weights for policy 1, policy_version 17400 (0.0010) +[2023-10-08 12:28:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 35586048. Throughput: 0: 1794.9, 1: 1794.1. Samples: 8905348. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 12:28:06,876][101941] Avg episode reward: [(0, '6.410'), (1, '6.720')] +[2023-10-08 12:28:08,209][102897] Updated weights for policy 0, policy_version 17380 (0.0010) +[2023-10-08 12:28:08,608][102897] Updated weights for policy 0, policy_version 17390 (0.0008) +[2023-10-08 12:28:08,981][102897] Updated weights for policy 0, policy_version 17400 (0.0007) +[2023-10-08 12:28:10,438][102898] Updated weights for policy 1, policy_version 17410 (0.0011) +[2023-10-08 12:28:10,800][102898] Updated weights for policy 1, policy_version 17420 (0.0010) +[2023-10-08 12:28:11,181][102898] Updated weights for policy 1, policy_version 17430 (0.0010) +[2023-10-08 12:28:11,551][102898] Updated weights for policy 1, policy_version 17440 (0.0010) +[2023-10-08 12:28:11,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 35684352. Throughput: 0: 1781.0, 1: 1807.2. Samples: 8926842. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 12:28:11,876][101941] Avg episode reward: [(0, '5.970'), (1, '6.810')] +[2023-10-08 12:28:12,788][102897] Updated weights for policy 0, policy_version 17410 (0.0007) +[2023-10-08 12:28:13,167][102897] Updated weights for policy 0, policy_version 17420 (0.0011) +[2023-10-08 12:28:13,541][102897] Updated weights for policy 0, policy_version 17430 (0.0008) +[2023-10-08 12:28:13,914][102897] Updated weights for policy 0, policy_version 17440 (0.0008) +[2023-10-08 12:28:15,314][102898] Updated weights for policy 1, policy_version 17450 (0.0007) +[2023-10-08 12:28:15,683][102898] Updated weights for policy 1, policy_version 17460 (0.0008) +[2023-10-08 12:28:16,049][102898] Updated weights for policy 1, policy_version 17470 (0.0007) +[2023-10-08 12:28:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35749888. Throughput: 0: 1782.9, 1: 1788.3. Samples: 8948134. Policy #0 lag: (min: 31.0, avg: 37.5, max: 63.0) +[2023-10-08 12:28:16,876][101941] Avg episode reward: [(0, '5.850'), (1, '6.820')] +[2023-10-08 12:28:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000017440_17858560.pth... +[2023-10-08 12:28:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000017472_17891328.pth... +[2023-10-08 12:28:16,926][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000015776_16154624.pth +[2023-10-08 12:28:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000015776_16154624.pth +[2023-10-08 12:28:17,674][102897] Updated weights for policy 0, policy_version 17450 (0.0009) +[2023-10-08 12:28:18,050][102897] Updated weights for policy 0, policy_version 17460 (0.0011) +[2023-10-08 12:28:18,419][102897] Updated weights for policy 0, policy_version 17470 (0.0010) +[2023-10-08 12:28:19,739][102898] Updated weights for policy 1, policy_version 17480 (0.0007) +[2023-10-08 12:28:20,114][102898] Updated weights for policy 1, policy_version 17490 (0.0007) +[2023-10-08 12:28:20,485][102898] Updated weights for policy 1, policy_version 17500 (0.0010) +[2023-10-08 12:28:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35815424. Throughput: 0: 1776.7, 1: 1808.5. Samples: 8959182. Policy #0 lag: (min: 3.0, avg: 3.4, max: 17.0) +[2023-10-08 12:28:21,875][101941] Avg episode reward: [(0, '5.890'), (1, '6.800')] +[2023-10-08 12:28:22,229][102897] Updated weights for policy 0, policy_version 17480 (0.0011) +[2023-10-08 12:28:22,606][102897] Updated weights for policy 0, policy_version 17490 (0.0010) +[2023-10-08 12:28:22,965][102897] Updated weights for policy 0, policy_version 17500 (0.0009) +[2023-10-08 12:28:24,051][102898] Updated weights for policy 1, policy_version 17510 (0.0009) +[2023-10-08 12:28:24,424][102898] Updated weights for policy 1, policy_version 17520 (0.0007) +[2023-10-08 12:28:24,786][102898] Updated weights for policy 1, policy_version 17530 (0.0008) +[2023-10-08 12:28:26,666][102897] Updated weights for policy 0, policy_version 17510 (0.0010) +[2023-10-08 12:28:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35880960. Throughput: 0: 1770.2, 1: 1793.5. Samples: 8980046. Policy #0 lag: (min: 3.0, avg: 3.4, max: 17.0) +[2023-10-08 12:28:26,875][101941] Avg episode reward: [(0, '6.150'), (1, '6.530')] +[2023-10-08 12:28:27,047][102897] Updated weights for policy 0, policy_version 17520 (0.0008) +[2023-10-08 12:28:27,420][102897] Updated weights for policy 0, policy_version 17530 (0.0007) +[2023-10-08 12:28:28,453][102898] Updated weights for policy 1, policy_version 17540 (0.0008) +[2023-10-08 12:28:28,828][102898] Updated weights for policy 1, policy_version 17550 (0.0007) +[2023-10-08 12:28:29,190][102898] Updated weights for policy 1, policy_version 17560 (0.0007) +[2023-10-08 12:28:31,224][102897] Updated weights for policy 0, policy_version 17540 (0.0008) +[2023-10-08 12:28:31,584][102897] Updated weights for policy 0, policy_version 17550 (0.0009) +[2023-10-08 12:28:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 35946496. Throughput: 0: 1793.2, 1: 1794.2. Samples: 9002042. Policy #0 lag: (min: 3.0, avg: 3.4, max: 17.0) +[2023-10-08 12:28:31,875][101941] Avg episode reward: [(0, '6.790'), (1, '6.640')] +[2023-10-08 12:28:31,966][102897] Updated weights for policy 0, policy_version 17560 (0.0008) +[2023-10-08 12:28:32,961][102898] Updated weights for policy 1, policy_version 17570 (0.0007) +[2023-10-08 12:28:33,337][102898] Updated weights for policy 1, policy_version 17580 (0.0007) +[2023-10-08 12:28:33,710][102898] Updated weights for policy 1, policy_version 17590 (0.0009) +[2023-10-08 12:28:34,080][102898] Updated weights for policy 1, policy_version 17600 (0.0007) +[2023-10-08 12:28:35,762][102897] Updated weights for policy 0, policy_version 17570 (0.0007) +[2023-10-08 12:28:36,143][102897] Updated weights for policy 0, policy_version 17580 (0.0008) +[2023-10-08 12:28:36,519][102897] Updated weights for policy 0, policy_version 17590 (0.0008) +[2023-10-08 12:28:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 36012032. Throughput: 0: 1770.5, 1: 1795.7. Samples: 9012292. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 12:28:36,876][101941] Avg episode reward: [(0, '6.500'), (1, '6.820')] +[2023-10-08 12:28:36,884][102897] Updated weights for policy 0, policy_version 17600 (0.0008) +[2023-10-08 12:28:37,805][102898] Updated weights for policy 1, policy_version 17610 (0.0009) +[2023-10-08 12:28:38,173][102898] Updated weights for policy 1, policy_version 17620 (0.0008) +[2023-10-08 12:28:38,552][102898] Updated weights for policy 1, policy_version 17630 (0.0007) +[2023-10-08 12:28:40,596][102897] Updated weights for policy 0, policy_version 17610 (0.0007) +[2023-10-08 12:28:40,965][102897] Updated weights for policy 0, policy_version 17620 (0.0008) +[2023-10-08 12:28:41,346][102897] Updated weights for policy 0, policy_version 17630 (0.0009) +[2023-10-08 12:28:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 36110336. Throughput: 0: 1799.4, 1: 1793.4. Samples: 9034450. Policy #0 lag: (min: 31.0, avg: 37.9, max: 63.0) +[2023-10-08 12:28:41,876][101941] Avg episode reward: [(0, '6.160'), (1, '6.530')] +[2023-10-08 12:28:42,350][102898] Updated weights for policy 1, policy_version 17640 (0.0007) +[2023-10-08 12:28:42,714][102898] Updated weights for policy 1, policy_version 17650 (0.0007) +[2023-10-08 12:28:43,082][102898] Updated weights for policy 1, policy_version 17660 (0.0007) +[2023-10-08 12:28:45,155][102897] Updated weights for policy 0, policy_version 17640 (0.0007) +[2023-10-08 12:28:45,534][102897] Updated weights for policy 0, policy_version 17650 (0.0010) +[2023-10-08 12:28:45,908][102897] Updated weights for policy 0, policy_version 17660 (0.0011) +[2023-10-08 12:28:46,771][102898] Updated weights for policy 1, policy_version 17670 (0.0008) +[2023-10-08 12:28:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 36175872. Throughput: 0: 1773.0, 1: 1802.5. Samples: 9055662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:28:46,876][101941] Avg episode reward: [(0, '6.040'), (1, '6.600')] +[2023-10-08 12:28:47,144][102898] Updated weights for policy 1, policy_version 17680 (0.0007) +[2023-10-08 12:28:47,507][102898] Updated weights for policy 1, policy_version 17690 (0.0008) +[2023-10-08 12:28:49,710][102897] Updated weights for policy 0, policy_version 17670 (0.0008) +[2023-10-08 12:28:50,081][102897] Updated weights for policy 0, policy_version 17680 (0.0009) +[2023-10-08 12:28:50,454][102897] Updated weights for policy 0, policy_version 17690 (0.0008) +[2023-10-08 12:28:51,422][102898] Updated weights for policy 1, policy_version 17700 (0.0009) +[2023-10-08 12:28:51,776][102898] Updated weights for policy 1, policy_version 17710 (0.0009) +[2023-10-08 12:28:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 36241408. Throughput: 0: 1799.5, 1: 1790.2. Samples: 9066884. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:28:51,876][101941] Avg episode reward: [(0, '5.950'), (1, '7.020')] +[2023-10-08 12:28:52,141][102898] Updated weights for policy 1, policy_version 17720 (0.0010) +[2023-10-08 12:28:52,430][102760] Saving new best policy, reward=7.020! +[2023-10-08 12:28:54,114][102897] Updated weights for policy 0, policy_version 17700 (0.0010) +[2023-10-08 12:28:54,488][102897] Updated weights for policy 0, policy_version 17710 (0.0008) +[2023-10-08 12:28:54,861][102897] Updated weights for policy 0, policy_version 17720 (0.0011) +[2023-10-08 12:28:55,911][102898] Updated weights for policy 1, policy_version 17730 (0.0011) +[2023-10-08 12:28:56,284][102898] Updated weights for policy 1, policy_version 17740 (0.0007) +[2023-10-08 12:28:56,648][102898] Updated weights for policy 1, policy_version 17750 (0.0010) +[2023-10-08 12:28:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 36306944. Throughput: 0: 1774.8, 1: 1794.7. Samples: 9087468. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:28:56,875][101941] Avg episode reward: [(0, '5.950'), (1, '6.890')] +[2023-10-08 12:28:57,015][102898] Updated weights for policy 1, policy_version 17760 (0.0008) +[2023-10-08 12:28:58,595][102897] Updated weights for policy 0, policy_version 17730 (0.0009) +[2023-10-08 12:28:58,995][102897] Updated weights for policy 0, policy_version 17740 (0.0008) +[2023-10-08 12:28:59,373][102897] Updated weights for policy 0, policy_version 17750 (0.0008) +[2023-10-08 12:28:59,746][102897] Updated weights for policy 0, policy_version 17760 (0.0008) +[2023-10-08 12:29:00,785][102898] Updated weights for policy 1, policy_version 17770 (0.0009) +[2023-10-08 12:29:01,161][102898] Updated weights for policy 1, policy_version 17780 (0.0008) +[2023-10-08 12:29:01,528][102898] Updated weights for policy 1, policy_version 17790 (0.0008) +[2023-10-08 12:29:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 36405248. Throughput: 0: 1773.5, 1: 1791.2. Samples: 9108544. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:29:01,875][101941] Avg episode reward: [(0, '6.410'), (1, '6.440')] +[2023-10-08 12:29:03,568][102897] Updated weights for policy 0, policy_version 17770 (0.0008) +[2023-10-08 12:29:03,933][102897] Updated weights for policy 0, policy_version 17780 (0.0008) +[2023-10-08 12:29:04,309][102897] Updated weights for policy 0, policy_version 17790 (0.0007) +[2023-10-08 12:29:05,213][102898] Updated weights for policy 1, policy_version 17800 (0.0008) +[2023-10-08 12:29:05,584][102898] Updated weights for policy 1, policy_version 17810 (0.0009) +[2023-10-08 12:29:05,951][102898] Updated weights for policy 1, policy_version 17820 (0.0009) +[2023-10-08 12:29:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 36470784. Throughput: 0: 1774.8, 1: 1791.5. Samples: 9119662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:29:06,876][101941] Avg episode reward: [(0, '6.220'), (1, '6.820')] +[2023-10-08 12:29:08,106][102897] Updated weights for policy 0, policy_version 17800 (0.0008) +[2023-10-08 12:29:08,472][102897] Updated weights for policy 0, policy_version 17810 (0.0007) +[2023-10-08 12:29:08,846][102897] Updated weights for policy 0, policy_version 17820 (0.0008) +[2023-10-08 12:29:09,684][102898] Updated weights for policy 1, policy_version 17830 (0.0008) +[2023-10-08 12:29:10,053][102898] Updated weights for policy 1, policy_version 17840 (0.0009) +[2023-10-08 12:29:10,428][102898] Updated weights for policy 1, policy_version 17850 (0.0011) +[2023-10-08 12:29:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 36536320. Throughput: 0: 1775.2, 1: 1797.1. Samples: 9140798. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:29:11,876][101941] Avg episode reward: [(0, '5.910'), (1, '7.010')] +[2023-10-08 12:29:12,662][102897] Updated weights for policy 0, policy_version 17830 (0.0009) +[2023-10-08 12:29:13,034][102897] Updated weights for policy 0, policy_version 17840 (0.0009) +[2023-10-08 12:29:13,401][102897] Updated weights for policy 0, policy_version 17850 (0.0008) +[2023-10-08 12:29:14,086][102898] Updated weights for policy 1, policy_version 17860 (0.0008) +[2023-10-08 12:29:14,449][102898] Updated weights for policy 1, policy_version 17870 (0.0009) +[2023-10-08 12:29:14,822][102898] Updated weights for policy 1, policy_version 17880 (0.0009) +[2023-10-08 12:29:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 36601856. Throughput: 0: 1788.7, 1: 1794.3. Samples: 9163274. Policy #0 lag: (min: 1.0, avg: 12.3, max: 33.0) +[2023-10-08 12:29:16,876][101941] Avg episode reward: [(0, '5.770'), (1, '6.940')] +[2023-10-08 12:29:17,194][102897] Updated weights for policy 0, policy_version 17860 (0.0007) +[2023-10-08 12:29:17,569][102897] Updated weights for policy 0, policy_version 17870 (0.0009) +[2023-10-08 12:29:17,936][102897] Updated weights for policy 0, policy_version 17880 (0.0007) +[2023-10-08 12:29:18,475][102898] Updated weights for policy 1, policy_version 17890 (0.0010) +[2023-10-08 12:29:18,837][102898] Updated weights for policy 1, policy_version 17900 (0.0008) +[2023-10-08 12:29:19,202][102898] Updated weights for policy 1, policy_version 17910 (0.0010) +[2023-10-08 12:29:19,565][102898] Updated weights for policy 1, policy_version 17920 (0.0007) +[2023-10-08 12:29:21,702][102897] Updated weights for policy 0, policy_version 17890 (0.0007) +[2023-10-08 12:29:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 36667392. Throughput: 0: 1778.6, 1: 1801.6. Samples: 9173402. Policy #0 lag: (min: 1.0, avg: 12.3, max: 33.0) +[2023-10-08 12:29:21,876][101941] Avg episode reward: [(0, '6.460'), (1, '6.300')] +[2023-10-08 12:29:22,073][102897] Updated weights for policy 0, policy_version 17900 (0.0009) +[2023-10-08 12:29:22,444][102897] Updated weights for policy 0, policy_version 17910 (0.0008) +[2023-10-08 12:29:22,815][102897] Updated weights for policy 0, policy_version 17920 (0.0007) +[2023-10-08 12:29:23,291][102898] Updated weights for policy 1, policy_version 17930 (0.0009) +[2023-10-08 12:29:23,657][102898] Updated weights for policy 1, policy_version 17940 (0.0008) +[2023-10-08 12:29:24,034][102898] Updated weights for policy 1, policy_version 17950 (0.0009) +[2023-10-08 12:29:26,618][102897] Updated weights for policy 0, policy_version 17930 (0.0007) +[2023-10-08 12:29:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 36732928. Throughput: 0: 1777.8, 1: 1796.5. Samples: 9195294. Policy #0 lag: (min: 1.0, avg: 12.3, max: 33.0) +[2023-10-08 12:29:26,875][101941] Avg episode reward: [(0, '6.010'), (1, '6.100')] +[2023-10-08 12:29:27,003][102897] Updated weights for policy 0, policy_version 17940 (0.0009) +[2023-10-08 12:29:27,377][102897] Updated weights for policy 0, policy_version 17950 (0.0007) +[2023-10-08 12:29:27,891][102898] Updated weights for policy 1, policy_version 17960 (0.0010) +[2023-10-08 12:29:28,254][102898] Updated weights for policy 1, policy_version 17970 (0.0010) +[2023-10-08 12:29:28,618][102898] Updated weights for policy 1, policy_version 17980 (0.0008) +[2023-10-08 12:29:31,245][102897] Updated weights for policy 0, policy_version 17960 (0.0009) +[2023-10-08 12:29:31,619][102897] Updated weights for policy 0, policy_version 17970 (0.0008) +[2023-10-08 12:29:31,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 36798464. Throughput: 0: 1793.8, 1: 1789.1. Samples: 9216890. Policy #0 lag: (min: 19.0, avg: 25.3, max: 51.0) +[2023-10-08 12:29:31,876][101941] Avg episode reward: [(0, '5.750'), (1, '6.600')] +[2023-10-08 12:29:31,998][102897] Updated weights for policy 0, policy_version 17980 (0.0009) +[2023-10-08 12:29:32,408][102898] Updated weights for policy 1, policy_version 17990 (0.0007) +[2023-10-08 12:29:32,783][102898] Updated weights for policy 1, policy_version 18000 (0.0008) +[2023-10-08 12:29:33,157][102898] Updated weights for policy 1, policy_version 18010 (0.0009) +[2023-10-08 12:29:35,569][102897] Updated weights for policy 0, policy_version 17990 (0.0008) +[2023-10-08 12:29:35,935][102897] Updated weights for policy 0, policy_version 18000 (0.0008) +[2023-10-08 12:29:36,311][102897] Updated weights for policy 0, policy_version 18010 (0.0008) +[2023-10-08 12:29:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 36896768. Throughput: 0: 1773.5, 1: 1787.7. Samples: 9227140. Policy #0 lag: (min: 19.0, avg: 25.3, max: 51.0) +[2023-10-08 12:29:36,876][101941] Avg episode reward: [(0, '5.770'), (1, '6.870')] +[2023-10-08 12:29:36,959][102898] Updated weights for policy 1, policy_version 18020 (0.0007) +[2023-10-08 12:29:37,328][102898] Updated weights for policy 1, policy_version 18030 (0.0007) +[2023-10-08 12:29:37,697][102898] Updated weights for policy 1, policy_version 18040 (0.0009) +[2023-10-08 12:29:40,025][102897] Updated weights for policy 0, policy_version 18020 (0.0009) +[2023-10-08 12:29:40,408][102897] Updated weights for policy 0, policy_version 18030 (0.0008) +[2023-10-08 12:29:40,774][102897] Updated weights for policy 0, policy_version 18040 (0.0010) +[2023-10-08 12:29:41,570][102898] Updated weights for policy 1, policy_version 18050 (0.0009) +[2023-10-08 12:29:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 36962304. Throughput: 0: 1798.2, 1: 1790.6. Samples: 9248964. Policy #0 lag: (min: 9.0, avg: 15.7, max: 41.0) +[2023-10-08 12:29:41,876][101941] Avg episode reward: [(0, '6.120'), (1, '6.020')] +[2023-10-08 12:29:41,938][102898] Updated weights for policy 1, policy_version 18060 (0.0010) +[2023-10-08 12:29:42,304][102898] Updated weights for policy 1, policy_version 18070 (0.0008) +[2023-10-08 12:29:42,665][102898] Updated weights for policy 1, policy_version 18080 (0.0007) +[2023-10-08 12:29:44,515][102897] Updated weights for policy 0, policy_version 18050 (0.0009) +[2023-10-08 12:29:44,897][102897] Updated weights for policy 0, policy_version 18060 (0.0007) +[2023-10-08 12:29:45,267][102897] Updated weights for policy 0, policy_version 18070 (0.0008) +[2023-10-08 12:29:45,640][102897] Updated weights for policy 0, policy_version 18080 (0.0011) +[2023-10-08 12:29:46,582][102898] Updated weights for policy 1, policy_version 18090 (0.0007) +[2023-10-08 12:29:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 37027840. Throughput: 0: 1775.3, 1: 1814.6. Samples: 9270090. Policy #0 lag: (min: 9.0, avg: 15.7, max: 41.0) +[2023-10-08 12:29:46,876][101941] Avg episode reward: [(0, '6.610'), (1, '6.340')] +[2023-10-08 12:29:46,950][102898] Updated weights for policy 1, policy_version 18100 (0.0007) +[2023-10-08 12:29:47,317][102898] Updated weights for policy 1, policy_version 18110 (0.0007) +[2023-10-08 12:29:49,498][102897] Updated weights for policy 0, policy_version 18090 (0.0007) +[2023-10-08 12:29:49,873][102897] Updated weights for policy 0, policy_version 18100 (0.0008) +[2023-10-08 12:29:50,237][102897] Updated weights for policy 0, policy_version 18110 (0.0008) +[2023-10-08 12:29:51,056][102898] Updated weights for policy 1, policy_version 18120 (0.0009) +[2023-10-08 12:29:51,421][102898] Updated weights for policy 1, policy_version 18130 (0.0010) +[2023-10-08 12:29:51,796][102898] Updated weights for policy 1, policy_version 18140 (0.0009) +[2023-10-08 12:29:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 37093376. Throughput: 0: 1803.5, 1: 1788.1. Samples: 9281284. Policy #0 lag: (min: 9.0, avg: 15.7, max: 41.0) +[2023-10-08 12:29:51,876][101941] Avg episode reward: [(0, '6.060'), (1, '6.560')] +[2023-10-08 12:29:53,958][102897] Updated weights for policy 0, policy_version 18120 (0.0010) +[2023-10-08 12:29:54,322][102897] Updated weights for policy 0, policy_version 18130 (0.0010) +[2023-10-08 12:29:54,705][102897] Updated weights for policy 0, policy_version 18140 (0.0008) +[2023-10-08 12:29:55,549][102898] Updated weights for policy 1, policy_version 18150 (0.0007) +[2023-10-08 12:29:55,923][102898] Updated weights for policy 1, policy_version 18160 (0.0008) +[2023-10-08 12:29:56,294][102898] Updated weights for policy 1, policy_version 18170 (0.0007) +[2023-10-08 12:29:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 37191680. Throughput: 0: 1781.2, 1: 1808.3. Samples: 9302324. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:29:56,876][101941] Avg episode reward: [(0, '5.750'), (1, '5.780')] +[2023-10-08 12:29:58,552][102897] Updated weights for policy 0, policy_version 18150 (0.0007) +[2023-10-08 12:29:58,925][102897] Updated weights for policy 0, policy_version 18160 (0.0008) +[2023-10-08 12:29:59,291][102897] Updated weights for policy 0, policy_version 18170 (0.0010) +[2023-10-08 12:30:00,111][102898] Updated weights for policy 1, policy_version 18180 (0.0008) +[2023-10-08 12:30:00,479][102898] Updated weights for policy 1, policy_version 18190 (0.0008) +[2023-10-08 12:30:00,844][102898] Updated weights for policy 1, policy_version 18200 (0.0008) +[2023-10-08 12:30:01,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 37257216. Throughput: 0: 1778.1, 1: 1776.8. Samples: 9323244. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:30:01,876][101941] Avg episode reward: [(0, '6.010'), (1, '5.720')] +[2023-10-08 12:30:03,088][102897] Updated weights for policy 0, policy_version 18180 (0.0008) +[2023-10-08 12:30:03,478][102897] Updated weights for policy 0, policy_version 18190 (0.0009) +[2023-10-08 12:30:03,840][102897] Updated weights for policy 0, policy_version 18200 (0.0009) +[2023-10-08 12:30:04,646][102898] Updated weights for policy 1, policy_version 18210 (0.0008) +[2023-10-08 12:30:05,011][102898] Updated weights for policy 1, policy_version 18220 (0.0010) +[2023-10-08 12:30:05,388][102898] Updated weights for policy 1, policy_version 18230 (0.0010) +[2023-10-08 12:30:05,740][102898] Updated weights for policy 1, policy_version 18240 (0.0010) +[2023-10-08 12:30:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 37322752. Throughput: 0: 1775.4, 1: 1798.3. Samples: 9334220. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:30:06,876][101941] Avg episode reward: [(0, '6.270'), (1, '6.270')] +[2023-10-08 12:30:07,729][102897] Updated weights for policy 0, policy_version 18210 (0.0009) +[2023-10-08 12:30:08,098][102897] Updated weights for policy 0, policy_version 18220 (0.0008) +[2023-10-08 12:30:08,477][102897] Updated weights for policy 0, policy_version 18230 (0.0009) +[2023-10-08 12:30:08,846][102897] Updated weights for policy 0, policy_version 18240 (0.0007) +[2023-10-08 12:30:09,320][102898] Updated weights for policy 1, policy_version 18250 (0.0007) +[2023-10-08 12:30:09,683][102898] Updated weights for policy 1, policy_version 18260 (0.0007) +[2023-10-08 12:30:10,057][102898] Updated weights for policy 1, policy_version 18270 (0.0007) +[2023-10-08 12:30:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 37388288. Throughput: 0: 1775.6, 1: 1775.5. Samples: 9355092. Policy #0 lag: (min: 0.0, avg: 28.0, max: 32.0) +[2023-10-08 12:30:11,876][101941] Avg episode reward: [(0, '7.290'), (1, '6.620')] +[2023-10-08 12:30:11,877][102634] Saving new best policy, reward=7.290! +[2023-10-08 12:30:12,716][102897] Updated weights for policy 0, policy_version 18250 (0.0007) +[2023-10-08 12:30:13,084][102897] Updated weights for policy 0, policy_version 18260 (0.0007) +[2023-10-08 12:30:13,459][102897] Updated weights for policy 0, policy_version 18270 (0.0008) +[2023-10-08 12:30:13,901][102898] Updated weights for policy 1, policy_version 18280 (0.0010) +[2023-10-08 12:30:14,269][102898] Updated weights for policy 1, policy_version 18290 (0.0009) +[2023-10-08 12:30:14,638][102898] Updated weights for policy 1, policy_version 18300 (0.0008) +[2023-10-08 12:30:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 37453824. Throughput: 0: 1792.4, 1: 1775.2. Samples: 9377434. Policy #0 lag: (min: 0.0, avg: 28.0, max: 32.0) +[2023-10-08 12:30:16,876][101941] Avg episode reward: [(0, '7.230'), (1, '6.750')] +[2023-10-08 12:30:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000018304_18743296.pth... +[2023-10-08 12:30:16,916][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000016640_17039360.pth +[2023-10-08 12:30:17,095][102897] Updated weights for policy 0, policy_version 18280 (0.0010) +[2023-10-08 12:30:17,474][102897] Updated weights for policy 0, policy_version 18290 (0.0010) +[2023-10-08 12:30:17,849][102897] Updated weights for policy 0, policy_version 18300 (0.0008) +[2023-10-08 12:30:17,989][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000018304_18743296.pth... +[2023-10-08 12:30:18,018][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000016608_17006592.pth +[2023-10-08 12:30:18,382][102898] Updated weights for policy 1, policy_version 18310 (0.0009) +[2023-10-08 12:30:18,754][102898] Updated weights for policy 1, policy_version 18320 (0.0009) +[2023-10-08 12:30:19,120][102898] Updated weights for policy 1, policy_version 18330 (0.0008) +[2023-10-08 12:30:21,583][102897] Updated weights for policy 0, policy_version 18310 (0.0009) +[2023-10-08 12:30:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 37519360. Throughput: 0: 1774.6, 1: 1779.4. Samples: 9387070. Policy #0 lag: (min: 0.0, avg: 28.0, max: 32.0) +[2023-10-08 12:30:21,875][101941] Avg episode reward: [(0, '6.430'), (1, '6.770')] +[2023-10-08 12:30:21,949][102897] Updated weights for policy 0, policy_version 18320 (0.0009) +[2023-10-08 12:30:22,317][102897] Updated weights for policy 0, policy_version 18330 (0.0008) +[2023-10-08 12:30:23,061][102898] Updated weights for policy 1, policy_version 18340 (0.0007) +[2023-10-08 12:30:23,433][102898] Updated weights for policy 1, policy_version 18350 (0.0008) +[2023-10-08 12:30:23,800][102898] Updated weights for policy 1, policy_version 18360 (0.0009) +[2023-10-08 12:30:26,075][102897] Updated weights for policy 0, policy_version 18340 (0.0011) +[2023-10-08 12:30:26,447][102897] Updated weights for policy 0, policy_version 18350 (0.0008) +[2023-10-08 12:30:26,819][102897] Updated weights for policy 0, policy_version 18360 (0.0008) +[2023-10-08 12:30:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 37584896. Throughput: 0: 1788.7, 1: 1769.0. Samples: 9409062. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:30:26,875][101941] Avg episode reward: [(0, '6.030'), (1, '6.840')] +[2023-10-08 12:30:27,628][102898] Updated weights for policy 1, policy_version 18370 (0.0009) +[2023-10-08 12:30:27,991][102898] Updated weights for policy 1, policy_version 18380 (0.0009) +[2023-10-08 12:30:28,364][102898] Updated weights for policy 1, policy_version 18390 (0.0009) +[2023-10-08 12:30:28,740][102898] Updated weights for policy 1, policy_version 18400 (0.0010) +[2023-10-08 12:30:30,516][102897] Updated weights for policy 0, policy_version 18370 (0.0010) +[2023-10-08 12:30:30,924][102897] Updated weights for policy 0, policy_version 18380 (0.0009) +[2023-10-08 12:30:31,292][102897] Updated weights for policy 0, policy_version 18390 (0.0009) +[2023-10-08 12:30:31,668][102897] Updated weights for policy 0, policy_version 18400 (0.0010) +[2023-10-08 12:30:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 37683200. Throughput: 0: 1781.5, 1: 1772.3. Samples: 9430010. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:30:31,875][101941] Avg episode reward: [(0, '6.910'), (1, '6.450')] +[2023-10-08 12:30:32,734][102898] Updated weights for policy 1, policy_version 18410 (0.0009) +[2023-10-08 12:30:33,104][102898] Updated weights for policy 1, policy_version 18420 (0.0008) +[2023-10-08 12:30:33,473][102898] Updated weights for policy 1, policy_version 18430 (0.0007) +[2023-10-08 12:30:35,389][102897] Updated weights for policy 0, policy_version 18410 (0.0008) +[2023-10-08 12:30:35,762][102897] Updated weights for policy 0, policy_version 18420 (0.0009) +[2023-10-08 12:30:36,133][102897] Updated weights for policy 0, policy_version 18430 (0.0007) +[2023-10-08 12:30:36,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 37748736. Throughput: 0: 1777.8, 1: 1766.1. Samples: 9440758. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 12:30:36,876][101941] Avg episode reward: [(0, '6.130'), (1, '6.400')] +[2023-10-08 12:30:37,123][102898] Updated weights for policy 1, policy_version 18440 (0.0007) +[2023-10-08 12:30:37,485][102898] Updated weights for policy 1, policy_version 18450 (0.0008) +[2023-10-08 12:30:37,856][102898] Updated weights for policy 1, policy_version 18460 (0.0008) +[2023-10-08 12:30:39,819][102897] Updated weights for policy 0, policy_version 18440 (0.0009) +[2023-10-08 12:30:40,194][102897] Updated weights for policy 0, policy_version 18450 (0.0008) +[2023-10-08 12:30:40,566][102897] Updated weights for policy 0, policy_version 18460 (0.0009) +[2023-10-08 12:30:41,644][102898] Updated weights for policy 1, policy_version 18470 (0.0009) +[2023-10-08 12:30:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 37814272. Throughput: 0: 1781.8, 1: 1772.8. Samples: 9462282. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:30:41,876][101941] Avg episode reward: [(0, '5.570'), (1, '6.700')] +[2023-10-08 12:30:42,014][102898] Updated weights for policy 1, policy_version 18480 (0.0007) +[2023-10-08 12:30:42,376][102898] Updated weights for policy 1, policy_version 18490 (0.0010) +[2023-10-08 12:30:44,258][102897] Updated weights for policy 0, policy_version 18470 (0.0009) +[2023-10-08 12:30:44,633][102897] Updated weights for policy 0, policy_version 18480 (0.0008) +[2023-10-08 12:30:45,000][102897] Updated weights for policy 0, policy_version 18490 (0.0008) +[2023-10-08 12:30:46,190][102898] Updated weights for policy 1, policy_version 18500 (0.0007) +[2023-10-08 12:30:46,559][102898] Updated weights for policy 1, policy_version 18510 (0.0008) +[2023-10-08 12:30:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 37879808. Throughput: 0: 1778.0, 1: 1788.7. Samples: 9483746. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:30:46,876][101941] Avg episode reward: [(0, '5.470'), (1, '6.510')] +[2023-10-08 12:30:46,924][102898] Updated weights for policy 1, policy_version 18520 (0.0007) +[2023-10-08 12:30:48,777][102897] Updated weights for policy 0, policy_version 18500 (0.0008) +[2023-10-08 12:30:49,150][102897] Updated weights for policy 0, policy_version 18510 (0.0009) +[2023-10-08 12:30:49,519][102897] Updated weights for policy 0, policy_version 18520 (0.0008) +[2023-10-08 12:30:50,672][102898] Updated weights for policy 1, policy_version 18530 (0.0007) +[2023-10-08 12:30:51,042][102898] Updated weights for policy 1, policy_version 18540 (0.0008) +[2023-10-08 12:30:51,416][102898] Updated weights for policy 1, policy_version 18550 (0.0009) +[2023-10-08 12:30:51,785][102898] Updated weights for policy 1, policy_version 18560 (0.0007) +[2023-10-08 12:30:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 37978112. Throughput: 0: 1795.9, 1: 1768.1. Samples: 9494600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:30:51,876][101941] Avg episode reward: [(0, '6.040'), (1, '6.310')] +[2023-10-08 12:30:53,345][102897] Updated weights for policy 0, policy_version 18530 (0.0008) +[2023-10-08 12:30:53,711][102897] Updated weights for policy 0, policy_version 18540 (0.0008) +[2023-10-08 12:30:54,090][102897] Updated weights for policy 0, policy_version 18550 (0.0010) +[2023-10-08 12:30:54,461][102897] Updated weights for policy 0, policy_version 18560 (0.0009) +[2023-10-08 12:30:55,548][102898] Updated weights for policy 1, policy_version 18570 (0.0009) +[2023-10-08 12:30:55,922][102898] Updated weights for policy 1, policy_version 18580 (0.0008) +[2023-10-08 12:30:56,291][102898] Updated weights for policy 1, policy_version 18590 (0.0008) +[2023-10-08 12:30:56,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 38043648. Throughput: 0: 1784.6, 1: 1790.1. Samples: 9515954. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:30:56,876][101941] Avg episode reward: [(0, '6.020'), (1, '6.190')] +[2023-10-08 12:30:58,246][102897] Updated weights for policy 0, policy_version 18570 (0.0007) +[2023-10-08 12:30:58,618][102897] Updated weights for policy 0, policy_version 18580 (0.0008) +[2023-10-08 12:30:59,006][102897] Updated weights for policy 0, policy_version 18590 (0.0010) +[2023-10-08 12:31:00,133][102898] Updated weights for policy 1, policy_version 18600 (0.0008) +[2023-10-08 12:31:00,501][102898] Updated weights for policy 1, policy_version 18610 (0.0009) +[2023-10-08 12:31:00,881][102898] Updated weights for policy 1, policy_version 18620 (0.0008) +[2023-10-08 12:31:01,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 38109184. Throughput: 0: 1784.3, 1: 1770.2. Samples: 9537386. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:01,877][101941] Avg episode reward: [(0, '5.580'), (1, '6.440')] +[2023-10-08 12:31:02,587][102897] Updated weights for policy 0, policy_version 18600 (0.0009) +[2023-10-08 12:31:02,971][102897] Updated weights for policy 0, policy_version 18610 (0.0007) +[2023-10-08 12:31:03,335][102897] Updated weights for policy 0, policy_version 18620 (0.0009) +[2023-10-08 12:31:04,598][102898] Updated weights for policy 1, policy_version 18630 (0.0008) +[2023-10-08 12:31:04,969][102898] Updated weights for policy 1, policy_version 18640 (0.0007) +[2023-10-08 12:31:05,331][102898] Updated weights for policy 1, policy_version 18650 (0.0007) +[2023-10-08 12:31:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 38174720. Throughput: 0: 1784.7, 1: 1799.7. Samples: 9548370. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:06,876][101941] Avg episode reward: [(0, '5.760'), (1, '6.440')] +[2023-10-08 12:31:07,262][102897] Updated weights for policy 0, policy_version 18630 (0.0009) +[2023-10-08 12:31:07,634][102897] Updated weights for policy 0, policy_version 18640 (0.0011) +[2023-10-08 12:31:08,013][102897] Updated weights for policy 0, policy_version 18650 (0.0009) +[2023-10-08 12:31:08,904][102898] Updated weights for policy 1, policy_version 18660 (0.0007) +[2023-10-08 12:31:09,276][102898] Updated weights for policy 1, policy_version 18670 (0.0008) +[2023-10-08 12:31:09,653][102898] Updated weights for policy 1, policy_version 18680 (0.0008) +[2023-10-08 12:31:11,814][102897] Updated weights for policy 0, policy_version 18660 (0.0009) +[2023-10-08 12:31:11,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 38240256. Throughput: 0: 1777.9, 1: 1784.8. Samples: 9569382. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:11,876][101941] Avg episode reward: [(0, '6.300'), (1, '6.360')] +[2023-10-08 12:31:12,184][102897] Updated weights for policy 0, policy_version 18670 (0.0008) +[2023-10-08 12:31:12,558][102897] Updated weights for policy 0, policy_version 18680 (0.0008) +[2023-10-08 12:31:13,343][102898] Updated weights for policy 1, policy_version 18690 (0.0009) +[2023-10-08 12:31:13,718][102898] Updated weights for policy 1, policy_version 18700 (0.0008) +[2023-10-08 12:31:14,094][102898] Updated weights for policy 1, policy_version 18710 (0.0010) +[2023-10-08 12:31:14,462][102898] Updated weights for policy 1, policy_version 18720 (0.0008) +[2023-10-08 12:31:16,432][102897] Updated weights for policy 0, policy_version 18690 (0.0008) +[2023-10-08 12:31:16,820][102897] Updated weights for policy 0, policy_version 18700 (0.0007) +[2023-10-08 12:31:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 38305792. Throughput: 0: 1797.7, 1: 1790.1. Samples: 9591464. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:16,875][101941] Avg episode reward: [(0, '6.570'), (1, '6.530')] +[2023-10-08 12:31:17,192][102897] Updated weights for policy 0, policy_version 18710 (0.0007) +[2023-10-08 12:31:17,570][102897] Updated weights for policy 0, policy_version 18720 (0.0009) +[2023-10-08 12:31:18,259][102898] Updated weights for policy 1, policy_version 18730 (0.0010) +[2023-10-08 12:31:18,627][102898] Updated weights for policy 1, policy_version 18740 (0.0010) +[2023-10-08 12:31:18,993][102898] Updated weights for policy 1, policy_version 18750 (0.0010) +[2023-10-08 12:31:21,334][102897] Updated weights for policy 0, policy_version 18730 (0.0010) +[2023-10-08 12:31:21,709][102897] Updated weights for policy 0, policy_version 18740 (0.0010) +[2023-10-08 12:31:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 38371328. Throughput: 0: 1776.5, 1: 1789.6. Samples: 9601230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:21,876][101941] Avg episode reward: [(0, '5.910'), (1, '6.740')] +[2023-10-08 12:31:22,084][102897] Updated weights for policy 0, policy_version 18750 (0.0009) +[2023-10-08 12:31:22,715][102898] Updated weights for policy 1, policy_version 18760 (0.0009) +[2023-10-08 12:31:23,076][102898] Updated weights for policy 1, policy_version 18770 (0.0007) +[2023-10-08 12:31:23,449][102898] Updated weights for policy 1, policy_version 18780 (0.0008) +[2023-10-08 12:31:25,971][102897] Updated weights for policy 0, policy_version 18760 (0.0007) +[2023-10-08 12:31:26,343][102897] Updated weights for policy 0, policy_version 18770 (0.0009) +[2023-10-08 12:31:26,726][102897] Updated weights for policy 0, policy_version 18780 (0.0009) +[2023-10-08 12:31:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 38469632. Throughput: 0: 1791.6, 1: 1792.5. Samples: 9623566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:26,875][101941] Avg episode reward: [(0, '5.930'), (1, '6.180')] +[2023-10-08 12:31:27,104][102898] Updated weights for policy 1, policy_version 18790 (0.0007) +[2023-10-08 12:31:27,468][102898] Updated weights for policy 1, policy_version 18800 (0.0010) +[2023-10-08 12:31:27,847][102898] Updated weights for policy 1, policy_version 18810 (0.0011) +[2023-10-08 12:31:30,492][102897] Updated weights for policy 0, policy_version 18790 (0.0009) +[2023-10-08 12:31:30,865][102897] Updated weights for policy 0, policy_version 18800 (0.0008) +[2023-10-08 12:31:31,242][102897] Updated weights for policy 0, policy_version 18810 (0.0010) +[2023-10-08 12:31:31,700][102898] Updated weights for policy 1, policy_version 18820 (0.0009) +[2023-10-08 12:31:31,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 38535168. Throughput: 0: 1767.8, 1: 1808.3. Samples: 9644672. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:31,876][101941] Avg episode reward: [(0, '5.900'), (1, '6.720')] +[2023-10-08 12:31:32,065][102898] Updated weights for policy 1, policy_version 18830 (0.0009) +[2023-10-08 12:31:32,438][102898] Updated weights for policy 1, policy_version 18840 (0.0007) +[2023-10-08 12:31:35,016][102897] Updated weights for policy 0, policy_version 18820 (0.0010) +[2023-10-08 12:31:35,387][102897] Updated weights for policy 0, policy_version 18830 (0.0008) +[2023-10-08 12:31:35,764][102897] Updated weights for policy 0, policy_version 18840 (0.0009) +[2023-10-08 12:31:36,211][102898] Updated weights for policy 1, policy_version 18850 (0.0007) +[2023-10-08 12:31:36,573][102898] Updated weights for policy 1, policy_version 18860 (0.0008) +[2023-10-08 12:31:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 38600704. Throughput: 0: 1785.4, 1: 1798.5. Samples: 9655878. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:36,876][101941] Avg episode reward: [(0, '5.780'), (1, '6.900')] +[2023-10-08 12:31:36,946][102898] Updated weights for policy 1, policy_version 18870 (0.0011) +[2023-10-08 12:31:37,319][102898] Updated weights for policy 1, policy_version 18880 (0.0007) +[2023-10-08 12:31:39,552][102897] Updated weights for policy 0, policy_version 18850 (0.0009) +[2023-10-08 12:31:39,928][102897] Updated weights for policy 0, policy_version 18860 (0.0008) +[2023-10-08 12:31:40,306][102897] Updated weights for policy 0, policy_version 18870 (0.0008) +[2023-10-08 12:31:40,678][102897] Updated weights for policy 0, policy_version 18880 (0.0008) +[2023-10-08 12:31:41,091][102898] Updated weights for policy 1, policy_version 18890 (0.0010) +[2023-10-08 12:31:41,463][102898] Updated weights for policy 1, policy_version 18900 (0.0011) +[2023-10-08 12:31:41,828][102898] Updated weights for policy 1, policy_version 18910 (0.0007) +[2023-10-08 12:31:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 38666240. Throughput: 0: 1775.2, 1: 1805.8. Samples: 9677096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:41,876][101941] Avg episode reward: [(0, '6.100'), (1, '6.090')] +[2023-10-08 12:31:44,410][102897] Updated weights for policy 0, policy_version 18890 (0.0011) +[2023-10-08 12:31:44,781][102897] Updated weights for policy 0, policy_version 18900 (0.0008) +[2023-10-08 12:31:45,146][102897] Updated weights for policy 0, policy_version 18910 (0.0008) +[2023-10-08 12:31:45,454][102898] Updated weights for policy 1, policy_version 18920 (0.0009) +[2023-10-08 12:31:45,831][102898] Updated weights for policy 1, policy_version 18930 (0.0010) +[2023-10-08 12:31:46,203][102898] Updated weights for policy 1, policy_version 18940 (0.0011) +[2023-10-08 12:31:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 38764544. Throughput: 0: 1765.0, 1: 1800.0. Samples: 9697808. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:46,876][101941] Avg episode reward: [(0, '6.130'), (1, '5.960')] +[2023-10-08 12:31:49,150][102897] Updated weights for policy 0, policy_version 18920 (0.0007) +[2023-10-08 12:31:49,522][102897] Updated weights for policy 0, policy_version 18930 (0.0008) +[2023-10-08 12:31:49,893][102897] Updated weights for policy 0, policy_version 18940 (0.0008) +[2023-10-08 12:31:50,073][102898] Updated weights for policy 1, policy_version 18950 (0.0008) +[2023-10-08 12:31:50,452][102898] Updated weights for policy 1, policy_version 18960 (0.0010) +[2023-10-08 12:31:50,809][102898] Updated weights for policy 1, policy_version 18970 (0.0009) +[2023-10-08 12:31:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 38830080. Throughput: 0: 1784.1, 1: 1800.2. Samples: 9709666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:31:51,876][101941] Avg episode reward: [(0, '6.070'), (1, '6.360')] +[2023-10-08 12:31:53,569][102897] Updated weights for policy 0, policy_version 18950 (0.0008) +[2023-10-08 12:31:53,945][102897] Updated weights for policy 0, policy_version 18960 (0.0009) +[2023-10-08 12:31:54,316][102897] Updated weights for policy 0, policy_version 18970 (0.0007) +[2023-10-08 12:31:54,564][102898] Updated weights for policy 1, policy_version 18980 (0.0007) +[2023-10-08 12:31:54,927][102898] Updated weights for policy 1, policy_version 18990 (0.0009) +[2023-10-08 12:31:55,293][102898] Updated weights for policy 1, policy_version 19000 (0.0007) +[2023-10-08 12:31:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 38895616. Throughput: 0: 1774.6, 1: 1796.4. Samples: 9730078. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:31:56,876][101941] Avg episode reward: [(0, '6.170'), (1, '6.510')] +[2023-10-08 12:31:57,933][102897] Updated weights for policy 0, policy_version 18980 (0.0008) +[2023-10-08 12:31:58,303][102897] Updated weights for policy 0, policy_version 18990 (0.0007) +[2023-10-08 12:31:58,677][102897] Updated weights for policy 0, policy_version 19000 (0.0007) +[2023-10-08 12:31:59,010][102898] Updated weights for policy 1, policy_version 19010 (0.0010) +[2023-10-08 12:31:59,383][102898] Updated weights for policy 1, policy_version 19020 (0.0011) +[2023-10-08 12:31:59,745][102898] Updated weights for policy 1, policy_version 19030 (0.0010) +[2023-10-08 12:32:00,114][102898] Updated weights for policy 1, policy_version 19040 (0.0011) +[2023-10-08 12:32:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 38961152. Throughput: 0: 1792.3, 1: 1786.3. Samples: 9752502. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:32:01,876][101941] Avg episode reward: [(0, '5.520'), (1, '6.210')] +[2023-10-08 12:32:02,423][102897] Updated weights for policy 0, policy_version 19010 (0.0008) +[2023-10-08 12:32:02,828][102897] Updated weights for policy 0, policy_version 19020 (0.0009) +[2023-10-08 12:32:03,202][102897] Updated weights for policy 0, policy_version 19030 (0.0008) +[2023-10-08 12:32:03,569][102897] Updated weights for policy 0, policy_version 19040 (0.0008) +[2023-10-08 12:32:03,959][102898] Updated weights for policy 1, policy_version 19050 (0.0008) +[2023-10-08 12:32:04,327][102898] Updated weights for policy 1, policy_version 19060 (0.0008) +[2023-10-08 12:32:04,687][102898] Updated weights for policy 1, policy_version 19070 (0.0008) +[2023-10-08 12:32:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 39026688. Throughput: 0: 1786.7, 1: 1797.2. Samples: 9762508. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:32:06,875][101941] Avg episode reward: [(0, '5.700'), (1, '6.640')] +[2023-10-08 12:32:07,323][102897] Updated weights for policy 0, policy_version 19050 (0.0009) +[2023-10-08 12:32:07,698][102897] Updated weights for policy 0, policy_version 19060 (0.0007) +[2023-10-08 12:32:08,077][102897] Updated weights for policy 0, policy_version 19070 (0.0008) +[2023-10-08 12:32:08,641][102898] Updated weights for policy 1, policy_version 19080 (0.0009) +[2023-10-08 12:32:09,006][102898] Updated weights for policy 1, policy_version 19090 (0.0007) +[2023-10-08 12:32:09,382][102898] Updated weights for policy 1, policy_version 19100 (0.0008) +[2023-10-08 12:32:11,696][102897] Updated weights for policy 0, policy_version 19080 (0.0009) +[2023-10-08 12:32:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 39092224. Throughput: 0: 1796.7, 1: 1777.0. Samples: 9784382. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:32:11,875][101941] Avg episode reward: [(0, '6.680'), (1, '6.770')] +[2023-10-08 12:32:12,081][102897] Updated weights for policy 0, policy_version 19090 (0.0009) +[2023-10-08 12:32:12,454][102897] Updated weights for policy 0, policy_version 19100 (0.0008) +[2023-10-08 12:32:13,110][102898] Updated weights for policy 1, policy_version 19110 (0.0010) +[2023-10-08 12:32:13,478][102898] Updated weights for policy 1, policy_version 19120 (0.0007) +[2023-10-08 12:32:13,837][102898] Updated weights for policy 1, policy_version 19130 (0.0007) +[2023-10-08 12:32:16,103][102897] Updated weights for policy 0, policy_version 19110 (0.0009) +[2023-10-08 12:32:16,485][102897] Updated weights for policy 0, policy_version 19120 (0.0011) +[2023-10-08 12:32:16,847][102897] Updated weights for policy 0, policy_version 19130 (0.0007) +[2023-10-08 12:32:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 39157760. Throughput: 0: 1816.9, 1: 1779.4. Samples: 9806502. Policy #0 lag: (min: 26.0, avg: 30.2, max: 57.0) +[2023-10-08 12:32:16,876][101941] Avg episode reward: [(0, '6.640'), (1, '6.600')] +[2023-10-08 12:32:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000019136_19595264.pth... +[2023-10-08 12:32:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000017472_17891328.pth +[2023-10-08 12:32:17,069][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000019136_19595264.pth... +[2023-10-08 12:32:17,099][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000017440_17858560.pth +[2023-10-08 12:32:17,543][102898] Updated weights for policy 1, policy_version 19140 (0.0008) +[2023-10-08 12:32:17,914][102898] Updated weights for policy 1, policy_version 19150 (0.0009) +[2023-10-08 12:32:18,270][102898] Updated weights for policy 1, policy_version 19160 (0.0010) +[2023-10-08 12:32:20,595][102897] Updated weights for policy 0, policy_version 19140 (0.0008) +[2023-10-08 12:32:20,975][102897] Updated weights for policy 0, policy_version 19150 (0.0007) +[2023-10-08 12:32:21,345][102897] Updated weights for policy 0, policy_version 19160 (0.0007) +[2023-10-08 12:32:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 39256064. Throughput: 0: 1798.6, 1: 1775.6. Samples: 9816720. Policy #0 lag: (min: 26.0, avg: 30.2, max: 57.0) +[2023-10-08 12:32:21,876][101941] Avg episode reward: [(0, '7.270'), (1, '6.580')] +[2023-10-08 12:32:22,251][102898] Updated weights for policy 1, policy_version 19170 (0.0010) +[2023-10-08 12:32:22,628][102898] Updated weights for policy 1, policy_version 19180 (0.0008) +[2023-10-08 12:32:23,002][102898] Updated weights for policy 1, policy_version 19190 (0.0009) +[2023-10-08 12:32:23,373][102898] Updated weights for policy 1, policy_version 19200 (0.0008) +[2023-10-08 12:32:25,108][102897] Updated weights for policy 0, policy_version 19170 (0.0009) +[2023-10-08 12:32:25,483][102897] Updated weights for policy 0, policy_version 19180 (0.0009) +[2023-10-08 12:32:25,859][102897] Updated weights for policy 0, policy_version 19190 (0.0011) +[2023-10-08 12:32:26,228][102897] Updated weights for policy 0, policy_version 19200 (0.0008) +[2023-10-08 12:32:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 39321600. Throughput: 0: 1815.8, 1: 1776.8. Samples: 9838760. Policy #0 lag: (min: 26.0, avg: 30.2, max: 57.0) +[2023-10-08 12:32:26,875][101941] Avg episode reward: [(0, '7.070'), (1, '6.660')] +[2023-10-08 12:32:27,078][102898] Updated weights for policy 1, policy_version 19210 (0.0011) +[2023-10-08 12:32:27,440][102898] Updated weights for policy 1, policy_version 19220 (0.0010) +[2023-10-08 12:32:27,807][102898] Updated weights for policy 1, policy_version 19230 (0.0010) +[2023-10-08 12:32:29,971][102897] Updated weights for policy 0, policy_version 19210 (0.0008) +[2023-10-08 12:32:30,340][102897] Updated weights for policy 0, policy_version 19220 (0.0008) +[2023-10-08 12:32:30,725][102897] Updated weights for policy 0, policy_version 19230 (0.0008) +[2023-10-08 12:32:31,453][102898] Updated weights for policy 1, policy_version 19240 (0.0011) +[2023-10-08 12:32:31,820][102898] Updated weights for policy 1, policy_version 19250 (0.0009) +[2023-10-08 12:32:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 39387136. Throughput: 0: 1801.6, 1: 1798.6. Samples: 9859818. Policy #0 lag: (min: 26.0, avg: 44.7, max: 58.0) +[2023-10-08 12:32:31,876][101941] Avg episode reward: [(0, '6.360'), (1, '6.630')] +[2023-10-08 12:32:32,195][102898] Updated weights for policy 1, policy_version 19260 (0.0008) +[2023-10-08 12:32:34,286][102897] Updated weights for policy 0, policy_version 19240 (0.0008) +[2023-10-08 12:32:34,669][102897] Updated weights for policy 0, policy_version 19250 (0.0009) +[2023-10-08 12:32:35,038][102897] Updated weights for policy 0, policy_version 19260 (0.0009) +[2023-10-08 12:32:36,030][102898] Updated weights for policy 1, policy_version 19270 (0.0008) +[2023-10-08 12:32:36,397][102898] Updated weights for policy 1, policy_version 19280 (0.0007) +[2023-10-08 12:32:36,760][102898] Updated weights for policy 1, policy_version 19290 (0.0008) +[2023-10-08 12:32:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 39452672. Throughput: 0: 1814.1, 1: 1777.7. Samples: 9871292. Policy #0 lag: (min: 26.0, avg: 44.7, max: 58.0) +[2023-10-08 12:32:36,875][101941] Avg episode reward: [(0, '6.190'), (1, '7.080')] +[2023-10-08 12:32:36,979][102760] Saving new best policy, reward=7.080! +[2023-10-08 12:32:38,708][102897] Updated weights for policy 0, policy_version 19270 (0.0009) +[2023-10-08 12:32:39,074][102897] Updated weights for policy 0, policy_version 19280 (0.0010) +[2023-10-08 12:32:39,447][102897] Updated weights for policy 0, policy_version 19290 (0.0010) +[2023-10-08 12:32:40,390][102898] Updated weights for policy 1, policy_version 19300 (0.0010) +[2023-10-08 12:32:40,761][102898] Updated weights for policy 1, policy_version 19310 (0.0007) +[2023-10-08 12:32:41,125][102898] Updated weights for policy 1, policy_version 19320 (0.0008) +[2023-10-08 12:32:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 39550976. Throughput: 0: 1804.8, 1: 1804.3. Samples: 9892488. Policy #0 lag: (min: 26.0, avg: 44.7, max: 58.0) +[2023-10-08 12:32:41,876][101941] Avg episode reward: [(0, '5.890'), (1, '6.650')] +[2023-10-08 12:32:43,236][102897] Updated weights for policy 0, policy_version 19300 (0.0008) +[2023-10-08 12:32:43,599][102897] Updated weights for policy 0, policy_version 19310 (0.0009) +[2023-10-08 12:32:43,980][102897] Updated weights for policy 0, policy_version 19320 (0.0007) +[2023-10-08 12:32:44,938][102898] Updated weights for policy 1, policy_version 19330 (0.0007) +[2023-10-08 12:32:45,304][102898] Updated weights for policy 1, policy_version 19340 (0.0010) +[2023-10-08 12:32:45,670][102898] Updated weights for policy 1, policy_version 19350 (0.0010) +[2023-10-08 12:32:46,046][102898] Updated weights for policy 1, policy_version 19360 (0.0009) +[2023-10-08 12:32:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 39616512. Throughput: 0: 1799.6, 1: 1782.2. Samples: 9913684. Policy #0 lag: (min: 26.0, avg: 44.7, max: 58.0) +[2023-10-08 12:32:46,876][101941] Avg episode reward: [(0, '5.480'), (1, '6.000')] +[2023-10-08 12:32:47,671][102897] Updated weights for policy 0, policy_version 19330 (0.0007) +[2023-10-08 12:32:48,047][102897] Updated weights for policy 0, policy_version 19340 (0.0007) +[2023-10-08 12:32:48,425][102897] Updated weights for policy 0, policy_version 19350 (0.0008) +[2023-10-08 12:32:48,795][102897] Updated weights for policy 0, policy_version 19360 (0.0007) +[2023-10-08 12:32:49,793][102898] Updated weights for policy 1, policy_version 19370 (0.0009) +[2023-10-08 12:32:50,170][102898] Updated weights for policy 1, policy_version 19380 (0.0008) +[2023-10-08 12:32:50,532][102898] Updated weights for policy 1, policy_version 19390 (0.0009) +[2023-10-08 12:32:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 39682048. Throughput: 0: 1801.9, 1: 1802.4. Samples: 9924704. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:32:51,876][101941] Avg episode reward: [(0, '5.600'), (1, '6.400')] +[2023-10-08 12:32:52,380][102897] Updated weights for policy 0, policy_version 19370 (0.0008) +[2023-10-08 12:32:52,759][102897] Updated weights for policy 0, policy_version 19380 (0.0008) +[2023-10-08 12:32:53,133][102897] Updated weights for policy 0, policy_version 19390 (0.0008) +[2023-10-08 12:32:54,360][102898] Updated weights for policy 1, policy_version 19400 (0.0009) +[2023-10-08 12:32:54,724][102898] Updated weights for policy 1, policy_version 19410 (0.0010) +[2023-10-08 12:32:55,103][102898] Updated weights for policy 1, policy_version 19420 (0.0010) +[2023-10-08 12:32:56,827][102897] Updated weights for policy 0, policy_version 19400 (0.0009) +[2023-10-08 12:32:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 39747584. Throughput: 0: 1803.1, 1: 1783.0. Samples: 9945760. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:32:56,876][101941] Avg episode reward: [(0, '5.590'), (1, '6.880')] +[2023-10-08 12:32:57,192][102897] Updated weights for policy 0, policy_version 19410 (0.0007) +[2023-10-08 12:32:57,565][102897] Updated weights for policy 0, policy_version 19420 (0.0009) +[2023-10-08 12:32:58,885][102898] Updated weights for policy 1, policy_version 19430 (0.0008) +[2023-10-08 12:32:59,262][102898] Updated weights for policy 1, policy_version 19440 (0.0007) +[2023-10-08 12:32:59,626][102898] Updated weights for policy 1, policy_version 19450 (0.0007) +[2023-10-08 12:33:01,459][102897] Updated weights for policy 0, policy_version 19430 (0.0008) +[2023-10-08 12:33:01,824][102897] Updated weights for policy 0, policy_version 19440 (0.0010) +[2023-10-08 12:33:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 39813120. Throughput: 0: 1806.4, 1: 1777.3. Samples: 9967766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:33:01,876][101941] Avg episode reward: [(0, '6.060'), (1, '7.290')] +[2023-10-08 12:33:01,883][102760] Saving new best policy, reward=7.290! +[2023-10-08 12:33:02,201][102897] Updated weights for policy 0, policy_version 19450 (0.0010) +[2023-10-08 12:33:03,484][102898] Updated weights for policy 1, policy_version 19460 (0.0009) +[2023-10-08 12:33:03,836][102898] Updated weights for policy 1, policy_version 19470 (0.0008) +[2023-10-08 12:33:04,210][102898] Updated weights for policy 1, policy_version 19480 (0.0008) +[2023-10-08 12:33:05,931][102897] Updated weights for policy 0, policy_version 19460 (0.0008) +[2023-10-08 12:33:06,306][102897] Updated weights for policy 0, policy_version 19470 (0.0009) +[2023-10-08 12:33:06,684][102897] Updated weights for policy 0, policy_version 19480 (0.0008) +[2023-10-08 12:33:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 39878656. Throughput: 0: 1800.0, 1: 1783.9. Samples: 9977998. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:33:06,876][101941] Avg episode reward: [(0, '6.050'), (1, '7.350')] +[2023-10-08 12:33:06,877][102760] Saving new best policy, reward=7.350! +[2023-10-08 12:33:07,962][102898] Updated weights for policy 1, policy_version 19490 (0.0008) +[2023-10-08 12:33:08,336][102898] Updated weights for policy 1, policy_version 19500 (0.0011) +[2023-10-08 12:33:08,709][102898] Updated weights for policy 1, policy_version 19510 (0.0007) +[2023-10-08 12:33:09,077][102898] Updated weights for policy 1, policy_version 19520 (0.0007) +[2023-10-08 12:33:10,414][102897] Updated weights for policy 0, policy_version 19490 (0.0007) +[2023-10-08 12:33:10,785][102897] Updated weights for policy 0, policy_version 19500 (0.0010) +[2023-10-08 12:33:11,164][102897] Updated weights for policy 0, policy_version 19510 (0.0008) +[2023-10-08 12:33:11,527][102897] Updated weights for policy 0, policy_version 19520 (0.0007) +[2023-10-08 12:33:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 39976960. Throughput: 0: 1802.0, 1: 1778.7. Samples: 9999892. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 12:33:11,876][101941] Avg episode reward: [(0, '6.340'), (1, '6.980')] +[2023-10-08 12:33:12,871][102898] Updated weights for policy 1, policy_version 19530 (0.0008) +[2023-10-08 12:33:13,236][102898] Updated weights for policy 1, policy_version 19540 (0.0007) +[2023-10-08 12:33:13,596][102898] Updated weights for policy 1, policy_version 19550 (0.0007) +[2023-10-08 12:33:15,310][102897] Updated weights for policy 0, policy_version 19530 (0.0008) +[2023-10-08 12:33:15,671][102897] Updated weights for policy 0, policy_version 19540 (0.0007) +[2023-10-08 12:33:16,044][102897] Updated weights for policy 0, policy_version 19550 (0.0007) +[2023-10-08 12:33:16,875][101941] Fps is (10 sec: 16383.2, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 40042496. Throughput: 0: 1795.3, 1: 1790.2. Samples: 10021166. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 12:33:16,877][101941] Avg episode reward: [(0, '6.620'), (1, '6.020')] +[2023-10-08 12:33:17,413][102898] Updated weights for policy 1, policy_version 19560 (0.0010) +[2023-10-08 12:33:17,789][102898] Updated weights for policy 1, policy_version 19570 (0.0009) +[2023-10-08 12:33:18,157][102898] Updated weights for policy 1, policy_version 19580 (0.0010) +[2023-10-08 12:33:19,971][102897] Updated weights for policy 0, policy_version 19560 (0.0009) +[2023-10-08 12:33:20,348][102897] Updated weights for policy 0, policy_version 19570 (0.0010) +[2023-10-08 12:33:20,718][102897] Updated weights for policy 0, policy_version 19580 (0.0011) +[2023-10-08 12:33:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 40108032. Throughput: 0: 1799.9, 1: 1779.7. Samples: 10032376. Policy #0 lag: (min: 31.0, avg: 35.7, max: 63.0) +[2023-10-08 12:33:21,875][101941] Avg episode reward: [(0, '5.970'), (1, '6.110')] +[2023-10-08 12:33:21,893][102898] Updated weights for policy 1, policy_version 19590 (0.0008) +[2023-10-08 12:33:22,256][102898] Updated weights for policy 1, policy_version 19600 (0.0009) +[2023-10-08 12:33:22,623][102898] Updated weights for policy 1, policy_version 19610 (0.0009) +[2023-10-08 12:33:24,536][102897] Updated weights for policy 0, policy_version 19590 (0.0009) +[2023-10-08 12:33:24,919][102897] Updated weights for policy 0, policy_version 19600 (0.0009) +[2023-10-08 12:33:25,288][102897] Updated weights for policy 0, policy_version 19610 (0.0009) +[2023-10-08 12:33:26,389][102898] Updated weights for policy 1, policy_version 19620 (0.0008) +[2023-10-08 12:33:26,756][102898] Updated weights for policy 1, policy_version 19630 (0.0007) +[2023-10-08 12:33:26,875][101941] Fps is (10 sec: 13107.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 40173568. Throughput: 0: 1793.6, 1: 1785.9. Samples: 10053566. Policy #0 lag: (min: 24.0, avg: 48.5, max: 56.0) +[2023-10-08 12:33:26,875][101941] Avg episode reward: [(0, '6.010'), (1, '6.470')] +[2023-10-08 12:33:27,131][102898] Updated weights for policy 1, policy_version 19640 (0.0008) +[2023-10-08 12:33:29,005][102897] Updated weights for policy 0, policy_version 19620 (0.0009) +[2023-10-08 12:33:29,388][102897] Updated weights for policy 0, policy_version 19630 (0.0009) +[2023-10-08 12:33:29,763][102897] Updated weights for policy 0, policy_version 19640 (0.0007) +[2023-10-08 12:33:30,973][102898] Updated weights for policy 1, policy_version 19650 (0.0008) +[2023-10-08 12:33:31,352][102898] Updated weights for policy 1, policy_version 19660 (0.0010) +[2023-10-08 12:33:31,716][102898] Updated weights for policy 1, policy_version 19670 (0.0010) +[2023-10-08 12:33:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 40239104. Throughput: 0: 1785.6, 1: 1798.8. Samples: 10074978. Policy #0 lag: (min: 24.0, avg: 48.5, max: 56.0) +[2023-10-08 12:33:31,875][101941] Avg episode reward: [(0, '6.420'), (1, '6.410')] +[2023-10-08 12:33:32,084][102898] Updated weights for policy 1, policy_version 19680 (0.0010) +[2023-10-08 12:33:33,692][102897] Updated weights for policy 0, policy_version 19650 (0.0010) +[2023-10-08 12:33:34,092][102897] Updated weights for policy 0, policy_version 19660 (0.0009) +[2023-10-08 12:33:34,465][102897] Updated weights for policy 0, policy_version 19670 (0.0008) +[2023-10-08 12:33:34,828][102897] Updated weights for policy 0, policy_version 19680 (0.0008) +[2023-10-08 12:33:35,932][102898] Updated weights for policy 1, policy_version 19690 (0.0008) +[2023-10-08 12:33:36,292][102898] Updated weights for policy 1, policy_version 19700 (0.0007) +[2023-10-08 12:33:36,671][102898] Updated weights for policy 1, policy_version 19710 (0.0008) +[2023-10-08 12:33:36,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 40337408. Throughput: 0: 1793.4, 1: 1780.6. Samples: 10085534. Policy #0 lag: (min: 24.0, avg: 48.5, max: 56.0) +[2023-10-08 12:33:36,876][101941] Avg episode reward: [(0, '6.630'), (1, '6.320')] +[2023-10-08 12:33:38,542][102897] Updated weights for policy 0, policy_version 19690 (0.0007) +[2023-10-08 12:33:38,912][102897] Updated weights for policy 0, policy_version 19700 (0.0008) +[2023-10-08 12:33:39,277][102897] Updated weights for policy 0, policy_version 19710 (0.0009) +[2023-10-08 12:33:40,312][102898] Updated weights for policy 1, policy_version 19720 (0.0009) +[2023-10-08 12:33:40,678][102898] Updated weights for policy 1, policy_version 19730 (0.0010) +[2023-10-08 12:33:41,054][102898] Updated weights for policy 1, policy_version 19740 (0.0011) +[2023-10-08 12:33:41,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 40402944. Throughput: 0: 1782.0, 1: 1803.5. Samples: 10107110. Policy #0 lag: (min: 24.0, avg: 48.5, max: 56.0) +[2023-10-08 12:33:41,876][101941] Avg episode reward: [(0, '6.200'), (1, '6.800')] +[2023-10-08 12:33:42,937][102897] Updated weights for policy 0, policy_version 19720 (0.0009) +[2023-10-08 12:33:43,307][102897] Updated weights for policy 0, policy_version 19730 (0.0010) +[2023-10-08 12:33:43,682][102897] Updated weights for policy 0, policy_version 19740 (0.0009) +[2023-10-08 12:33:44,847][102898] Updated weights for policy 1, policy_version 19750 (0.0011) +[2023-10-08 12:33:45,223][102898] Updated weights for policy 1, policy_version 19760 (0.0009) +[2023-10-08 12:33:45,583][102898] Updated weights for policy 1, policy_version 19770 (0.0009) +[2023-10-08 12:33:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 40468480. Throughput: 0: 1787.4, 1: 1784.7. Samples: 10128510. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:33:46,876][101941] Avg episode reward: [(0, '6.960'), (1, '6.940')] +[2023-10-08 12:33:47,439][102897] Updated weights for policy 0, policy_version 19750 (0.0009) +[2023-10-08 12:33:47,804][102897] Updated weights for policy 0, policy_version 19760 (0.0008) +[2023-10-08 12:33:48,179][102897] Updated weights for policy 0, policy_version 19770 (0.0007) +[2023-10-08 12:33:49,158][102898] Updated weights for policy 1, policy_version 19780 (0.0008) +[2023-10-08 12:33:49,525][102898] Updated weights for policy 1, policy_version 19790 (0.0007) +[2023-10-08 12:33:49,894][102898] Updated weights for policy 1, policy_version 19800 (0.0008) +[2023-10-08 12:33:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 40534016. Throughput: 0: 1776.4, 1: 1804.8. Samples: 10139154. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:33:51,877][101941] Avg episode reward: [(0, '6.790'), (1, '7.130')] +[2023-10-08 12:33:51,957][102897] Updated weights for policy 0, policy_version 19780 (0.0007) +[2023-10-08 12:33:52,332][102897] Updated weights for policy 0, policy_version 19790 (0.0007) +[2023-10-08 12:33:52,698][102897] Updated weights for policy 0, policy_version 19800 (0.0007) +[2023-10-08 12:33:53,827][102898] Updated weights for policy 1, policy_version 19810 (0.0008) +[2023-10-08 12:33:54,201][102898] Updated weights for policy 1, policy_version 19820 (0.0009) +[2023-10-08 12:33:54,564][102898] Updated weights for policy 1, policy_version 19830 (0.0008) +[2023-10-08 12:33:54,933][102898] Updated weights for policy 1, policy_version 19840 (0.0008) +[2023-10-08 12:33:56,350][102897] Updated weights for policy 0, policy_version 19810 (0.0007) +[2023-10-08 12:33:56,722][102897] Updated weights for policy 0, policy_version 19820 (0.0009) +[2023-10-08 12:33:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 40599552. Throughput: 0: 1786.0, 1: 1789.3. Samples: 10160780. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:33:56,876][101941] Avg episode reward: [(0, '5.890'), (1, '6.690')] +[2023-10-08 12:33:57,106][102897] Updated weights for policy 0, policy_version 19830 (0.0007) +[2023-10-08 12:33:57,469][102897] Updated weights for policy 0, policy_version 19840 (0.0007) +[2023-10-08 12:33:58,675][102898] Updated weights for policy 1, policy_version 19850 (0.0007) +[2023-10-08 12:33:59,041][102898] Updated weights for policy 1, policy_version 19860 (0.0008) +[2023-10-08 12:33:59,405][102898] Updated weights for policy 1, policy_version 19870 (0.0009) +[2023-10-08 12:34:01,203][102897] Updated weights for policy 0, policy_version 19850 (0.0007) +[2023-10-08 12:34:01,576][102897] Updated weights for policy 0, policy_version 19860 (0.0010) +[2023-10-08 12:34:01,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 40665088. Throughput: 0: 1804.9, 1: 1781.1. Samples: 10182532. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:01,875][101941] Avg episode reward: [(0, '5.550'), (1, '6.800')] +[2023-10-08 12:34:01,948][102897] Updated weights for policy 0, policy_version 19870 (0.0009) +[2023-10-08 12:34:03,037][102898] Updated weights for policy 1, policy_version 19880 (0.0007) +[2023-10-08 12:34:03,404][102898] Updated weights for policy 1, policy_version 19890 (0.0008) +[2023-10-08 12:34:03,778][102898] Updated weights for policy 1, policy_version 19900 (0.0008) +[2023-10-08 12:34:05,806][102897] Updated weights for policy 0, policy_version 19880 (0.0008) +[2023-10-08 12:34:06,187][102897] Updated weights for policy 0, policy_version 19890 (0.0008) +[2023-10-08 12:34:06,556][102897] Updated weights for policy 0, policy_version 19900 (0.0009) +[2023-10-08 12:34:06,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 40763392. Throughput: 0: 1785.0, 1: 1782.7. Samples: 10192920. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:06,876][101941] Avg episode reward: [(0, '5.970'), (1, '6.870')] +[2023-10-08 12:34:07,600][102898] Updated weights for policy 1, policy_version 19910 (0.0008) +[2023-10-08 12:34:07,955][102898] Updated weights for policy 1, policy_version 19920 (0.0009) +[2023-10-08 12:34:08,329][102898] Updated weights for policy 1, policy_version 19930 (0.0009) +[2023-10-08 12:34:10,324][102897] Updated weights for policy 0, policy_version 19910 (0.0009) +[2023-10-08 12:34:10,696][102897] Updated weights for policy 0, policy_version 19920 (0.0010) +[2023-10-08 12:34:11,063][102897] Updated weights for policy 0, policy_version 19930 (0.0010) +[2023-10-08 12:34:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 40828928. Throughput: 0: 1800.7, 1: 1774.8. Samples: 10214464. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:11,875][101941] Avg episode reward: [(0, '5.970'), (1, '6.700')] +[2023-10-08 12:34:12,145][102898] Updated weights for policy 1, policy_version 19940 (0.0009) +[2023-10-08 12:34:12,517][102898] Updated weights for policy 1, policy_version 19950 (0.0008) +[2023-10-08 12:34:12,886][102898] Updated weights for policy 1, policy_version 19960 (0.0008) +[2023-10-08 12:34:14,646][102897] Updated weights for policy 0, policy_version 19940 (0.0009) +[2023-10-08 12:34:15,019][102897] Updated weights for policy 0, policy_version 19950 (0.0007) +[2023-10-08 12:34:15,383][102897] Updated weights for policy 0, policy_version 19960 (0.0008) +[2023-10-08 12:34:16,475][102898] Updated weights for policy 1, policy_version 19970 (0.0008) +[2023-10-08 12:34:16,832][102898] Updated weights for policy 1, policy_version 19980 (0.0009) +[2023-10-08 12:34:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 40894464. Throughput: 0: 1787.4, 1: 1794.2. Samples: 10236150. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:16,876][101941] Avg episode reward: [(0, '6.130'), (1, '6.020')] +[2023-10-08 12:34:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000019968_20447232.pth... +[2023-10-08 12:34:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000018304_18743296.pth +[2023-10-08 12:34:17,205][102898] Updated weights for policy 1, policy_version 19990 (0.0007) +[2023-10-08 12:34:17,566][102898] Updated weights for policy 1, policy_version 20000 (0.0008) +[2023-10-08 12:34:17,566][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000020000_20480000.pth... +[2023-10-08 12:34:17,595][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000018304_18743296.pth +[2023-10-08 12:34:19,206][102897] Updated weights for policy 0, policy_version 19970 (0.0009) +[2023-10-08 12:34:19,604][102897] Updated weights for policy 0, policy_version 19980 (0.0008) +[2023-10-08 12:34:19,987][102897] Updated weights for policy 0, policy_version 19990 (0.0007) +[2023-10-08 12:34:20,358][102897] Updated weights for policy 0, policy_version 20000 (0.0007) +[2023-10-08 12:34:21,272][102898] Updated weights for policy 1, policy_version 20010 (0.0009) +[2023-10-08 12:34:21,640][102898] Updated weights for policy 1, policy_version 20020 (0.0007) +[2023-10-08 12:34:21,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 40960000. Throughput: 0: 1803.0, 1: 1784.8. Samples: 10246986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:21,876][101941] Avg episode reward: [(0, '6.020'), (1, '6.110')] +[2023-10-08 12:34:22,006][102898] Updated weights for policy 1, policy_version 20030 (0.0007) +[2023-10-08 12:34:24,138][102897] Updated weights for policy 0, policy_version 20010 (0.0010) +[2023-10-08 12:34:24,504][102897] Updated weights for policy 0, policy_version 20020 (0.0008) +[2023-10-08 12:34:24,886][102897] Updated weights for policy 0, policy_version 20030 (0.0009) +[2023-10-08 12:34:25,633][102898] Updated weights for policy 1, policy_version 20040 (0.0007) +[2023-10-08 12:34:26,003][102898] Updated weights for policy 1, policy_version 20050 (0.0007) +[2023-10-08 12:34:26,382][102898] Updated weights for policy 1, policy_version 20060 (0.0007) +[2023-10-08 12:34:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 41058304. Throughput: 0: 1779.1, 1: 1803.1. Samples: 10268308. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:26,876][101941] Avg episode reward: [(0, '6.330'), (1, '6.480')] +[2023-10-08 12:34:28,691][102897] Updated weights for policy 0, policy_version 20040 (0.0007) +[2023-10-08 12:34:29,064][102897] Updated weights for policy 0, policy_version 20050 (0.0011) +[2023-10-08 12:34:29,448][102897] Updated weights for policy 0, policy_version 20060 (0.0008) +[2023-10-08 12:34:30,093][102898] Updated weights for policy 1, policy_version 20070 (0.0007) +[2023-10-08 12:34:30,462][102898] Updated weights for policy 1, policy_version 20080 (0.0008) +[2023-10-08 12:34:30,831][102898] Updated weights for policy 1, policy_version 20090 (0.0008) +[2023-10-08 12:34:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 41123840. Throughput: 0: 1778.6, 1: 1799.2. Samples: 10289510. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:31,876][101941] Avg episode reward: [(0, '6.390'), (1, '6.230')] +[2023-10-08 12:34:33,307][102897] Updated weights for policy 0, policy_version 20070 (0.0010) +[2023-10-08 12:34:33,686][102897] Updated weights for policy 0, policy_version 20080 (0.0008) +[2023-10-08 12:34:34,053][102897] Updated weights for policy 0, policy_version 20090 (0.0007) +[2023-10-08 12:34:34,603][102898] Updated weights for policy 1, policy_version 20100 (0.0007) +[2023-10-08 12:34:34,967][102898] Updated weights for policy 1, policy_version 20110 (0.0008) +[2023-10-08 12:34:35,337][102898] Updated weights for policy 1, policy_version 20120 (0.0009) +[2023-10-08 12:34:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 41189376. Throughput: 0: 1776.5, 1: 1808.7. Samples: 10300490. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:36,876][101941] Avg episode reward: [(0, '6.410'), (1, '6.460')] +[2023-10-08 12:34:37,793][102897] Updated weights for policy 0, policy_version 20100 (0.0009) +[2023-10-08 12:34:38,159][102897] Updated weights for policy 0, policy_version 20110 (0.0010) +[2023-10-08 12:34:38,546][102897] Updated weights for policy 0, policy_version 20120 (0.0009) +[2023-10-08 12:34:39,098][102898] Updated weights for policy 1, policy_version 20130 (0.0008) +[2023-10-08 12:34:39,466][102898] Updated weights for policy 1, policy_version 20140 (0.0010) +[2023-10-08 12:34:39,828][102898] Updated weights for policy 1, policy_version 20150 (0.0009) +[2023-10-08 12:34:40,190][102898] Updated weights for policy 1, policy_version 20160 (0.0010) +[2023-10-08 12:34:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 41254912. Throughput: 0: 1772.7, 1: 1797.8. Samples: 10321450. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:41,875][101941] Avg episode reward: [(0, '6.380'), (1, '6.780')] +[2023-10-08 12:34:42,436][102897] Updated weights for policy 0, policy_version 20130 (0.0009) +[2023-10-08 12:34:42,804][102897] Updated weights for policy 0, policy_version 20140 (0.0007) +[2023-10-08 12:34:43,183][102897] Updated weights for policy 0, policy_version 20150 (0.0007) +[2023-10-08 12:34:43,559][102897] Updated weights for policy 0, policy_version 20160 (0.0010) +[2023-10-08 12:34:43,942][102898] Updated weights for policy 1, policy_version 20170 (0.0009) +[2023-10-08 12:34:44,313][102898] Updated weights for policy 1, policy_version 20180 (0.0007) +[2023-10-08 12:34:44,682][102898] Updated weights for policy 1, policy_version 20190 (0.0007) +[2023-10-08 12:34:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 41320448. Throughput: 0: 1779.6, 1: 1801.8. Samples: 10343698. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:46,876][101941] Avg episode reward: [(0, '6.540'), (1, '6.110')] +[2023-10-08 12:34:47,372][102897] Updated weights for policy 0, policy_version 20170 (0.0011) +[2023-10-08 12:34:47,756][102897] Updated weights for policy 0, policy_version 20180 (0.0011) +[2023-10-08 12:34:48,122][102897] Updated weights for policy 0, policy_version 20190 (0.0010) +[2023-10-08 12:34:48,449][102898] Updated weights for policy 1, policy_version 20200 (0.0008) +[2023-10-08 12:34:48,806][102898] Updated weights for policy 1, policy_version 20210 (0.0008) +[2023-10-08 12:34:49,183][102898] Updated weights for policy 1, policy_version 20220 (0.0008) +[2023-10-08 12:34:51,866][102897] Updated weights for policy 0, policy_version 20200 (0.0010) +[2023-10-08 12:34:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 41385984. Throughput: 0: 1764.5, 1: 1804.5. Samples: 10353526. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:51,876][101941] Avg episode reward: [(0, '6.140'), (1, '6.040')] +[2023-10-08 12:34:52,235][102897] Updated weights for policy 0, policy_version 20210 (0.0010) +[2023-10-08 12:34:52,602][102897] Updated weights for policy 0, policy_version 20220 (0.0010) +[2023-10-08 12:34:52,965][102898] Updated weights for policy 1, policy_version 20230 (0.0008) +[2023-10-08 12:34:53,337][102898] Updated weights for policy 1, policy_version 20240 (0.0008) +[2023-10-08 12:34:53,711][102898] Updated weights for policy 1, policy_version 20250 (0.0010) +[2023-10-08 12:34:56,537][102897] Updated weights for policy 0, policy_version 20230 (0.0010) +[2023-10-08 12:34:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 41451520. Throughput: 0: 1779.2, 1: 1813.6. Samples: 10376144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:34:56,876][101941] Avg episode reward: [(0, '6.190'), (1, '6.900')] +[2023-10-08 12:34:56,913][102897] Updated weights for policy 0, policy_version 20240 (0.0008) +[2023-10-08 12:34:57,295][102897] Updated weights for policy 0, policy_version 20250 (0.0008) +[2023-10-08 12:34:57,410][102898] Updated weights for policy 1, policy_version 20260 (0.0009) +[2023-10-08 12:34:57,786][102898] Updated weights for policy 1, policy_version 20270 (0.0008) +[2023-10-08 12:34:58,146][102898] Updated weights for policy 1, policy_version 20280 (0.0009) +[2023-10-08 12:35:01,070][102897] Updated weights for policy 0, policy_version 20260 (0.0009) +[2023-10-08 12:35:01,449][102897] Updated weights for policy 0, policy_version 20270 (0.0007) +[2023-10-08 12:35:01,826][102897] Updated weights for policy 0, policy_version 20280 (0.0007) +[2023-10-08 12:35:01,874][102898] Updated weights for policy 1, policy_version 20290 (0.0009) +[2023-10-08 12:35:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 41517056. Throughput: 0: 1779.8, 1: 1809.7. Samples: 10397678. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:35:01,876][101941] Avg episode reward: [(0, '6.480'), (1, '6.950')] +[2023-10-08 12:35:02,239][102898] Updated weights for policy 1, policy_version 20300 (0.0007) +[2023-10-08 12:35:02,606][102898] Updated weights for policy 1, policy_version 20310 (0.0007) +[2023-10-08 12:35:02,977][102898] Updated weights for policy 1, policy_version 20320 (0.0011) +[2023-10-08 12:35:05,512][102897] Updated weights for policy 0, policy_version 20290 (0.0009) +[2023-10-08 12:35:05,927][102897] Updated weights for policy 0, policy_version 20300 (0.0010) +[2023-10-08 12:35:06,302][102897] Updated weights for policy 0, policy_version 20310 (0.0011) +[2023-10-08 12:35:06,675][102897] Updated weights for policy 0, policy_version 20320 (0.0009) +[2023-10-08 12:35:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 41615360. Throughput: 0: 1771.6, 1: 1803.1. Samples: 10407846. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:35:06,876][101941] Avg episode reward: [(0, '5.910'), (1, '6.870')] +[2023-10-08 12:35:06,976][102898] Updated weights for policy 1, policy_version 20330 (0.0010) +[2023-10-08 12:35:07,347][102898] Updated weights for policy 1, policy_version 20340 (0.0008) +[2023-10-08 12:35:07,718][102898] Updated weights for policy 1, policy_version 20350 (0.0008) +[2023-10-08 12:35:10,362][102897] Updated weights for policy 0, policy_version 20330 (0.0010) +[2023-10-08 12:35:10,725][102897] Updated weights for policy 0, policy_version 20340 (0.0007) +[2023-10-08 12:35:11,098][102897] Updated weights for policy 0, policy_version 20350 (0.0007) +[2023-10-08 12:35:11,463][102898] Updated weights for policy 1, policy_version 20360 (0.0009) +[2023-10-08 12:35:11,835][102898] Updated weights for policy 1, policy_version 20370 (0.0010) +[2023-10-08 12:35:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 41680896. Throughput: 0: 1790.2, 1: 1793.2. Samples: 10429558. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:35:11,876][101941] Avg episode reward: [(0, '5.460'), (1, '7.070')] +[2023-10-08 12:35:12,207][102898] Updated weights for policy 1, policy_version 20380 (0.0008) +[2023-10-08 12:35:14,819][102897] Updated weights for policy 0, policy_version 20360 (0.0007) +[2023-10-08 12:35:15,194][102897] Updated weights for policy 0, policy_version 20370 (0.0008) +[2023-10-08 12:35:15,568][102897] Updated weights for policy 0, policy_version 20380 (0.0010) +[2023-10-08 12:35:15,824][102898] Updated weights for policy 1, policy_version 20390 (0.0008) +[2023-10-08 12:35:16,206][102898] Updated weights for policy 1, policy_version 20400 (0.0011) +[2023-10-08 12:35:16,571][102898] Updated weights for policy 1, policy_version 20410 (0.0010) +[2023-10-08 12:35:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 41779200. Throughput: 0: 1770.1, 1: 1794.4. Samples: 10449916. Policy #0 lag: (min: 18.0, avg: 20.7, max: 50.0) +[2023-10-08 12:35:16,876][101941] Avg episode reward: [(0, '6.260'), (1, '7.160')] +[2023-10-08 12:35:19,164][102897] Updated weights for policy 0, policy_version 20390 (0.0008) +[2023-10-08 12:35:19,536][102897] Updated weights for policy 0, policy_version 20400 (0.0009) +[2023-10-08 12:35:19,915][102897] Updated weights for policy 0, policy_version 20410 (0.0008) +[2023-10-08 12:35:20,299][102898] Updated weights for policy 1, policy_version 20420 (0.0009) +[2023-10-08 12:35:20,676][102898] Updated weights for policy 1, policy_version 20430 (0.0007) +[2023-10-08 12:35:21,056][102898] Updated weights for policy 1, policy_version 20440 (0.0007) +[2023-10-08 12:35:21,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 41844736. Throughput: 0: 1798.3, 1: 1783.2. Samples: 10461658. Policy #0 lag: (min: 18.0, avg: 20.7, max: 50.0) +[2023-10-08 12:35:21,875][101941] Avg episode reward: [(0, '6.890'), (1, '7.130')] +[2023-10-08 12:35:23,651][102897] Updated weights for policy 0, policy_version 20420 (0.0009) +[2023-10-08 12:35:24,021][102897] Updated weights for policy 0, policy_version 20430 (0.0007) +[2023-10-08 12:35:24,406][102897] Updated weights for policy 0, policy_version 20440 (0.0008) +[2023-10-08 12:35:24,808][102898] Updated weights for policy 1, policy_version 20450 (0.0009) +[2023-10-08 12:35:25,183][102898] Updated weights for policy 1, policy_version 20460 (0.0010) +[2023-10-08 12:35:25,543][102898] Updated weights for policy 1, policy_version 20470 (0.0009) +[2023-10-08 12:35:25,910][102898] Updated weights for policy 1, policy_version 20480 (0.0010) +[2023-10-08 12:35:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 41910272. Throughput: 0: 1777.1, 1: 1798.4. Samples: 10482346. Policy #0 lag: (min: 18.0, avg: 20.7, max: 50.0) +[2023-10-08 12:35:26,876][101941] Avg episode reward: [(0, '6.060'), (1, '6.990')] +[2023-10-08 12:35:28,304][102897] Updated weights for policy 0, policy_version 20450 (0.0008) +[2023-10-08 12:35:28,675][102897] Updated weights for policy 0, policy_version 20460 (0.0010) +[2023-10-08 12:35:29,044][102897] Updated weights for policy 0, policy_version 20470 (0.0009) +[2023-10-08 12:35:29,413][102897] Updated weights for policy 0, policy_version 20480 (0.0009) +[2023-10-08 12:35:29,803][102898] Updated weights for policy 1, policy_version 20490 (0.0009) +[2023-10-08 12:35:30,177][102898] Updated weights for policy 1, policy_version 20500 (0.0008) +[2023-10-08 12:35:30,558][102898] Updated weights for policy 1, policy_version 20510 (0.0009) +[2023-10-08 12:35:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 41975808. Throughput: 0: 1780.1, 1: 1779.1. Samples: 10503860. Policy #0 lag: (min: 18.0, avg: 20.7, max: 50.0) +[2023-10-08 12:35:31,876][101941] Avg episode reward: [(0, '5.530'), (1, '6.320')] +[2023-10-08 12:35:33,141][102897] Updated weights for policy 0, policy_version 20490 (0.0010) +[2023-10-08 12:35:33,510][102897] Updated weights for policy 0, policy_version 20500 (0.0008) +[2023-10-08 12:35:33,888][102897] Updated weights for policy 0, policy_version 20510 (0.0009) +[2023-10-08 12:35:34,235][102898] Updated weights for policy 1, policy_version 20520 (0.0009) +[2023-10-08 12:35:34,604][102898] Updated weights for policy 1, policy_version 20530 (0.0008) +[2023-10-08 12:35:34,979][102898] Updated weights for policy 1, policy_version 20540 (0.0011) +[2023-10-08 12:35:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 42041344. Throughput: 0: 1784.1, 1: 1795.2. Samples: 10514594. Policy #0 lag: (min: 30.0, avg: 33.0, max: 62.0) +[2023-10-08 12:35:36,876][101941] Avg episode reward: [(0, '5.720'), (1, '6.720')] +[2023-10-08 12:35:37,599][102897] Updated weights for policy 0, policy_version 20520 (0.0007) +[2023-10-08 12:35:37,972][102897] Updated weights for policy 0, policy_version 20530 (0.0008) +[2023-10-08 12:35:38,345][102897] Updated weights for policy 0, policy_version 20540 (0.0008) +[2023-10-08 12:35:38,701][102898] Updated weights for policy 1, policy_version 20550 (0.0008) +[2023-10-08 12:35:39,076][102898] Updated weights for policy 1, policy_version 20560 (0.0008) +[2023-10-08 12:35:39,441][102898] Updated weights for policy 1, policy_version 20570 (0.0007) +[2023-10-08 12:35:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 42106880. Throughput: 0: 1784.4, 1: 1771.9. Samples: 10536180. Policy #0 lag: (min: 30.0, avg: 33.0, max: 62.0) +[2023-10-08 12:35:41,876][101941] Avg episode reward: [(0, '5.720'), (1, '7.170')] +[2023-10-08 12:35:42,116][102897] Updated weights for policy 0, policy_version 20550 (0.0010) +[2023-10-08 12:35:42,500][102897] Updated weights for policy 0, policy_version 20560 (0.0007) +[2023-10-08 12:35:42,883][102897] Updated weights for policy 0, policy_version 20570 (0.0007) +[2023-10-08 12:35:43,213][102898] Updated weights for policy 1, policy_version 20580 (0.0008) +[2023-10-08 12:35:43,591][102898] Updated weights for policy 1, policy_version 20590 (0.0007) +[2023-10-08 12:35:43,954][102898] Updated weights for policy 1, policy_version 20600 (0.0011) +[2023-10-08 12:35:46,697][102897] Updated weights for policy 0, policy_version 20580 (0.0008) +[2023-10-08 12:35:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 42172416. Throughput: 0: 1800.3, 1: 1775.1. Samples: 10558568. Policy #0 lag: (min: 30.0, avg: 33.0, max: 62.0) +[2023-10-08 12:35:46,875][101941] Avg episode reward: [(0, '5.850'), (1, '6.770')] +[2023-10-08 12:35:47,069][102897] Updated weights for policy 0, policy_version 20590 (0.0008) +[2023-10-08 12:35:47,440][102897] Updated weights for policy 0, policy_version 20600 (0.0008) +[2023-10-08 12:35:47,747][102898] Updated weights for policy 1, policy_version 20610 (0.0008) +[2023-10-08 12:35:48,115][102898] Updated weights for policy 1, policy_version 20620 (0.0008) +[2023-10-08 12:35:48,482][102898] Updated weights for policy 1, policy_version 20630 (0.0007) +[2023-10-08 12:35:48,855][102898] Updated weights for policy 1, policy_version 20640 (0.0008) +[2023-10-08 12:35:51,406][102897] Updated weights for policy 0, policy_version 20610 (0.0008) +[2023-10-08 12:35:51,813][102897] Updated weights for policy 0, policy_version 20620 (0.0008) +[2023-10-08 12:35:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 42237952. Throughput: 0: 1782.8, 1: 1780.1. Samples: 10568174. Policy #0 lag: (min: 30.0, avg: 33.0, max: 62.0) +[2023-10-08 12:35:51,875][101941] Avg episode reward: [(0, '6.390'), (1, '7.030')] +[2023-10-08 12:35:52,197][102897] Updated weights for policy 0, policy_version 20630 (0.0007) +[2023-10-08 12:35:52,559][102897] Updated weights for policy 0, policy_version 20640 (0.0008) +[2023-10-08 12:35:52,622][102898] Updated weights for policy 1, policy_version 20650 (0.0007) +[2023-10-08 12:35:53,005][102898] Updated weights for policy 1, policy_version 20660 (0.0010) +[2023-10-08 12:35:53,378][102898] Updated weights for policy 1, policy_version 20670 (0.0008) +[2023-10-08 12:35:56,131][102897] Updated weights for policy 0, policy_version 20650 (0.0009) +[2023-10-08 12:35:56,507][102897] Updated weights for policy 0, policy_version 20660 (0.0009) +[2023-10-08 12:35:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 42303488. Throughput: 0: 1788.6, 1: 1781.4. Samples: 10590206. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:35:56,876][101941] Avg episode reward: [(0, '6.150'), (1, '6.990')] +[2023-10-08 12:35:56,884][102897] Updated weights for policy 0, policy_version 20670 (0.0007) +[2023-10-08 12:35:57,194][102898] Updated weights for policy 1, policy_version 20680 (0.0009) +[2023-10-08 12:35:57,566][102898] Updated weights for policy 1, policy_version 20690 (0.0009) +[2023-10-08 12:35:57,935][102898] Updated weights for policy 1, policy_version 20700 (0.0009) +[2023-10-08 12:36:00,699][102897] Updated weights for policy 0, policy_version 20680 (0.0007) +[2023-10-08 12:36:01,065][102897] Updated weights for policy 0, policy_version 20690 (0.0010) +[2023-10-08 12:36:01,433][102897] Updated weights for policy 0, policy_version 20700 (0.0009) +[2023-10-08 12:36:01,669][102898] Updated weights for policy 1, policy_version 20710 (0.0008) +[2023-10-08 12:36:01,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 42401792. Throughput: 0: 1783.4, 1: 1799.9. Samples: 10611162. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:01,876][101941] Avg episode reward: [(0, '5.980'), (1, '6.740')] +[2023-10-08 12:36:02,043][102898] Updated weights for policy 1, policy_version 20720 (0.0007) +[2023-10-08 12:36:02,413][102898] Updated weights for policy 1, policy_version 20730 (0.0007) +[2023-10-08 12:36:05,121][102897] Updated weights for policy 0, policy_version 20710 (0.0007) +[2023-10-08 12:36:05,502][102897] Updated weights for policy 0, policy_version 20720 (0.0007) +[2023-10-08 12:36:05,865][102897] Updated weights for policy 0, policy_version 20730 (0.0007) +[2023-10-08 12:36:06,189][102898] Updated weights for policy 1, policy_version 20740 (0.0007) +[2023-10-08 12:36:06,557][102898] Updated weights for policy 1, policy_version 20750 (0.0007) +[2023-10-08 12:36:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 42467328. Throughput: 0: 1790.0, 1: 1776.4. Samples: 10622144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:06,876][101941] Avg episode reward: [(0, '6.710'), (1, '7.090')] +[2023-10-08 12:36:06,925][102898] Updated weights for policy 1, policy_version 20760 (0.0007) +[2023-10-08 12:36:09,491][102897] Updated weights for policy 0, policy_version 20740 (0.0008) +[2023-10-08 12:36:09,869][102897] Updated weights for policy 0, policy_version 20750 (0.0008) +[2023-10-08 12:36:10,239][102897] Updated weights for policy 0, policy_version 20760 (0.0008) +[2023-10-08 12:36:10,705][102898] Updated weights for policy 1, policy_version 20770 (0.0007) +[2023-10-08 12:36:11,069][102898] Updated weights for policy 1, policy_version 20780 (0.0008) +[2023-10-08 12:36:11,434][102898] Updated weights for policy 1, policy_version 20790 (0.0009) +[2023-10-08 12:36:11,805][102898] Updated weights for policy 1, policy_version 20800 (0.0007) +[2023-10-08 12:36:11,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 42565632. Throughput: 0: 1792.5, 1: 1792.8. Samples: 10643680. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:11,875][101941] Avg episode reward: [(0, '6.070'), (1, '7.000')] +[2023-10-08 12:36:14,077][102897] Updated weights for policy 0, policy_version 20770 (0.0010) +[2023-10-08 12:36:14,440][102897] Updated weights for policy 0, policy_version 20780 (0.0011) +[2023-10-08 12:36:14,808][102897] Updated weights for policy 0, policy_version 20790 (0.0010) +[2023-10-08 12:36:15,178][102897] Updated weights for policy 0, policy_version 20800 (0.0010) +[2023-10-08 12:36:15,756][102898] Updated weights for policy 1, policy_version 20810 (0.0007) +[2023-10-08 12:36:16,125][102898] Updated weights for policy 1, policy_version 20820 (0.0008) +[2023-10-08 12:36:16,491][102898] Updated weights for policy 1, policy_version 20830 (0.0009) +[2023-10-08 12:36:16,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 42631168. Throughput: 0: 1781.4, 1: 1785.4. Samples: 10664366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:16,876][101941] Avg episode reward: [(0, '6.190'), (1, '6.690')] +[2023-10-08 12:36:16,888][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000020832_21331968.pth... +[2023-10-08 12:36:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000020800_21299200.pth... +[2023-10-08 12:36:16,918][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000019136_19595264.pth +[2023-10-08 12:36:16,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000019136_19595264.pth +[2023-10-08 12:36:18,961][102897] Updated weights for policy 0, policy_version 20810 (0.0007) +[2023-10-08 12:36:19,336][102897] Updated weights for policy 0, policy_version 20820 (0.0008) +[2023-10-08 12:36:19,710][102897] Updated weights for policy 0, policy_version 20830 (0.0009) +[2023-10-08 12:36:20,135][102898] Updated weights for policy 1, policy_version 20840 (0.0008) +[2023-10-08 12:36:20,506][102898] Updated weights for policy 1, policy_version 20850 (0.0007) +[2023-10-08 12:36:20,875][102898] Updated weights for policy 1, policy_version 20860 (0.0008) +[2023-10-08 12:36:21,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 42696704. Throughput: 0: 1789.9, 1: 1797.9. Samples: 10676044. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:21,877][101941] Avg episode reward: [(0, '6.390'), (1, '6.720')] +[2023-10-08 12:36:23,457][102897] Updated weights for policy 0, policy_version 20840 (0.0011) +[2023-10-08 12:36:23,823][102897] Updated weights for policy 0, policy_version 20850 (0.0010) +[2023-10-08 12:36:24,187][102897] Updated weights for policy 0, policy_version 20860 (0.0008) +[2023-10-08 12:36:24,664][102898] Updated weights for policy 1, policy_version 20870 (0.0009) +[2023-10-08 12:36:25,033][102898] Updated weights for policy 1, policy_version 20880 (0.0010) +[2023-10-08 12:36:25,403][102898] Updated weights for policy 1, policy_version 20890 (0.0008) +[2023-10-08 12:36:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 42762240. Throughput: 0: 1775.1, 1: 1789.7. Samples: 10696596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:26,876][101941] Avg episode reward: [(0, '6.660'), (1, '6.740')] +[2023-10-08 12:36:28,026][102897] Updated weights for policy 0, policy_version 20870 (0.0009) +[2023-10-08 12:36:28,410][102897] Updated weights for policy 0, policy_version 20880 (0.0009) +[2023-10-08 12:36:28,776][102897] Updated weights for policy 0, policy_version 20890 (0.0007) +[2023-10-08 12:36:29,240][102898] Updated weights for policy 1, policy_version 20900 (0.0010) +[2023-10-08 12:36:29,613][102898] Updated weights for policy 1, policy_version 20910 (0.0007) +[2023-10-08 12:36:29,974][102898] Updated weights for policy 1, policy_version 20920 (0.0007) +[2023-10-08 12:36:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 42827776. Throughput: 0: 1777.6, 1: 1777.4. Samples: 10718540. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:36:31,876][101941] Avg episode reward: [(0, '6.170'), (1, '6.530')] +[2023-10-08 12:36:32,734][102897] Updated weights for policy 0, policy_version 20900 (0.0008) +[2023-10-08 12:36:33,099][102897] Updated weights for policy 0, policy_version 20910 (0.0009) +[2023-10-08 12:36:33,466][102897] Updated weights for policy 0, policy_version 20920 (0.0010) +[2023-10-08 12:36:33,677][102898] Updated weights for policy 1, policy_version 20930 (0.0008) +[2023-10-08 12:36:34,039][102898] Updated weights for policy 1, policy_version 20940 (0.0010) +[2023-10-08 12:36:34,408][102898] Updated weights for policy 1, policy_version 20950 (0.0008) +[2023-10-08 12:36:34,774][102898] Updated weights for policy 1, policy_version 20960 (0.0008) +[2023-10-08 12:36:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 42893312. Throughput: 0: 1781.8, 1: 1791.2. Samples: 10728960. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:36:36,875][101941] Avg episode reward: [(0, '6.740'), (1, '7.000')] +[2023-10-08 12:36:37,171][102897] Updated weights for policy 0, policy_version 20930 (0.0008) +[2023-10-08 12:36:37,565][102897] Updated weights for policy 0, policy_version 20940 (0.0008) +[2023-10-08 12:36:37,946][102897] Updated weights for policy 0, policy_version 20950 (0.0009) +[2023-10-08 12:36:38,313][102897] Updated weights for policy 0, policy_version 20960 (0.0008) +[2023-10-08 12:36:38,511][102898] Updated weights for policy 1, policy_version 20970 (0.0008) +[2023-10-08 12:36:38,878][102898] Updated weights for policy 1, policy_version 20980 (0.0009) +[2023-10-08 12:36:39,253][102898] Updated weights for policy 1, policy_version 20990 (0.0008) +[2023-10-08 12:36:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 42958848. Throughput: 0: 1788.4, 1: 1779.3. Samples: 10750756. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:36:41,876][101941] Avg episode reward: [(0, '6.800'), (1, '6.770')] +[2023-10-08 12:36:42,023][102897] Updated weights for policy 0, policy_version 20970 (0.0011) +[2023-10-08 12:36:42,393][102897] Updated weights for policy 0, policy_version 20980 (0.0010) +[2023-10-08 12:36:42,758][102897] Updated weights for policy 0, policy_version 20990 (0.0008) +[2023-10-08 12:36:43,224][102898] Updated weights for policy 1, policy_version 21000 (0.0007) +[2023-10-08 12:36:43,594][102898] Updated weights for policy 1, policy_version 21010 (0.0008) +[2023-10-08 12:36:43,961][102898] Updated weights for policy 1, policy_version 21020 (0.0011) +[2023-10-08 12:36:46,489][102897] Updated weights for policy 0, policy_version 21000 (0.0009) +[2023-10-08 12:36:46,865][102897] Updated weights for policy 0, policy_version 21010 (0.0008) +[2023-10-08 12:36:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 43024384. Throughput: 0: 1808.2, 1: 1779.4. Samples: 10772604. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:36:46,876][101941] Avg episode reward: [(0, '6.680'), (1, '6.370')] +[2023-10-08 12:36:47,247][102897] Updated weights for policy 0, policy_version 21020 (0.0007) +[2023-10-08 12:36:47,709][102898] Updated weights for policy 1, policy_version 21030 (0.0010) +[2023-10-08 12:36:48,083][102898] Updated weights for policy 1, policy_version 21040 (0.0007) +[2023-10-08 12:36:48,450][102898] Updated weights for policy 1, policy_version 21050 (0.0008) +[2023-10-08 12:36:50,994][102897] Updated weights for policy 0, policy_version 21030 (0.0008) +[2023-10-08 12:36:51,360][102897] Updated weights for policy 0, policy_version 21040 (0.0008) +[2023-10-08 12:36:51,731][102897] Updated weights for policy 0, policy_version 21050 (0.0007) +[2023-10-08 12:36:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 43089920. Throughput: 0: 1784.3, 1: 1784.3. Samples: 10782730. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:51,875][101941] Avg episode reward: [(0, '6.530'), (1, '6.030')] +[2023-10-08 12:36:52,182][102898] Updated weights for policy 1, policy_version 21060 (0.0008) +[2023-10-08 12:36:52,547][102898] Updated weights for policy 1, policy_version 21070 (0.0008) +[2023-10-08 12:36:52,910][102898] Updated weights for policy 1, policy_version 21080 (0.0007) +[2023-10-08 12:36:55,477][102897] Updated weights for policy 0, policy_version 21060 (0.0009) +[2023-10-08 12:36:55,848][102897] Updated weights for policy 0, policy_version 21070 (0.0008) +[2023-10-08 12:36:56,227][102897] Updated weights for policy 0, policy_version 21080 (0.0008) +[2023-10-08 12:36:56,634][102898] Updated weights for policy 1, policy_version 21090 (0.0007) +[2023-10-08 12:36:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 43188224. Throughput: 0: 1800.7, 1: 1781.0. Samples: 10804858. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:36:56,876][101941] Avg episode reward: [(0, '5.860'), (1, '6.620')] +[2023-10-08 12:36:57,006][102898] Updated weights for policy 1, policy_version 21100 (0.0009) +[2023-10-08 12:36:57,365][102898] Updated weights for policy 1, policy_version 21110 (0.0007) +[2023-10-08 12:36:57,736][102898] Updated weights for policy 1, policy_version 21120 (0.0009) +[2023-10-08 12:37:00,013][102897] Updated weights for policy 0, policy_version 21090 (0.0009) +[2023-10-08 12:37:00,390][102897] Updated weights for policy 0, policy_version 21100 (0.0010) +[2023-10-08 12:37:00,754][102897] Updated weights for policy 0, policy_version 21110 (0.0011) +[2023-10-08 12:37:01,132][102897] Updated weights for policy 0, policy_version 21120 (0.0007) +[2023-10-08 12:37:01,541][102898] Updated weights for policy 1, policy_version 21130 (0.0008) +[2023-10-08 12:37:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 43253760. Throughput: 0: 1782.5, 1: 1805.1. Samples: 10825808. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:37:01,876][101941] Avg episode reward: [(0, '5.760'), (1, '7.240')] +[2023-10-08 12:37:01,910][102898] Updated weights for policy 1, policy_version 21140 (0.0008) +[2023-10-08 12:37:02,284][102898] Updated weights for policy 1, policy_version 21150 (0.0007) +[2023-10-08 12:37:04,894][102897] Updated weights for policy 0, policy_version 21130 (0.0010) +[2023-10-08 12:37:05,263][102897] Updated weights for policy 0, policy_version 21140 (0.0010) +[2023-10-08 12:37:05,633][102897] Updated weights for policy 0, policy_version 21150 (0.0009) +[2023-10-08 12:37:05,930][102898] Updated weights for policy 1, policy_version 21160 (0.0007) +[2023-10-08 12:37:06,301][102898] Updated weights for policy 1, policy_version 21170 (0.0009) +[2023-10-08 12:37:06,671][102898] Updated weights for policy 1, policy_version 21180 (0.0009) +[2023-10-08 12:37:06,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 43352064. Throughput: 0: 1807.4, 1: 1779.7. Samples: 10837464. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:37:06,876][101941] Avg episode reward: [(0, '6.410'), (1, '6.470')] +[2023-10-08 12:37:09,318][102897] Updated weights for policy 0, policy_version 21160 (0.0008) +[2023-10-08 12:37:09,687][102897] Updated weights for policy 0, policy_version 21170 (0.0010) +[2023-10-08 12:37:10,057][102897] Updated weights for policy 0, policy_version 21180 (0.0008) +[2023-10-08 12:37:10,488][102898] Updated weights for policy 1, policy_version 21190 (0.0008) +[2023-10-08 12:37:10,852][102898] Updated weights for policy 1, policy_version 21200 (0.0007) +[2023-10-08 12:37:11,223][102898] Updated weights for policy 1, policy_version 21210 (0.0009) +[2023-10-08 12:37:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 43417600. Throughput: 0: 1787.7, 1: 1804.0. Samples: 10858224. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:37:11,876][101941] Avg episode reward: [(0, '7.110'), (1, '6.330')] +[2023-10-08 12:37:13,957][102897] Updated weights for policy 0, policy_version 21190 (0.0009) +[2023-10-08 12:37:14,326][102897] Updated weights for policy 0, policy_version 21200 (0.0008) +[2023-10-08 12:37:14,695][102897] Updated weights for policy 0, policy_version 21210 (0.0008) +[2023-10-08 12:37:14,975][102898] Updated weights for policy 1, policy_version 21220 (0.0008) +[2023-10-08 12:37:15,343][102898] Updated weights for policy 1, policy_version 21230 (0.0007) +[2023-10-08 12:37:15,704][102898] Updated weights for policy 1, policy_version 21240 (0.0009) +[2023-10-08 12:37:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 43483136. Throughput: 0: 1786.4, 1: 1788.8. Samples: 10879424. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:37:16,876][101941] Avg episode reward: [(0, '6.450'), (1, '6.450')] +[2023-10-08 12:37:18,420][102897] Updated weights for policy 0, policy_version 21220 (0.0008) +[2023-10-08 12:37:18,798][102897] Updated weights for policy 0, policy_version 21230 (0.0007) +[2023-10-08 12:37:19,167][102897] Updated weights for policy 0, policy_version 21240 (0.0008) +[2023-10-08 12:37:19,409][102898] Updated weights for policy 1, policy_version 21250 (0.0007) +[2023-10-08 12:37:19,773][102898] Updated weights for policy 1, policy_version 21260 (0.0008) +[2023-10-08 12:37:20,133][102898] Updated weights for policy 1, policy_version 21270 (0.0007) +[2023-10-08 12:37:20,506][102898] Updated weights for policy 1, policy_version 21280 (0.0007) +[2023-10-08 12:37:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 43548672. Throughput: 0: 1785.3, 1: 1802.7. Samples: 10890420. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:37:21,876][101941] Avg episode reward: [(0, '6.650'), (1, '6.590')] +[2023-10-08 12:37:22,973][102897] Updated weights for policy 0, policy_version 21250 (0.0008) +[2023-10-08 12:37:23,337][102897] Updated weights for policy 0, policy_version 21260 (0.0007) +[2023-10-08 12:37:23,710][102897] Updated weights for policy 0, policy_version 21270 (0.0007) +[2023-10-08 12:37:24,086][102897] Updated weights for policy 0, policy_version 21280 (0.0007) +[2023-10-08 12:37:24,264][102898] Updated weights for policy 1, policy_version 21290 (0.0010) +[2023-10-08 12:37:24,627][102898] Updated weights for policy 1, policy_version 21300 (0.0009) +[2023-10-08 12:37:25,000][102898] Updated weights for policy 1, policy_version 21310 (0.0010) +[2023-10-08 12:37:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 43614208. Throughput: 0: 1784.7, 1: 1788.3. Samples: 10911540. Policy #0 lag: (min: 31.0, avg: 46.2, max: 63.0) +[2023-10-08 12:37:26,875][101941] Avg episode reward: [(0, '6.200'), (1, '6.740')] +[2023-10-08 12:37:27,884][102897] Updated weights for policy 0, policy_version 21290 (0.0008) +[2023-10-08 12:37:28,264][102897] Updated weights for policy 0, policy_version 21300 (0.0008) +[2023-10-08 12:37:28,635][102897] Updated weights for policy 0, policy_version 21310 (0.0008) +[2023-10-08 12:37:28,901][102898] Updated weights for policy 1, policy_version 21320 (0.0007) +[2023-10-08 12:37:29,273][102898] Updated weights for policy 1, policy_version 21330 (0.0008) +[2023-10-08 12:37:29,646][102898] Updated weights for policy 1, policy_version 21340 (0.0007) +[2023-10-08 12:37:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 43679744. Throughput: 0: 1783.7, 1: 1791.7. Samples: 10933500. Policy #0 lag: (min: 31.0, avg: 46.2, max: 63.0) +[2023-10-08 12:37:31,876][101941] Avg episode reward: [(0, '5.880'), (1, '7.110')] +[2023-10-08 12:37:32,449][102897] Updated weights for policy 0, policy_version 21320 (0.0007) +[2023-10-08 12:37:32,810][102897] Updated weights for policy 0, policy_version 21330 (0.0007) +[2023-10-08 12:37:33,195][102897] Updated weights for policy 0, policy_version 21340 (0.0008) +[2023-10-08 12:37:33,399][102898] Updated weights for policy 1, policy_version 21350 (0.0008) +[2023-10-08 12:37:33,756][102898] Updated weights for policy 1, policy_version 21360 (0.0011) +[2023-10-08 12:37:34,123][102898] Updated weights for policy 1, policy_version 21370 (0.0010) +[2023-10-08 12:37:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 43745280. Throughput: 0: 1776.4, 1: 1788.9. Samples: 10943168. Policy #0 lag: (min: 31.0, avg: 46.2, max: 63.0) +[2023-10-08 12:37:36,876][101941] Avg episode reward: [(0, '6.180'), (1, '7.460')] +[2023-10-08 12:37:36,877][102760] Saving new best policy, reward=7.460! +[2023-10-08 12:37:36,899][102897] Updated weights for policy 0, policy_version 21350 (0.0007) +[2023-10-08 12:37:37,271][102897] Updated weights for policy 0, policy_version 21360 (0.0007) +[2023-10-08 12:37:37,642][102897] Updated weights for policy 0, policy_version 21370 (0.0007) +[2023-10-08 12:37:38,012][102898] Updated weights for policy 1, policy_version 21380 (0.0010) +[2023-10-08 12:37:38,379][102898] Updated weights for policy 1, policy_version 21390 (0.0007) +[2023-10-08 12:37:38,740][102898] Updated weights for policy 1, policy_version 21400 (0.0007) +[2023-10-08 12:37:41,422][102897] Updated weights for policy 0, policy_version 21380 (0.0008) +[2023-10-08 12:37:41,797][102897] Updated weights for policy 0, policy_version 21390 (0.0010) +[2023-10-08 12:37:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 43810816. Throughput: 0: 1781.7, 1: 1790.7. Samples: 10965618. Policy #0 lag: (min: 31.0, avg: 46.2, max: 63.0) +[2023-10-08 12:37:41,876][101941] Avg episode reward: [(0, '6.480'), (1, '6.770')] +[2023-10-08 12:37:42,169][102897] Updated weights for policy 0, policy_version 21400 (0.0009) +[2023-10-08 12:37:42,575][102898] Updated weights for policy 1, policy_version 21410 (0.0008) +[2023-10-08 12:37:42,952][102898] Updated weights for policy 1, policy_version 21420 (0.0009) +[2023-10-08 12:37:43,320][102898] Updated weights for policy 1, policy_version 21430 (0.0007) +[2023-10-08 12:37:43,693][102898] Updated weights for policy 1, policy_version 21440 (0.0008) +[2023-10-08 12:37:45,999][102897] Updated weights for policy 0, policy_version 21410 (0.0007) +[2023-10-08 12:37:46,376][102897] Updated weights for policy 0, policy_version 21420 (0.0008) +[2023-10-08 12:37:46,736][102897] Updated weights for policy 0, policy_version 21430 (0.0008) +[2023-10-08 12:37:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 43876352. Throughput: 0: 1797.3, 1: 1794.6. Samples: 10987442. Policy #0 lag: (min: 12.0, avg: 14.5, max: 44.0) +[2023-10-08 12:37:46,875][101941] Avg episode reward: [(0, '6.560'), (1, '6.690')] +[2023-10-08 12:37:47,112][102897] Updated weights for policy 0, policy_version 21440 (0.0009) +[2023-10-08 12:37:47,206][102898] Updated weights for policy 1, policy_version 21450 (0.0008) +[2023-10-08 12:37:47,579][102898] Updated weights for policy 1, policy_version 21460 (0.0008) +[2023-10-08 12:37:47,944][102898] Updated weights for policy 1, policy_version 21470 (0.0010) +[2023-10-08 12:37:51,005][102897] Updated weights for policy 0, policy_version 21450 (0.0009) +[2023-10-08 12:37:51,371][102897] Updated weights for policy 0, policy_version 21460 (0.0008) +[2023-10-08 12:37:51,690][102898] Updated weights for policy 1, policy_version 21480 (0.0008) +[2023-10-08 12:37:51,745][102897] Updated weights for policy 0, policy_version 21470 (0.0007) +[2023-10-08 12:37:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 43974656. Throughput: 0: 1769.3, 1: 1788.6. Samples: 10997568. Policy #0 lag: (min: 12.0, avg: 14.5, max: 44.0) +[2023-10-08 12:37:51,876][101941] Avg episode reward: [(0, '6.400'), (1, '6.520')] +[2023-10-08 12:37:52,053][102898] Updated weights for policy 1, policy_version 21490 (0.0008) +[2023-10-08 12:37:52,422][102898] Updated weights for policy 1, policy_version 21500 (0.0007) +[2023-10-08 12:37:55,432][102897] Updated weights for policy 0, policy_version 21480 (0.0009) +[2023-10-08 12:37:55,800][102897] Updated weights for policy 0, policy_version 21490 (0.0010) +[2023-10-08 12:37:56,102][102898] Updated weights for policy 1, policy_version 21510 (0.0007) +[2023-10-08 12:37:56,166][102897] Updated weights for policy 0, policy_version 21500 (0.0010) +[2023-10-08 12:37:56,473][102898] Updated weights for policy 1, policy_version 21520 (0.0007) +[2023-10-08 12:37:56,840][102898] Updated weights for policy 1, policy_version 21530 (0.0007) +[2023-10-08 12:37:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 44040192. Throughput: 0: 1797.4, 1: 1794.6. Samples: 11019862. Policy #0 lag: (min: 12.0, avg: 14.5, max: 44.0) +[2023-10-08 12:37:56,875][101941] Avg episode reward: [(0, '7.090'), (1, '6.120')] +[2023-10-08 12:38:00,012][102897] Updated weights for policy 0, policy_version 21510 (0.0009) +[2023-10-08 12:38:00,382][102897] Updated weights for policy 0, policy_version 21520 (0.0008) +[2023-10-08 12:38:00,648][102898] Updated weights for policy 1, policy_version 21540 (0.0010) +[2023-10-08 12:38:00,753][102897] Updated weights for policy 0, policy_version 21530 (0.0008) +[2023-10-08 12:38:01,013][102898] Updated weights for policy 1, policy_version 21550 (0.0008) +[2023-10-08 12:38:01,385][102898] Updated weights for policy 1, policy_version 21560 (0.0008) +[2023-10-08 12:38:01,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 44138496. Throughput: 0: 1767.0, 1: 1797.2. Samples: 11039812. Policy #0 lag: (min: 10.0, avg: 10.5, max: 22.0) +[2023-10-08 12:38:01,876][101941] Avg episode reward: [(0, '7.400'), (1, '6.430')] +[2023-10-08 12:38:01,885][102634] Saving new best policy, reward=7.400! +[2023-10-08 12:38:04,412][102897] Updated weights for policy 0, policy_version 21540 (0.0008) +[2023-10-08 12:38:04,786][102897] Updated weights for policy 0, policy_version 21550 (0.0007) +[2023-10-08 12:38:05,138][102898] Updated weights for policy 1, policy_version 21570 (0.0008) +[2023-10-08 12:38:05,155][102897] Updated weights for policy 0, policy_version 21560 (0.0009) +[2023-10-08 12:38:05,501][102898] Updated weights for policy 1, policy_version 21580 (0.0009) +[2023-10-08 12:38:05,871][102898] Updated weights for policy 1, policy_version 21590 (0.0010) +[2023-10-08 12:38:06,236][102898] Updated weights for policy 1, policy_version 21600 (0.0008) +[2023-10-08 12:38:06,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 44204032. Throughput: 0: 1799.7, 1: 1793.6. Samples: 11052118. Policy #0 lag: (min: 10.0, avg: 10.5, max: 22.0) +[2023-10-08 12:38:06,876][101941] Avg episode reward: [(0, '6.850'), (1, '6.470')] +[2023-10-08 12:38:08,910][102897] Updated weights for policy 0, policy_version 21570 (0.0008) +[2023-10-08 12:38:09,276][102897] Updated weights for policy 0, policy_version 21580 (0.0008) +[2023-10-08 12:38:09,655][102897] Updated weights for policy 0, policy_version 21590 (0.0008) +[2023-10-08 12:38:10,027][102897] Updated weights for policy 0, policy_version 21600 (0.0008) +[2023-10-08 12:38:10,099][102898] Updated weights for policy 1, policy_version 21610 (0.0007) +[2023-10-08 12:38:10,466][102898] Updated weights for policy 1, policy_version 21620 (0.0009) +[2023-10-08 12:38:10,840][102898] Updated weights for policy 1, policy_version 21630 (0.0007) +[2023-10-08 12:38:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 44269568. Throughput: 0: 1769.0, 1: 1804.7. Samples: 11072354. Policy #0 lag: (min: 10.0, avg: 10.5, max: 22.0) +[2023-10-08 12:38:11,876][101941] Avg episode reward: [(0, '6.530'), (1, '6.360')] +[2023-10-08 12:38:13,938][102897] Updated weights for policy 0, policy_version 21610 (0.0008) +[2023-10-08 12:38:14,309][102897] Updated weights for policy 0, policy_version 21620 (0.0007) +[2023-10-08 12:38:14,594][102898] Updated weights for policy 1, policy_version 21640 (0.0007) +[2023-10-08 12:38:14,672][102897] Updated weights for policy 0, policy_version 21630 (0.0008) +[2023-10-08 12:38:14,971][102898] Updated weights for policy 1, policy_version 21650 (0.0010) +[2023-10-08 12:38:15,337][102898] Updated weights for policy 1, policy_version 21660 (0.0009) +[2023-10-08 12:38:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 44335104. Throughput: 0: 1770.0, 1: 1791.4. Samples: 11093764. Policy #0 lag: (min: 10.0, avg: 10.5, max: 22.0) +[2023-10-08 12:38:16,876][101941] Avg episode reward: [(0, '6.840'), (1, '5.830')] +[2023-10-08 12:38:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000021664_22183936.pth... +[2023-10-08 12:38:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000021632_22151168.pth... +[2023-10-08 12:38:16,919][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000020000_20480000.pth +[2023-10-08 12:38:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000019968_20447232.pth +[2023-10-08 12:38:18,436][102897] Updated weights for policy 0, policy_version 21640 (0.0009) +[2023-10-08 12:38:18,824][102897] Updated weights for policy 0, policy_version 21650 (0.0010) +[2023-10-08 12:38:18,942][102898] Updated weights for policy 1, policy_version 21670 (0.0009) +[2023-10-08 12:38:19,192][102897] Updated weights for policy 0, policy_version 21660 (0.0008) +[2023-10-08 12:38:19,298][102898] Updated weights for policy 1, policy_version 21680 (0.0008) +[2023-10-08 12:38:19,659][102898] Updated weights for policy 1, policy_version 21690 (0.0009) +[2023-10-08 12:38:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 44400640. Throughput: 0: 1771.3, 1: 1811.3. Samples: 11104386. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 12:38:21,876][101941] Avg episode reward: [(0, '6.650'), (1, '6.530')] +[2023-10-08 12:38:23,003][102897] Updated weights for policy 0, policy_version 21670 (0.0007) +[2023-10-08 12:38:23,276][102898] Updated weights for policy 1, policy_version 21700 (0.0010) +[2023-10-08 12:38:23,375][102897] Updated weights for policy 0, policy_version 21680 (0.0007) +[2023-10-08 12:38:23,639][102898] Updated weights for policy 1, policy_version 21710 (0.0007) +[2023-10-08 12:38:23,750][102897] Updated weights for policy 0, policy_version 21690 (0.0009) +[2023-10-08 12:38:24,009][102898] Updated weights for policy 1, policy_version 21720 (0.0007) +[2023-10-08 12:38:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 44466176. Throughput: 0: 1766.2, 1: 1801.5. Samples: 11126164. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 12:38:26,876][101941] Avg episode reward: [(0, '6.670'), (1, '7.310')] +[2023-10-08 12:38:27,517][102897] Updated weights for policy 0, policy_version 21700 (0.0009) +[2023-10-08 12:38:27,742][102898] Updated weights for policy 1, policy_version 21730 (0.0008) +[2023-10-08 12:38:27,898][102897] Updated weights for policy 0, policy_version 21710 (0.0009) +[2023-10-08 12:38:28,104][102898] Updated weights for policy 1, policy_version 21740 (0.0008) +[2023-10-08 12:38:28,266][102897] Updated weights for policy 0, policy_version 21720 (0.0008) +[2023-10-08 12:38:28,473][102898] Updated weights for policy 1, policy_version 21750 (0.0007) +[2023-10-08 12:38:28,841][102898] Updated weights for policy 1, policy_version 21760 (0.0008) +[2023-10-08 12:38:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 44531712. Throughput: 0: 1781.0, 1: 1799.7. Samples: 11148572. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 12:38:31,876][101941] Avg episode reward: [(0, '6.630'), (1, '7.280')] +[2023-10-08 12:38:32,117][102897] Updated weights for policy 0, policy_version 21730 (0.0008) +[2023-10-08 12:38:32,486][102897] Updated weights for policy 0, policy_version 21740 (0.0007) +[2023-10-08 12:38:32,702][102898] Updated weights for policy 1, policy_version 21770 (0.0008) +[2023-10-08 12:38:32,857][102897] Updated weights for policy 0, policy_version 21750 (0.0007) +[2023-10-08 12:38:33,074][102898] Updated weights for policy 1, policy_version 21780 (0.0008) +[2023-10-08 12:38:33,228][102897] Updated weights for policy 0, policy_version 21760 (0.0008) +[2023-10-08 12:38:33,441][102898] Updated weights for policy 1, policy_version 21790 (0.0008) +[2023-10-08 12:38:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 44597248. Throughput: 0: 1772.1, 1: 1799.3. Samples: 11158282. Policy #0 lag: (min: 28.0, avg: 36.0, max: 60.0) +[2023-10-08 12:38:36,876][101941] Avg episode reward: [(0, '6.540'), (1, '6.680')] +[2023-10-08 12:38:36,976][102897] Updated weights for policy 0, policy_version 21770 (0.0009) +[2023-10-08 12:38:37,289][102898] Updated weights for policy 1, policy_version 21800 (0.0007) +[2023-10-08 12:38:37,346][102897] Updated weights for policy 0, policy_version 21780 (0.0008) +[2023-10-08 12:38:37,666][102898] Updated weights for policy 1, policy_version 21810 (0.0007) +[2023-10-08 12:38:37,723][102897] Updated weights for policy 0, policy_version 21790 (0.0007) +[2023-10-08 12:38:38,029][102898] Updated weights for policy 1, policy_version 21820 (0.0007) +[2023-10-08 12:38:41,451][102897] Updated weights for policy 0, policy_version 21800 (0.0008) +[2023-10-08 12:38:41,716][102898] Updated weights for policy 1, policy_version 21830 (0.0008) +[2023-10-08 12:38:41,815][102897] Updated weights for policy 0, policy_version 21810 (0.0009) +[2023-10-08 12:38:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 44662784. Throughput: 0: 1774.4, 1: 1797.8. Samples: 11180610. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:38:41,876][101941] Avg episode reward: [(0, '6.450'), (1, '6.170')] +[2023-10-08 12:38:42,085][102898] Updated weights for policy 1, policy_version 21840 (0.0008) +[2023-10-08 12:38:42,191][102897] Updated weights for policy 0, policy_version 21820 (0.0008) +[2023-10-08 12:38:42,448][102898] Updated weights for policy 1, policy_version 21850 (0.0009) +[2023-10-08 12:38:45,999][102897] Updated weights for policy 0, policy_version 21830 (0.0008) +[2023-10-08 12:38:46,124][102898] Updated weights for policy 1, policy_version 21860 (0.0008) +[2023-10-08 12:38:46,362][102897] Updated weights for policy 0, policy_version 21840 (0.0009) +[2023-10-08 12:38:46,500][102898] Updated weights for policy 1, policy_version 21870 (0.0008) +[2023-10-08 12:38:46,738][102897] Updated weights for policy 0, policy_version 21850 (0.0007) +[2023-10-08 12:38:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 44728320. Throughput: 0: 1788.3, 1: 1811.8. Samples: 11201814. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:38:46,876][102898] Updated weights for policy 1, policy_version 21880 (0.0008) +[2023-10-08 12:38:46,876][101941] Avg episode reward: [(0, '6.020'), (1, '6.280')] +[2023-10-08 12:38:50,437][102897] Updated weights for policy 0, policy_version 21860 (0.0008) +[2023-10-08 12:38:50,504][102898] Updated weights for policy 1, policy_version 21890 (0.0008) +[2023-10-08 12:38:50,812][102897] Updated weights for policy 0, policy_version 21870 (0.0009) +[2023-10-08 12:38:50,870][102898] Updated weights for policy 1, policy_version 21900 (0.0009) +[2023-10-08 12:38:51,177][102897] Updated weights for policy 0, policy_version 21880 (0.0009) +[2023-10-08 12:38:51,239][102898] Updated weights for policy 1, policy_version 21910 (0.0009) +[2023-10-08 12:38:51,602][102898] Updated weights for policy 1, policy_version 21920 (0.0008) +[2023-10-08 12:38:51,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 44859392. Throughput: 0: 1773.0, 1: 1801.8. Samples: 11212986. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:38:51,876][101941] Avg episode reward: [(0, '5.930'), (1, '6.740')] +[2023-10-08 12:38:54,998][102897] Updated weights for policy 0, policy_version 21890 (0.0008) +[2023-10-08 12:38:55,373][102897] Updated weights for policy 0, policy_version 21900 (0.0007) +[2023-10-08 12:38:55,456][102898] Updated weights for policy 1, policy_version 21930 (0.0008) +[2023-10-08 12:38:55,734][102897] Updated weights for policy 0, policy_version 21910 (0.0008) +[2023-10-08 12:38:55,827][102898] Updated weights for policy 1, policy_version 21940 (0.0008) +[2023-10-08 12:38:56,106][102897] Updated weights for policy 0, policy_version 21920 (0.0007) +[2023-10-08 12:38:56,191][102898] Updated weights for policy 1, policy_version 21950 (0.0007) +[2023-10-08 12:38:56,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 44924928. Throughput: 0: 1789.0, 1: 1804.3. Samples: 11234052. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:38:56,876][101941] Avg episode reward: [(0, '5.960'), (1, '6.600')] +[2023-10-08 12:39:00,022][102897] Updated weights for policy 0, policy_version 21930 (0.0008) +[2023-10-08 12:39:00,136][102898] Updated weights for policy 1, policy_version 21960 (0.0007) +[2023-10-08 12:39:00,395][102897] Updated weights for policy 0, policy_version 21940 (0.0007) +[2023-10-08 12:39:00,515][102898] Updated weights for policy 1, policy_version 21970 (0.0008) +[2023-10-08 12:39:00,771][102897] Updated weights for policy 0, policy_version 21950 (0.0007) +[2023-10-08 12:39:00,886][102898] Updated weights for policy 1, policy_version 21980 (0.0008) +[2023-10-08 12:39:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 44990464. Throughput: 0: 1772.3, 1: 1791.2. Samples: 11254122. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:39:01,876][101941] Avg episode reward: [(0, '5.850'), (1, '6.660')] +[2023-10-08 12:39:04,366][102897] Updated weights for policy 0, policy_version 21960 (0.0008) +[2023-10-08 12:39:04,558][102898] Updated weights for policy 1, policy_version 21990 (0.0009) +[2023-10-08 12:39:04,723][102897] Updated weights for policy 0, policy_version 21970 (0.0008) +[2023-10-08 12:39:04,924][102898] Updated weights for policy 1, policy_version 22000 (0.0008) +[2023-10-08 12:39:05,094][102897] Updated weights for policy 0, policy_version 21980 (0.0009) +[2023-10-08 12:39:05,284][102898] Updated weights for policy 1, policy_version 22010 (0.0008) +[2023-10-08 12:39:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 45056000. Throughput: 0: 1799.3, 1: 1800.4. Samples: 11266372. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:39:06,876][101941] Avg episode reward: [(0, '5.670'), (1, '6.640')] +[2023-10-08 12:39:08,996][102897] Updated weights for policy 0, policy_version 21990 (0.0007) +[2023-10-08 12:39:09,158][102898] Updated weights for policy 1, policy_version 22020 (0.0009) +[2023-10-08 12:39:09,374][102897] Updated weights for policy 0, policy_version 22000 (0.0007) +[2023-10-08 12:39:09,523][102898] Updated weights for policy 1, policy_version 22030 (0.0009) +[2023-10-08 12:39:09,741][102897] Updated weights for policy 0, policy_version 22010 (0.0009) +[2023-10-08 12:39:09,887][102898] Updated weights for policy 1, policy_version 22040 (0.0007) +[2023-10-08 12:39:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 45121536. Throughput: 0: 1777.2, 1: 1778.9. Samples: 11286186. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:39:11,875][101941] Avg episode reward: [(0, '6.290'), (1, '6.460')] +[2023-10-08 12:39:13,435][102897] Updated weights for policy 0, policy_version 22020 (0.0007) +[2023-10-08 12:39:13,435][102898] Updated weights for policy 1, policy_version 22050 (0.0009) +[2023-10-08 12:39:13,798][102897] Updated weights for policy 0, policy_version 22030 (0.0009) +[2023-10-08 12:39:13,798][102898] Updated weights for policy 1, policy_version 22060 (0.0007) +[2023-10-08 12:39:14,160][102898] Updated weights for policy 1, policy_version 22070 (0.0008) +[2023-10-08 12:39:14,173][102897] Updated weights for policy 0, policy_version 22040 (0.0008) +[2023-10-08 12:39:14,524][102898] Updated weights for policy 1, policy_version 22080 (0.0009) +[2023-10-08 12:39:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 45187072. Throughput: 0: 1778.6, 1: 1779.5. Samples: 11308684. Policy #0 lag: (min: 21.0, avg: 26.0, max: 53.0) +[2023-10-08 12:39:16,875][101941] Avg episode reward: [(0, '6.460'), (1, '7.390')] +[2023-10-08 12:39:17,795][102897] Updated weights for policy 0, policy_version 22050 (0.0008) +[2023-10-08 12:39:18,160][102897] Updated weights for policy 0, policy_version 22060 (0.0007) +[2023-10-08 12:39:18,412][102898] Updated weights for policy 1, policy_version 22090 (0.0008) +[2023-10-08 12:39:18,534][102897] Updated weights for policy 0, policy_version 22070 (0.0008) +[2023-10-08 12:39:18,779][102898] Updated weights for policy 1, policy_version 22100 (0.0007) +[2023-10-08 12:39:18,895][102897] Updated weights for policy 0, policy_version 22080 (0.0010) +[2023-10-08 12:39:19,137][102898] Updated weights for policy 1, policy_version 22110 (0.0008) +[2023-10-08 12:39:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 45252608. Throughput: 0: 1784.3, 1: 1781.8. Samples: 11318756. Policy #0 lag: (min: 21.0, avg: 26.0, max: 53.0) +[2023-10-08 12:39:21,876][101941] Avg episode reward: [(0, '6.860'), (1, '6.860')] +[2023-10-08 12:39:22,549][102897] Updated weights for policy 0, policy_version 22090 (0.0007) +[2023-10-08 12:39:22,923][102897] Updated weights for policy 0, policy_version 22100 (0.0007) +[2023-10-08 12:39:22,931][102898] Updated weights for policy 1, policy_version 22120 (0.0009) +[2023-10-08 12:39:23,281][102897] Updated weights for policy 0, policy_version 22110 (0.0008) +[2023-10-08 12:39:23,293][102898] Updated weights for policy 1, policy_version 22130 (0.0008) +[2023-10-08 12:39:23,666][102898] Updated weights for policy 1, policy_version 22140 (0.0010) +[2023-10-08 12:39:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 45318144. Throughput: 0: 1789.6, 1: 1772.7. Samples: 11340912. Policy #0 lag: (min: 21.0, avg: 26.0, max: 53.0) +[2023-10-08 12:39:26,875][101941] Avg episode reward: [(0, '6.830'), (1, '7.030')] +[2023-10-08 12:39:26,969][102897] Updated weights for policy 0, policy_version 22120 (0.0007) +[2023-10-08 12:39:27,334][102897] Updated weights for policy 0, policy_version 22130 (0.0007) +[2023-10-08 12:39:27,619][102898] Updated weights for policy 1, policy_version 22150 (0.0008) +[2023-10-08 12:39:27,700][102897] Updated weights for policy 0, policy_version 22140 (0.0007) +[2023-10-08 12:39:27,990][102898] Updated weights for policy 1, policy_version 22160 (0.0007) +[2023-10-08 12:39:28,351][102898] Updated weights for policy 1, policy_version 22170 (0.0008) +[2023-10-08 12:39:31,415][102897] Updated weights for policy 0, policy_version 22150 (0.0009) +[2023-10-08 12:39:31,792][102897] Updated weights for policy 0, policy_version 22160 (0.0008) +[2023-10-08 12:39:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 45383680. Throughput: 0: 1807.2, 1: 1777.4. Samples: 11363124. Policy #0 lag: (min: 21.0, avg: 26.0, max: 53.0) +[2023-10-08 12:39:31,875][101941] Avg episode reward: [(0, '6.200'), (1, '6.930')] +[2023-10-08 12:39:32,165][102897] Updated weights for policy 0, policy_version 22170 (0.0008) +[2023-10-08 12:39:32,178][102898] Updated weights for policy 1, policy_version 22180 (0.0008) +[2023-10-08 12:39:32,545][102898] Updated weights for policy 1, policy_version 22190 (0.0010) +[2023-10-08 12:39:32,918][102898] Updated weights for policy 1, policy_version 22200 (0.0008) +[2023-10-08 12:39:35,936][102897] Updated weights for policy 0, policy_version 22180 (0.0010) +[2023-10-08 12:39:36,300][102897] Updated weights for policy 0, policy_version 22190 (0.0010) +[2023-10-08 12:39:36,554][102898] Updated weights for policy 1, policy_version 22210 (0.0009) +[2023-10-08 12:39:36,676][102897] Updated weights for policy 0, policy_version 22200 (0.0009) +[2023-10-08 12:39:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 45449216. Throughput: 0: 1798.2, 1: 1761.5. Samples: 11373172. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:39:36,876][101941] Avg episode reward: [(0, '6.340'), (1, '6.520')] +[2023-10-08 12:39:36,926][102898] Updated weights for policy 1, policy_version 22220 (0.0008) +[2023-10-08 12:39:37,287][102898] Updated weights for policy 1, policy_version 22230 (0.0008) +[2023-10-08 12:39:37,654][102898] Updated weights for policy 1, policy_version 22240 (0.0009) +[2023-10-08 12:39:40,549][102897] Updated weights for policy 0, policy_version 22210 (0.0010) +[2023-10-08 12:39:40,915][102897] Updated weights for policy 0, policy_version 22220 (0.0007) +[2023-10-08 12:39:41,288][102897] Updated weights for policy 0, policy_version 22230 (0.0008) +[2023-10-08 12:39:41,533][102898] Updated weights for policy 1, policy_version 22250 (0.0009) +[2023-10-08 12:39:41,655][102897] Updated weights for policy 0, policy_version 22240 (0.0009) +[2023-10-08 12:39:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 45547520. Throughput: 0: 1807.6, 1: 1776.8. Samples: 11395348. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:39:41,875][101941] Avg episode reward: [(0, '6.480'), (1, '6.820')] +[2023-10-08 12:39:41,903][102898] Updated weights for policy 1, policy_version 22260 (0.0010) +[2023-10-08 12:39:42,272][102898] Updated weights for policy 1, policy_version 22270 (0.0011) +[2023-10-08 12:39:45,657][102897] Updated weights for policy 0, policy_version 22250 (0.0011) +[2023-10-08 12:39:46,036][102897] Updated weights for policy 0, policy_version 22260 (0.0010) +[2023-10-08 12:39:46,188][102898] Updated weights for policy 1, policy_version 22280 (0.0008) +[2023-10-08 12:39:46,395][102897] Updated weights for policy 0, policy_version 22270 (0.0007) +[2023-10-08 12:39:46,563][102898] Updated weights for policy 1, policy_version 22290 (0.0007) +[2023-10-08 12:39:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 45613056. Throughput: 0: 1794.6, 1: 1785.9. Samples: 11415246. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:39:46,876][101941] Avg episode reward: [(0, '6.520'), (1, '6.460')] +[2023-10-08 12:39:46,937][102898] Updated weights for policy 1, policy_version 22300 (0.0010) +[2023-10-08 12:39:50,154][102897] Updated weights for policy 0, policy_version 22280 (0.0008) +[2023-10-08 12:39:50,514][102897] Updated weights for policy 0, policy_version 22290 (0.0008) +[2023-10-08 12:39:50,682][102898] Updated weights for policy 1, policy_version 22310 (0.0009) +[2023-10-08 12:39:50,887][102897] Updated weights for policy 0, policy_version 22300 (0.0008) +[2023-10-08 12:39:51,045][102898] Updated weights for policy 1, policy_version 22320 (0.0008) +[2023-10-08 12:39:51,415][102898] Updated weights for policy 1, policy_version 22330 (0.0007) +[2023-10-08 12:39:51,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 45711360. Throughput: 0: 1798.0, 1: 1769.1. Samples: 11426894. Policy #0 lag: (min: 31.0, avg: 32.3, max: 57.0) +[2023-10-08 12:39:51,876][101941] Avg episode reward: [(0, '6.230'), (1, '6.650')] +[2023-10-08 12:39:54,492][102897] Updated weights for policy 0, policy_version 22310 (0.0007) +[2023-10-08 12:39:54,858][102897] Updated weights for policy 0, policy_version 22320 (0.0008) +[2023-10-08 12:39:55,147][102898] Updated weights for policy 1, policy_version 22340 (0.0008) +[2023-10-08 12:39:55,230][102897] Updated weights for policy 0, policy_version 22330 (0.0008) +[2023-10-08 12:39:55,520][102898] Updated weights for policy 1, policy_version 22350 (0.0008) +[2023-10-08 12:39:55,892][102898] Updated weights for policy 1, policy_version 22360 (0.0008) +[2023-10-08 12:39:56,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 45776896. Throughput: 0: 1795.1, 1: 1791.3. Samples: 11447572. Policy #0 lag: (min: 31.0, avg: 32.3, max: 57.0) +[2023-10-08 12:39:56,876][101941] Avg episode reward: [(0, '6.680'), (1, '6.890')] +[2023-10-08 12:39:58,980][102897] Updated weights for policy 0, policy_version 22340 (0.0010) +[2023-10-08 12:39:59,352][102897] Updated weights for policy 0, policy_version 22350 (0.0009) +[2023-10-08 12:39:59,718][102897] Updated weights for policy 0, policy_version 22360 (0.0007) +[2023-10-08 12:39:59,784][102898] Updated weights for policy 1, policy_version 22370 (0.0009) +[2023-10-08 12:40:00,159][102898] Updated weights for policy 1, policy_version 22380 (0.0009) +[2023-10-08 12:40:00,530][102898] Updated weights for policy 1, policy_version 22390 (0.0009) +[2023-10-08 12:40:00,900][102898] Updated weights for policy 1, policy_version 22400 (0.0008) +[2023-10-08 12:40:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 45842432. Throughput: 0: 1787.4, 1: 1767.1. Samples: 11468634. Policy #0 lag: (min: 31.0, avg: 32.3, max: 57.0) +[2023-10-08 12:40:01,876][101941] Avg episode reward: [(0, '6.930'), (1, '6.800')] +[2023-10-08 12:40:03,547][102897] Updated weights for policy 0, policy_version 22370 (0.0010) +[2023-10-08 12:40:03,912][102897] Updated weights for policy 0, policy_version 22380 (0.0009) +[2023-10-08 12:40:04,300][102897] Updated weights for policy 0, policy_version 22390 (0.0008) +[2023-10-08 12:40:04,665][102897] Updated weights for policy 0, policy_version 22400 (0.0007) +[2023-10-08 12:40:04,682][102898] Updated weights for policy 1, policy_version 22410 (0.0007) +[2023-10-08 12:40:05,055][102898] Updated weights for policy 1, policy_version 22420 (0.0007) +[2023-10-08 12:40:05,425][102898] Updated weights for policy 1, policy_version 22430 (0.0008) +[2023-10-08 12:40:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 45907968. Throughput: 0: 1790.5, 1: 1791.0. Samples: 11479924. Policy #0 lag: (min: 31.0, avg: 32.3, max: 57.0) +[2023-10-08 12:40:06,875][101941] Avg episode reward: [(0, '6.350'), (1, '7.110')] +[2023-10-08 12:40:08,451][102897] Updated weights for policy 0, policy_version 22410 (0.0008) +[2023-10-08 12:40:08,825][102897] Updated weights for policy 0, policy_version 22420 (0.0008) +[2023-10-08 12:40:09,177][102898] Updated weights for policy 1, policy_version 22440 (0.0009) +[2023-10-08 12:40:09,198][102897] Updated weights for policy 0, policy_version 22430 (0.0008) +[2023-10-08 12:40:09,543][102898] Updated weights for policy 1, policy_version 22450 (0.0010) +[2023-10-08 12:40:09,912][102898] Updated weights for policy 1, policy_version 22460 (0.0009) +[2023-10-08 12:40:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 45973504. Throughput: 0: 1779.2, 1: 1765.4. Samples: 11500422. Policy #0 lag: (min: 23.0, avg: 27.9, max: 55.0) +[2023-10-08 12:40:11,876][101941] Avg episode reward: [(0, '5.780'), (1, '6.770')] +[2023-10-08 12:40:12,937][102897] Updated weights for policy 0, policy_version 22440 (0.0009) +[2023-10-08 12:40:13,304][102897] Updated weights for policy 0, policy_version 22450 (0.0011) +[2023-10-08 12:40:13,677][102897] Updated weights for policy 0, policy_version 22460 (0.0007) +[2023-10-08 12:40:13,782][102898] Updated weights for policy 1, policy_version 22470 (0.0009) +[2023-10-08 12:40:14,154][102898] Updated weights for policy 1, policy_version 22480 (0.0008) +[2023-10-08 12:40:14,524][102898] Updated weights for policy 1, policy_version 22490 (0.0007) +[2023-10-08 12:40:16,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 46039040. Throughput: 0: 1777.9, 1: 1766.7. Samples: 11522632. Policy #0 lag: (min: 23.0, avg: 27.9, max: 55.0) +[2023-10-08 12:40:16,876][101941] Avg episode reward: [(0, '5.900'), (1, '7.070')] +[2023-10-08 12:40:16,888][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000022496_23035904.pth... +[2023-10-08 12:40:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000022464_23003136.pth... +[2023-10-08 12:40:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000020832_21331968.pth +[2023-10-08 12:40:16,928][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000020800_21299200.pth +[2023-10-08 12:40:17,417][102897] Updated weights for policy 0, policy_version 22470 (0.0011) +[2023-10-08 12:40:17,790][102897] Updated weights for policy 0, policy_version 22480 (0.0008) +[2023-10-08 12:40:18,164][102897] Updated weights for policy 0, policy_version 22490 (0.0010) +[2023-10-08 12:40:18,318][102898] Updated weights for policy 1, policy_version 22500 (0.0007) +[2023-10-08 12:40:18,688][102898] Updated weights for policy 1, policy_version 22510 (0.0007) +[2023-10-08 12:40:19,057][102898] Updated weights for policy 1, policy_version 22520 (0.0007) +[2023-10-08 12:40:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46104576. Throughput: 0: 1770.9, 1: 1769.3. Samples: 11532484. Policy #0 lag: (min: 23.0, avg: 27.9, max: 55.0) +[2023-10-08 12:40:21,876][101941] Avg episode reward: [(0, '6.350'), (1, '7.070')] +[2023-10-08 12:40:21,948][102897] Updated weights for policy 0, policy_version 22500 (0.0009) +[2023-10-08 12:40:22,318][102897] Updated weights for policy 0, policy_version 22510 (0.0009) +[2023-10-08 12:40:22,692][102897] Updated weights for policy 0, policy_version 22520 (0.0010) +[2023-10-08 12:40:22,851][102898] Updated weights for policy 1, policy_version 22530 (0.0007) +[2023-10-08 12:40:23,216][102898] Updated weights for policy 1, policy_version 22540 (0.0010) +[2023-10-08 12:40:23,587][102898] Updated weights for policy 1, policy_version 22550 (0.0010) +[2023-10-08 12:40:23,957][102898] Updated weights for policy 1, policy_version 22560 (0.0008) +[2023-10-08 12:40:26,632][102897] Updated weights for policy 0, policy_version 22530 (0.0008) +[2023-10-08 12:40:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46170112. Throughput: 0: 1772.1, 1: 1764.8. Samples: 11554512. Policy #0 lag: (min: 23.0, avg: 27.9, max: 55.0) +[2023-10-08 12:40:26,875][101941] Avg episode reward: [(0, '6.270'), (1, '6.680')] +[2023-10-08 12:40:27,015][102897] Updated weights for policy 0, policy_version 22540 (0.0008) +[2023-10-08 12:40:27,391][102897] Updated weights for policy 0, policy_version 22550 (0.0007) +[2023-10-08 12:40:27,762][102897] Updated weights for policy 0, policy_version 22560 (0.0007) +[2023-10-08 12:40:27,795][102898] Updated weights for policy 1, policy_version 22570 (0.0008) +[2023-10-08 12:40:28,163][102898] Updated weights for policy 1, policy_version 22580 (0.0010) +[2023-10-08 12:40:28,536][102898] Updated weights for policy 1, policy_version 22590 (0.0011) +[2023-10-08 12:40:31,587][102897] Updated weights for policy 0, policy_version 22570 (0.0007) +[2023-10-08 12:40:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46235648. Throughput: 0: 1801.6, 1: 1785.2. Samples: 11576650. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:40:31,876][101941] Avg episode reward: [(0, '5.920'), (1, '6.850')] +[2023-10-08 12:40:31,953][102897] Updated weights for policy 0, policy_version 22580 (0.0008) +[2023-10-08 12:40:32,322][102897] Updated weights for policy 0, policy_version 22590 (0.0008) +[2023-10-08 12:40:32,419][102898] Updated weights for policy 1, policy_version 22600 (0.0008) +[2023-10-08 12:40:32,782][102898] Updated weights for policy 1, policy_version 22610 (0.0009) +[2023-10-08 12:40:33,148][102898] Updated weights for policy 1, policy_version 22620 (0.0009) +[2023-10-08 12:40:36,224][102897] Updated weights for policy 0, policy_version 22600 (0.0009) +[2023-10-08 12:40:36,593][102897] Updated weights for policy 0, policy_version 22610 (0.0008) +[2023-10-08 12:40:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46301184. Throughput: 0: 1774.2, 1: 1768.4. Samples: 11586310. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:40:36,875][101941] Avg episode reward: [(0, '6.480'), (1, '7.040')] +[2023-10-08 12:40:36,911][102898] Updated weights for policy 1, policy_version 22630 (0.0009) +[2023-10-08 12:40:36,958][102897] Updated weights for policy 0, policy_version 22620 (0.0008) +[2023-10-08 12:40:37,283][102898] Updated weights for policy 1, policy_version 22640 (0.0007) +[2023-10-08 12:40:37,657][102898] Updated weights for policy 1, policy_version 22650 (0.0007) +[2023-10-08 12:40:40,647][102897] Updated weights for policy 0, policy_version 22630 (0.0008) +[2023-10-08 12:40:41,020][102897] Updated weights for policy 0, policy_version 22640 (0.0007) +[2023-10-08 12:40:41,351][102898] Updated weights for policy 1, policy_version 22660 (0.0008) +[2023-10-08 12:40:41,398][102897] Updated weights for policy 0, policy_version 22650 (0.0008) +[2023-10-08 12:40:41,716][102898] Updated weights for policy 1, policy_version 22670 (0.0008) +[2023-10-08 12:40:41,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 46399488. Throughput: 0: 1801.7, 1: 1780.3. Samples: 11608764. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:40:41,876][101941] Avg episode reward: [(0, '6.770'), (1, '6.860')] +[2023-10-08 12:40:42,081][102898] Updated weights for policy 1, policy_version 22680 (0.0008) +[2023-10-08 12:40:45,187][102897] Updated weights for policy 0, policy_version 22660 (0.0008) +[2023-10-08 12:40:45,557][102897] Updated weights for policy 0, policy_version 22670 (0.0008) +[2023-10-08 12:40:45,891][102898] Updated weights for policy 1, policy_version 22690 (0.0008) +[2023-10-08 12:40:45,930][102897] Updated weights for policy 0, policy_version 22680 (0.0007) +[2023-10-08 12:40:46,267][102898] Updated weights for policy 1, policy_version 22700 (0.0008) +[2023-10-08 12:40:46,628][102898] Updated weights for policy 1, policy_version 22710 (0.0008) +[2023-10-08 12:40:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 46465024. Throughput: 0: 1770.9, 1: 1787.6. Samples: 11628766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:40:46,875][101941] Avg episode reward: [(0, '6.190'), (1, '6.670')] +[2023-10-08 12:40:46,997][102898] Updated weights for policy 1, policy_version 22720 (0.0008) +[2023-10-08 12:40:49,636][102897] Updated weights for policy 0, policy_version 22690 (0.0008) +[2023-10-08 12:40:50,017][102897] Updated weights for policy 0, policy_version 22700 (0.0007) +[2023-10-08 12:40:50,379][102897] Updated weights for policy 0, policy_version 22710 (0.0008) +[2023-10-08 12:40:50,725][102898] Updated weights for policy 1, policy_version 22730 (0.0008) +[2023-10-08 12:40:50,754][102897] Updated weights for policy 0, policy_version 22720 (0.0008) +[2023-10-08 12:40:51,108][102898] Updated weights for policy 1, policy_version 22740 (0.0007) +[2023-10-08 12:40:51,465][102898] Updated weights for policy 1, policy_version 22750 (0.0008) +[2023-10-08 12:40:51,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 46563328. Throughput: 0: 1796.3, 1: 1780.7. Samples: 11640888. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:40:51,875][101941] Avg episode reward: [(0, '5.870'), (1, '6.810')] +[2023-10-08 12:40:54,430][102897] Updated weights for policy 0, policy_version 22730 (0.0008) +[2023-10-08 12:40:54,803][102897] Updated weights for policy 0, policy_version 22740 (0.0009) +[2023-10-08 12:40:55,187][102897] Updated weights for policy 0, policy_version 22750 (0.0008) +[2023-10-08 12:40:55,313][102898] Updated weights for policy 1, policy_version 22760 (0.0009) +[2023-10-08 12:40:55,681][102898] Updated weights for policy 1, policy_version 22770 (0.0009) +[2023-10-08 12:40:56,044][102898] Updated weights for policy 1, policy_version 22780 (0.0008) +[2023-10-08 12:40:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 46628864. Throughput: 0: 1776.4, 1: 1799.8. Samples: 11661350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:40:56,876][101941] Avg episode reward: [(0, '6.660'), (1, '6.200')] +[2023-10-08 12:40:58,787][102897] Updated weights for policy 0, policy_version 22760 (0.0008) +[2023-10-08 12:40:59,167][102897] Updated weights for policy 0, policy_version 22770 (0.0007) +[2023-10-08 12:40:59,539][102897] Updated weights for policy 0, policy_version 22780 (0.0007) +[2023-10-08 12:40:59,635][102898] Updated weights for policy 1, policy_version 22790 (0.0009) +[2023-10-08 12:40:59,998][102898] Updated weights for policy 1, policy_version 22800 (0.0007) +[2023-10-08 12:41:00,368][102898] Updated weights for policy 1, policy_version 22810 (0.0008) +[2023-10-08 12:41:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 46694400. Throughput: 0: 1784.5, 1: 1787.2. Samples: 11683358. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:41:01,875][101941] Avg episode reward: [(0, '6.490'), (1, '7.080')] +[2023-10-08 12:41:03,269][102897] Updated weights for policy 0, policy_version 22790 (0.0007) +[2023-10-08 12:41:03,644][102897] Updated weights for policy 0, policy_version 22800 (0.0007) +[2023-10-08 12:41:04,010][102898] Updated weights for policy 1, policy_version 22820 (0.0008) +[2023-10-08 12:41:04,021][102897] Updated weights for policy 0, policy_version 22810 (0.0007) +[2023-10-08 12:41:04,370][102898] Updated weights for policy 1, policy_version 22830 (0.0008) +[2023-10-08 12:41:04,740][102898] Updated weights for policy 1, policy_version 22840 (0.0009) +[2023-10-08 12:41:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46759936. Throughput: 0: 1782.2, 1: 1803.3. Samples: 11693832. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:41:06,876][101941] Avg episode reward: [(0, '6.520'), (1, '7.330')] +[2023-10-08 12:41:07,603][102897] Updated weights for policy 0, policy_version 22820 (0.0008) +[2023-10-08 12:41:07,971][102897] Updated weights for policy 0, policy_version 22830 (0.0009) +[2023-10-08 12:41:08,343][102897] Updated weights for policy 0, policy_version 22840 (0.0008) +[2023-10-08 12:41:08,486][102898] Updated weights for policy 1, policy_version 22850 (0.0008) +[2023-10-08 12:41:08,849][102898] Updated weights for policy 1, policy_version 22860 (0.0008) +[2023-10-08 12:41:09,220][102898] Updated weights for policy 1, policy_version 22870 (0.0009) +[2023-10-08 12:41:09,582][102898] Updated weights for policy 1, policy_version 22880 (0.0009) +[2023-10-08 12:41:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46825472. Throughput: 0: 1787.8, 1: 1787.1. Samples: 11715382. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:41:11,876][101941] Avg episode reward: [(0, '6.380'), (1, '6.910')] +[2023-10-08 12:41:12,279][102897] Updated weights for policy 0, policy_version 22850 (0.0009) +[2023-10-08 12:41:12,661][102897] Updated weights for policy 0, policy_version 22860 (0.0008) +[2023-10-08 12:41:13,024][102897] Updated weights for policy 0, policy_version 22870 (0.0007) +[2023-10-08 12:41:13,386][102898] Updated weights for policy 1, policy_version 22890 (0.0007) +[2023-10-08 12:41:13,397][102897] Updated weights for policy 0, policy_version 22880 (0.0010) +[2023-10-08 12:41:13,750][102898] Updated weights for policy 1, policy_version 22900 (0.0009) +[2023-10-08 12:41:14,120][102898] Updated weights for policy 1, policy_version 22910 (0.0008) +[2023-10-08 12:41:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 46891008. Throughput: 0: 1796.3, 1: 1784.4. Samples: 11737782. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:41:16,875][101941] Avg episode reward: [(0, '6.460'), (1, '6.520')] +[2023-10-08 12:41:17,204][102897] Updated weights for policy 0, policy_version 22890 (0.0008) +[2023-10-08 12:41:17,576][102897] Updated weights for policy 0, policy_version 22900 (0.0008) +[2023-10-08 12:41:17,936][102898] Updated weights for policy 1, policy_version 22920 (0.0007) +[2023-10-08 12:41:17,943][102897] Updated weights for policy 0, policy_version 22910 (0.0008) +[2023-10-08 12:41:18,309][102898] Updated weights for policy 1, policy_version 22930 (0.0007) +[2023-10-08 12:41:18,675][102898] Updated weights for policy 1, policy_version 22940 (0.0008) +[2023-10-08 12:41:21,785][102897] Updated weights for policy 0, policy_version 22920 (0.0007) +[2023-10-08 12:41:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 46956544. Throughput: 0: 1792.8, 1: 1786.0. Samples: 11747358. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:41:21,876][101941] Avg episode reward: [(0, '6.840'), (1, '6.790')] +[2023-10-08 12:41:22,163][102897] Updated weights for policy 0, policy_version 22930 (0.0007) +[2023-10-08 12:41:22,542][102897] Updated weights for policy 0, policy_version 22940 (0.0007) +[2023-10-08 12:41:22,642][102898] Updated weights for policy 1, policy_version 22950 (0.0008) +[2023-10-08 12:41:23,017][102898] Updated weights for policy 1, policy_version 22960 (0.0009) +[2023-10-08 12:41:23,390][102898] Updated weights for policy 1, policy_version 22970 (0.0008) +[2023-10-08 12:41:26,278][102897] Updated weights for policy 0, policy_version 22950 (0.0008) +[2023-10-08 12:41:26,663][102897] Updated weights for policy 0, policy_version 22960 (0.0008) +[2023-10-08 12:41:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 47022080. Throughput: 0: 1788.6, 1: 1779.1. Samples: 11769310. Policy #0 lag: (min: 13.0, avg: 13.5, max: 27.0) +[2023-10-08 12:41:26,875][101941] Avg episode reward: [(0, '6.460'), (1, '7.100')] +[2023-10-08 12:41:27,033][102897] Updated weights for policy 0, policy_version 22970 (0.0008) +[2023-10-08 12:41:27,256][102898] Updated weights for policy 1, policy_version 22980 (0.0009) +[2023-10-08 12:41:27,622][102898] Updated weights for policy 1, policy_version 22990 (0.0008) +[2023-10-08 12:41:27,989][102898] Updated weights for policy 1, policy_version 23000 (0.0007) +[2023-10-08 12:41:30,885][102897] Updated weights for policy 0, policy_version 22980 (0.0008) +[2023-10-08 12:41:31,252][102897] Updated weights for policy 0, policy_version 22990 (0.0008) +[2023-10-08 12:41:31,620][102897] Updated weights for policy 0, policy_version 23000 (0.0008) +[2023-10-08 12:41:31,693][102898] Updated weights for policy 1, policy_version 23010 (0.0007) +[2023-10-08 12:41:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 47087616. Throughput: 0: 1800.0, 1: 1796.9. Samples: 11790626. Policy #0 lag: (min: 13.0, avg: 13.5, max: 27.0) +[2023-10-08 12:41:31,876][101941] Avg episode reward: [(0, '6.450'), (1, '6.280')] +[2023-10-08 12:41:32,059][102898] Updated weights for policy 1, policy_version 23020 (0.0007) +[2023-10-08 12:41:32,437][102898] Updated weights for policy 1, policy_version 23030 (0.0008) +[2023-10-08 12:41:32,804][102898] Updated weights for policy 1, policy_version 23040 (0.0008) +[2023-10-08 12:41:35,243][102897] Updated weights for policy 0, policy_version 23010 (0.0010) +[2023-10-08 12:41:35,604][102897] Updated weights for policy 0, policy_version 23020 (0.0008) +[2023-10-08 12:41:35,980][102897] Updated weights for policy 0, policy_version 23030 (0.0009) +[2023-10-08 12:41:36,353][102897] Updated weights for policy 0, policy_version 23040 (0.0009) +[2023-10-08 12:41:36,728][102898] Updated weights for policy 1, policy_version 23050 (0.0007) +[2023-10-08 12:41:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 47185920. Throughput: 0: 1788.7, 1: 1773.5. Samples: 11801186. Policy #0 lag: (min: 13.0, avg: 13.5, max: 27.0) +[2023-10-08 12:41:36,876][101941] Avg episode reward: [(0, '6.610'), (1, '6.130')] +[2023-10-08 12:41:37,099][102898] Updated weights for policy 1, policy_version 23060 (0.0007) +[2023-10-08 12:41:37,468][102898] Updated weights for policy 1, policy_version 23070 (0.0007) +[2023-10-08 12:41:40,170][102897] Updated weights for policy 0, policy_version 23050 (0.0010) +[2023-10-08 12:41:40,536][102897] Updated weights for policy 0, policy_version 23060 (0.0010) +[2023-10-08 12:41:40,915][102897] Updated weights for policy 0, policy_version 23070 (0.0008) +[2023-10-08 12:41:41,321][102898] Updated weights for policy 1, policy_version 23080 (0.0010) +[2023-10-08 12:41:41,691][102898] Updated weights for policy 1, policy_version 23090 (0.0009) +[2023-10-08 12:41:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 47251456. Throughput: 0: 1802.2, 1: 1787.7. Samples: 11822894. Policy #0 lag: (min: 31.0, avg: 31.0, max: 34.0) +[2023-10-08 12:41:41,876][101941] Avg episode reward: [(0, '6.650'), (1, '6.820')] +[2023-10-08 12:41:42,058][102898] Updated weights for policy 1, policy_version 23100 (0.0008) +[2023-10-08 12:41:44,551][102897] Updated weights for policy 0, policy_version 23080 (0.0010) +[2023-10-08 12:41:44,921][102897] Updated weights for policy 0, policy_version 23090 (0.0007) +[2023-10-08 12:41:45,291][102897] Updated weights for policy 0, policy_version 23100 (0.0007) +[2023-10-08 12:41:45,623][102898] Updated weights for policy 1, policy_version 23110 (0.0010) +[2023-10-08 12:41:45,990][102898] Updated weights for policy 1, policy_version 23120 (0.0008) +[2023-10-08 12:41:46,356][102898] Updated weights for policy 1, policy_version 23130 (0.0007) +[2023-10-08 12:41:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 47349760. Throughput: 0: 1778.0, 1: 1775.5. Samples: 11843266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 34.0) +[2023-10-08 12:41:46,876][101941] Avg episode reward: [(0, '6.280'), (1, '7.050')] +[2023-10-08 12:41:49,190][102897] Updated weights for policy 0, policy_version 23110 (0.0008) +[2023-10-08 12:41:49,573][102897] Updated weights for policy 0, policy_version 23120 (0.0009) +[2023-10-08 12:41:49,937][102897] Updated weights for policy 0, policy_version 23130 (0.0009) +[2023-10-08 12:41:50,199][102898] Updated weights for policy 1, policy_version 23140 (0.0010) +[2023-10-08 12:41:50,573][102898] Updated weights for policy 1, policy_version 23150 (0.0009) +[2023-10-08 12:41:50,930][102898] Updated weights for policy 1, policy_version 23160 (0.0010) +[2023-10-08 12:41:51,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 47415296. Throughput: 0: 1799.3, 1: 1785.4. Samples: 11855146. Policy #0 lag: (min: 31.0, avg: 31.0, max: 34.0) +[2023-10-08 12:41:51,876][101941] Avg episode reward: [(0, '6.190'), (1, '6.900')] +[2023-10-08 12:41:53,797][102897] Updated weights for policy 0, policy_version 23140 (0.0008) +[2023-10-08 12:41:54,160][102897] Updated weights for policy 0, policy_version 23150 (0.0007) +[2023-10-08 12:41:54,530][102897] Updated weights for policy 0, policy_version 23160 (0.0007) +[2023-10-08 12:41:54,570][102898] Updated weights for policy 1, policy_version 23170 (0.0008) +[2023-10-08 12:41:54,926][102898] Updated weights for policy 1, policy_version 23180 (0.0009) +[2023-10-08 12:41:55,302][102898] Updated weights for policy 1, policy_version 23190 (0.0008) +[2023-10-08 12:41:55,664][102898] Updated weights for policy 1, policy_version 23200 (0.0008) +[2023-10-08 12:41:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 47480832. Throughput: 0: 1775.7, 1: 1780.4. Samples: 11875410. Policy #0 lag: (min: 31.0, avg: 31.0, max: 34.0) +[2023-10-08 12:41:56,876][101941] Avg episode reward: [(0, '6.160'), (1, '6.420')] +[2023-10-08 12:41:58,330][102897] Updated weights for policy 0, policy_version 23170 (0.0008) +[2023-10-08 12:41:58,698][102897] Updated weights for policy 0, policy_version 23180 (0.0007) +[2023-10-08 12:41:59,069][102897] Updated weights for policy 0, policy_version 23190 (0.0008) +[2023-10-08 12:41:59,450][102897] Updated weights for policy 0, policy_version 23200 (0.0009) +[2023-10-08 12:41:59,633][102898] Updated weights for policy 1, policy_version 23210 (0.0010) +[2023-10-08 12:42:00,000][102898] Updated weights for policy 1, policy_version 23220 (0.0010) +[2023-10-08 12:42:00,362][102898] Updated weights for policy 1, policy_version 23230 (0.0011) +[2023-10-08 12:42:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 47546368. Throughput: 0: 1772.3, 1: 1766.9. Samples: 11897044. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 12:42:01,876][101941] Avg episode reward: [(0, '6.070'), (1, '6.250')] +[2023-10-08 12:42:03,295][102897] Updated weights for policy 0, policy_version 23210 (0.0007) +[2023-10-08 12:42:03,666][102897] Updated weights for policy 0, policy_version 23220 (0.0007) +[2023-10-08 12:42:04,024][102897] Updated weights for policy 0, policy_version 23230 (0.0007) +[2023-10-08 12:42:04,196][102898] Updated weights for policy 1, policy_version 23240 (0.0008) +[2023-10-08 12:42:04,555][102898] Updated weights for policy 1, policy_version 23250 (0.0007) +[2023-10-08 12:42:04,925][102898] Updated weights for policy 1, policy_version 23260 (0.0007) +[2023-10-08 12:42:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 47611904. Throughput: 0: 1770.6, 1: 1786.9. Samples: 11907446. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 12:42:06,875][101941] Avg episode reward: [(0, '6.020'), (1, '7.490')] +[2023-10-08 12:42:06,876][102760] Saving new best policy, reward=7.490! +[2023-10-08 12:42:07,820][102897] Updated weights for policy 0, policy_version 23240 (0.0009) +[2023-10-08 12:42:08,202][102897] Updated weights for policy 0, policy_version 23250 (0.0011) +[2023-10-08 12:42:08,575][102897] Updated weights for policy 0, policy_version 23260 (0.0010) +[2023-10-08 12:42:08,833][102898] Updated weights for policy 1, policy_version 23270 (0.0007) +[2023-10-08 12:42:09,195][102898] Updated weights for policy 1, policy_version 23280 (0.0009) +[2023-10-08 12:42:09,570][102898] Updated weights for policy 1, policy_version 23290 (0.0008) +[2023-10-08 12:42:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 47677440. Throughput: 0: 1770.3, 1: 1770.4. Samples: 11928642. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 12:42:11,877][101941] Avg episode reward: [(0, '6.750'), (1, '7.510')] +[2023-10-08 12:42:11,879][102760] Saving new best policy, reward=7.510! +[2023-10-08 12:42:12,252][102897] Updated weights for policy 0, policy_version 23270 (0.0008) +[2023-10-08 12:42:12,622][102897] Updated weights for policy 0, policy_version 23280 (0.0007) +[2023-10-08 12:42:12,994][102897] Updated weights for policy 0, policy_version 23290 (0.0008) +[2023-10-08 12:42:13,213][102898] Updated weights for policy 1, policy_version 23300 (0.0008) +[2023-10-08 12:42:13,574][102898] Updated weights for policy 1, policy_version 23310 (0.0008) +[2023-10-08 12:42:13,949][102898] Updated weights for policy 1, policy_version 23320 (0.0008) +[2023-10-08 12:42:16,844][102897] Updated weights for policy 0, policy_version 23300 (0.0008) +[2023-10-08 12:42:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 47742976. Throughput: 0: 1797.6, 1: 1769.9. Samples: 11951164. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 12:42:16,876][101941] Avg episode reward: [(0, '6.920'), (1, '7.410')] +[2023-10-08 12:42:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000023328_23887872.pth... +[2023-10-08 12:42:16,920][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000021664_22183936.pth +[2023-10-08 12:42:17,218][102897] Updated weights for policy 0, policy_version 23310 (0.0007) +[2023-10-08 12:42:17,585][102897] Updated weights for policy 0, policy_version 23320 (0.0007) +[2023-10-08 12:42:17,798][102898] Updated weights for policy 1, policy_version 23330 (0.0007) +[2023-10-08 12:42:17,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000023328_23887872.pth... +[2023-10-08 12:42:17,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000021632_22151168.pth +[2023-10-08 12:42:18,157][102898] Updated weights for policy 1, policy_version 23340 (0.0010) +[2023-10-08 12:42:18,519][102898] Updated weights for policy 1, policy_version 23350 (0.0007) +[2023-10-08 12:42:18,883][102898] Updated weights for policy 1, policy_version 23360 (0.0010) +[2023-10-08 12:42:21,277][102897] Updated weights for policy 0, policy_version 23330 (0.0008) +[2023-10-08 12:42:21,653][102897] Updated weights for policy 0, policy_version 23340 (0.0008) +[2023-10-08 12:42:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 47808512. Throughput: 0: 1776.5, 1: 1775.0. Samples: 11961004. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:42:21,876][101941] Avg episode reward: [(0, '5.980'), (1, '7.150')] +[2023-10-08 12:42:22,016][102897] Updated weights for policy 0, policy_version 23350 (0.0011) +[2023-10-08 12:42:22,389][102897] Updated weights for policy 0, policy_version 23360 (0.0007) +[2023-10-08 12:42:22,491][102898] Updated weights for policy 1, policy_version 23370 (0.0007) +[2023-10-08 12:42:22,857][102898] Updated weights for policy 1, policy_version 23380 (0.0010) +[2023-10-08 12:42:23,225][102898] Updated weights for policy 1, policy_version 23390 (0.0009) +[2023-10-08 12:42:26,016][102897] Updated weights for policy 0, policy_version 23370 (0.0008) +[2023-10-08 12:42:26,388][102897] Updated weights for policy 0, policy_version 23380 (0.0010) +[2023-10-08 12:42:26,772][102897] Updated weights for policy 0, policy_version 23390 (0.0008) +[2023-10-08 12:42:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 47906816. Throughput: 0: 1796.4, 1: 1773.4. Samples: 11983538. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:42:26,875][101941] Avg episode reward: [(0, '5.720'), (1, '6.350')] +[2023-10-08 12:42:26,957][102898] Updated weights for policy 1, policy_version 23400 (0.0008) +[2023-10-08 12:42:27,331][102898] Updated weights for policy 1, policy_version 23410 (0.0007) +[2023-10-08 12:42:27,691][102898] Updated weights for policy 1, policy_version 23420 (0.0009) +[2023-10-08 12:42:30,592][102897] Updated weights for policy 0, policy_version 23400 (0.0007) +[2023-10-08 12:42:30,965][102897] Updated weights for policy 0, policy_version 23410 (0.0007) +[2023-10-08 12:42:31,330][102897] Updated weights for policy 0, policy_version 23420 (0.0007) +[2023-10-08 12:42:31,650][102898] Updated weights for policy 1, policy_version 23430 (0.0007) +[2023-10-08 12:42:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 47972352. Throughput: 0: 1781.0, 1: 1801.7. Samples: 12004484. Policy #0 lag: (min: 6.0, avg: 6.0, max: 6.0) +[2023-10-08 12:42:31,876][101941] Avg episode reward: [(0, '6.500'), (1, '6.430')] +[2023-10-08 12:42:32,021][102898] Updated weights for policy 1, policy_version 23440 (0.0008) +[2023-10-08 12:42:32,394][102898] Updated weights for policy 1, policy_version 23450 (0.0007) +[2023-10-08 12:42:35,118][102897] Updated weights for policy 0, policy_version 23430 (0.0007) +[2023-10-08 12:42:35,491][102897] Updated weights for policy 0, policy_version 23440 (0.0010) +[2023-10-08 12:42:35,872][102897] Updated weights for policy 0, policy_version 23450 (0.0008) +[2023-10-08 12:42:36,128][102898] Updated weights for policy 1, policy_version 23460 (0.0008) +[2023-10-08 12:42:36,494][102898] Updated weights for policy 1, policy_version 23470 (0.0007) +[2023-10-08 12:42:36,860][102898] Updated weights for policy 1, policy_version 23480 (0.0007) +[2023-10-08 12:42:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 48037888. Throughput: 0: 1790.8, 1: 1775.5. Samples: 12015630. Policy #0 lag: (min: 20.0, avg: 27.0, max: 52.0) +[2023-10-08 12:42:36,876][101941] Avg episode reward: [(0, '6.070'), (1, '7.310')] +[2023-10-08 12:42:39,695][102897] Updated weights for policy 0, policy_version 23460 (0.0010) +[2023-10-08 12:42:40,074][102897] Updated weights for policy 0, policy_version 23470 (0.0010) +[2023-10-08 12:42:40,444][102897] Updated weights for policy 0, policy_version 23480 (0.0009) +[2023-10-08 12:42:40,534][102898] Updated weights for policy 1, policy_version 23490 (0.0007) +[2023-10-08 12:42:40,895][102898] Updated weights for policy 1, policy_version 23500 (0.0009) +[2023-10-08 12:42:41,264][102898] Updated weights for policy 1, policy_version 23510 (0.0008) +[2023-10-08 12:42:41,629][102898] Updated weights for policy 1, policy_version 23520 (0.0008) +[2023-10-08 12:42:41,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 48136192. Throughput: 0: 1784.8, 1: 1801.3. Samples: 12036782. Policy #0 lag: (min: 20.0, avg: 27.0, max: 52.0) +[2023-10-08 12:42:41,876][101941] Avg episode reward: [(0, '5.850'), (1, '6.850')] +[2023-10-08 12:42:44,024][102897] Updated weights for policy 0, policy_version 23490 (0.0008) +[2023-10-08 12:42:44,405][102897] Updated weights for policy 0, policy_version 23500 (0.0009) +[2023-10-08 12:42:44,776][102897] Updated weights for policy 0, policy_version 23510 (0.0007) +[2023-10-08 12:42:45,145][102897] Updated weights for policy 0, policy_version 23520 (0.0009) +[2023-10-08 12:42:45,408][102898] Updated weights for policy 1, policy_version 23530 (0.0011) +[2023-10-08 12:42:45,766][102898] Updated weights for policy 1, policy_version 23540 (0.0009) +[2023-10-08 12:42:46,134][102898] Updated weights for policy 1, policy_version 23550 (0.0008) +[2023-10-08 12:42:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 48201728. Throughput: 0: 1784.0, 1: 1780.5. Samples: 12057444. Policy #0 lag: (min: 20.0, avg: 27.0, max: 52.0) +[2023-10-08 12:42:46,876][101941] Avg episode reward: [(0, '6.400'), (1, '6.470')] +[2023-10-08 12:42:48,970][102897] Updated weights for policy 0, policy_version 23530 (0.0009) +[2023-10-08 12:42:49,342][102897] Updated weights for policy 0, policy_version 23540 (0.0009) +[2023-10-08 12:42:49,723][102897] Updated weights for policy 0, policy_version 23550 (0.0008) +[2023-10-08 12:42:50,172][102898] Updated weights for policy 1, policy_version 23560 (0.0007) +[2023-10-08 12:42:50,550][102898] Updated weights for policy 1, policy_version 23570 (0.0007) +[2023-10-08 12:42:50,916][102898] Updated weights for policy 1, policy_version 23580 (0.0008) +[2023-10-08 12:42:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 48267264. Throughput: 0: 1794.3, 1: 1795.6. Samples: 12068988. Policy #0 lag: (min: 20.0, avg: 27.0, max: 52.0) +[2023-10-08 12:42:51,876][101941] Avg episode reward: [(0, '6.060'), (1, '6.270')] +[2023-10-08 12:42:53,614][102897] Updated weights for policy 0, policy_version 23560 (0.0008) +[2023-10-08 12:42:53,983][102897] Updated weights for policy 0, policy_version 23570 (0.0008) +[2023-10-08 12:42:54,359][102897] Updated weights for policy 0, policy_version 23580 (0.0008) +[2023-10-08 12:42:54,589][102898] Updated weights for policy 1, policy_version 23590 (0.0009) +[2023-10-08 12:42:54,948][102898] Updated weights for policy 1, policy_version 23600 (0.0008) +[2023-10-08 12:42:55,321][102898] Updated weights for policy 1, policy_version 23610 (0.0010) +[2023-10-08 12:42:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 48332800. Throughput: 0: 1784.7, 1: 1786.3. Samples: 12089336. Policy #0 lag: (min: 26.0, avg: 26.6, max: 40.0) +[2023-10-08 12:42:56,876][101941] Avg episode reward: [(0, '5.800'), (1, '6.660')] +[2023-10-08 12:42:58,088][102897] Updated weights for policy 0, policy_version 23590 (0.0008) +[2023-10-08 12:42:58,456][102897] Updated weights for policy 0, policy_version 23600 (0.0009) +[2023-10-08 12:42:58,832][102897] Updated weights for policy 0, policy_version 23610 (0.0009) +[2023-10-08 12:42:59,084][102898] Updated weights for policy 1, policy_version 23620 (0.0009) +[2023-10-08 12:42:59,447][102898] Updated weights for policy 1, policy_version 23630 (0.0009) +[2023-10-08 12:42:59,822][102898] Updated weights for policy 1, policy_version 23640 (0.0007) +[2023-10-08 12:43:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 48398336. Throughput: 0: 1779.1, 1: 1783.8. Samples: 12111492. Policy #0 lag: (min: 26.0, avg: 26.6, max: 40.0) +[2023-10-08 12:43:01,876][101941] Avg episode reward: [(0, '5.930'), (1, '6.680')] +[2023-10-08 12:43:02,772][102897] Updated weights for policy 0, policy_version 23620 (0.0008) +[2023-10-08 12:43:03,146][102897] Updated weights for policy 0, policy_version 23630 (0.0008) +[2023-10-08 12:43:03,524][102897] Updated weights for policy 0, policy_version 23640 (0.0009) +[2023-10-08 12:43:03,640][102898] Updated weights for policy 1, policy_version 23650 (0.0007) +[2023-10-08 12:43:04,018][102898] Updated weights for policy 1, policy_version 23660 (0.0008) +[2023-10-08 12:43:04,386][102898] Updated weights for policy 1, policy_version 23670 (0.0008) +[2023-10-08 12:43:04,747][102898] Updated weights for policy 1, policy_version 23680 (0.0008) +[2023-10-08 12:43:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 48463872. Throughput: 0: 1776.7, 1: 1790.5. Samples: 12121526. Policy #0 lag: (min: 26.0, avg: 26.6, max: 40.0) +[2023-10-08 12:43:06,876][101941] Avg episode reward: [(0, '6.660'), (1, '6.350')] +[2023-10-08 12:43:07,308][102897] Updated weights for policy 0, policy_version 23650 (0.0008) +[2023-10-08 12:43:07,678][102897] Updated weights for policy 0, policy_version 23660 (0.0007) +[2023-10-08 12:43:08,058][102897] Updated weights for policy 0, policy_version 23670 (0.0008) +[2023-10-08 12:43:08,418][102897] Updated weights for policy 0, policy_version 23680 (0.0007) +[2023-10-08 12:43:08,624][102898] Updated weights for policy 1, policy_version 23690 (0.0010) +[2023-10-08 12:43:08,998][102898] Updated weights for policy 1, policy_version 23700 (0.0008) +[2023-10-08 12:43:09,366][102898] Updated weights for policy 1, policy_version 23710 (0.0007) +[2023-10-08 12:43:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 48529408. Throughput: 0: 1767.1, 1: 1780.8. Samples: 12143192. Policy #0 lag: (min: 26.0, avg: 26.6, max: 40.0) +[2023-10-08 12:43:11,876][101941] Avg episode reward: [(0, '6.330'), (1, '6.250')] +[2023-10-08 12:43:12,081][102897] Updated weights for policy 0, policy_version 23690 (0.0007) +[2023-10-08 12:43:12,469][102897] Updated weights for policy 0, policy_version 23700 (0.0008) +[2023-10-08 12:43:12,835][102897] Updated weights for policy 0, policy_version 23710 (0.0007) +[2023-10-08 12:43:13,008][102898] Updated weights for policy 1, policy_version 23720 (0.0008) +[2023-10-08 12:43:13,368][102898] Updated weights for policy 1, policy_version 23730 (0.0007) +[2023-10-08 12:43:13,742][102898] Updated weights for policy 1, policy_version 23740 (0.0008) +[2023-10-08 12:43:16,563][102897] Updated weights for policy 0, policy_version 23720 (0.0010) +[2023-10-08 12:43:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 48594944. Throughput: 0: 1796.8, 1: 1781.9. Samples: 12165528. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:43:16,876][101941] Avg episode reward: [(0, '6.410'), (1, '6.720')] +[2023-10-08 12:43:16,936][102897] Updated weights for policy 0, policy_version 23730 (0.0008) +[2023-10-08 12:43:17,318][102897] Updated weights for policy 0, policy_version 23740 (0.0010) +[2023-10-08 12:43:17,410][102898] Updated weights for policy 1, policy_version 23750 (0.0009) +[2023-10-08 12:43:17,789][102898] Updated weights for policy 1, policy_version 23760 (0.0010) +[2023-10-08 12:43:18,166][102898] Updated weights for policy 1, policy_version 23770 (0.0010) +[2023-10-08 12:43:21,164][102897] Updated weights for policy 0, policy_version 23750 (0.0009) +[2023-10-08 12:43:21,543][102897] Updated weights for policy 0, policy_version 23760 (0.0007) +[2023-10-08 12:43:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 48660480. Throughput: 0: 1768.7, 1: 1780.6. Samples: 12175350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:43:21,875][101941] Avg episode reward: [(0, '6.420'), (1, '7.210')] +[2023-10-08 12:43:21,916][102897] Updated weights for policy 0, policy_version 23770 (0.0009) +[2023-10-08 12:43:21,952][102898] Updated weights for policy 1, policy_version 23780 (0.0009) +[2023-10-08 12:43:22,323][102898] Updated weights for policy 1, policy_version 23790 (0.0008) +[2023-10-08 12:43:22,690][102898] Updated weights for policy 1, policy_version 23800 (0.0007) +[2023-10-08 12:43:25,531][102897] Updated weights for policy 0, policy_version 23780 (0.0009) +[2023-10-08 12:43:25,897][102897] Updated weights for policy 0, policy_version 23790 (0.0007) +[2023-10-08 12:43:26,271][102897] Updated weights for policy 0, policy_version 23800 (0.0008) +[2023-10-08 12:43:26,304][102898] Updated weights for policy 1, policy_version 23810 (0.0008) +[2023-10-08 12:43:26,676][102898] Updated weights for policy 1, policy_version 23820 (0.0007) +[2023-10-08 12:43:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 48758784. Throughput: 0: 1801.1, 1: 1785.7. Samples: 12198188. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:43:26,876][101941] Avg episode reward: [(0, '6.360'), (1, '7.420')] +[2023-10-08 12:43:27,036][102898] Updated weights for policy 1, policy_version 23830 (0.0008) +[2023-10-08 12:43:27,407][102898] Updated weights for policy 1, policy_version 23840 (0.0009) +[2023-10-08 12:43:30,113][102897] Updated weights for policy 0, policy_version 23810 (0.0008) +[2023-10-08 12:43:30,485][102897] Updated weights for policy 0, policy_version 23820 (0.0010) +[2023-10-08 12:43:30,860][102897] Updated weights for policy 0, policy_version 23830 (0.0007) +[2023-10-08 12:43:31,091][102898] Updated weights for policy 1, policy_version 23850 (0.0007) +[2023-10-08 12:43:31,228][102897] Updated weights for policy 0, policy_version 23840 (0.0008) +[2023-10-08 12:43:31,458][102898] Updated weights for policy 1, policy_version 23860 (0.0007) +[2023-10-08 12:43:31,830][102898] Updated weights for policy 1, policy_version 23870 (0.0007) +[2023-10-08 12:43:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 48824320. Throughput: 0: 1770.6, 1: 1800.0. Samples: 12218120. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:43:31,875][101941] Avg episode reward: [(0, '5.890'), (1, '6.870')] +[2023-10-08 12:43:34,970][102897] Updated weights for policy 0, policy_version 23850 (0.0008) +[2023-10-08 12:43:35,344][102897] Updated weights for policy 0, policy_version 23860 (0.0009) +[2023-10-08 12:43:35,646][102898] Updated weights for policy 1, policy_version 23880 (0.0008) +[2023-10-08 12:43:35,718][102897] Updated weights for policy 0, policy_version 23870 (0.0009) +[2023-10-08 12:43:36,028][102898] Updated weights for policy 1, policy_version 23890 (0.0008) +[2023-10-08 12:43:36,404][102898] Updated weights for policy 1, policy_version 23900 (0.0009) +[2023-10-08 12:43:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 48922624. Throughput: 0: 1799.0, 1: 1784.1. Samples: 12230228. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:43:36,876][101941] Avg episode reward: [(0, '5.290'), (1, '6.870')] +[2023-10-08 12:43:39,394][102897] Updated weights for policy 0, policy_version 23880 (0.0008) +[2023-10-08 12:43:39,769][102897] Updated weights for policy 0, policy_version 23890 (0.0011) +[2023-10-08 12:43:40,139][102897] Updated weights for policy 0, policy_version 23900 (0.0009) +[2023-10-08 12:43:40,160][102898] Updated weights for policy 1, policy_version 23910 (0.0008) +[2023-10-08 12:43:40,521][102898] Updated weights for policy 1, policy_version 23920 (0.0010) +[2023-10-08 12:43:40,888][102898] Updated weights for policy 1, policy_version 23930 (0.0008) +[2023-10-08 12:43:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 48988160. Throughput: 0: 1777.7, 1: 1806.0. Samples: 12250598. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:43:41,876][101941] Avg episode reward: [(0, '6.100'), (1, '6.780')] +[2023-10-08 12:43:43,836][102897] Updated weights for policy 0, policy_version 23910 (0.0009) +[2023-10-08 12:43:44,201][102897] Updated weights for policy 0, policy_version 23920 (0.0009) +[2023-10-08 12:43:44,566][102897] Updated weights for policy 0, policy_version 23930 (0.0008) +[2023-10-08 12:43:44,579][102898] Updated weights for policy 1, policy_version 23940 (0.0009) +[2023-10-08 12:43:44,941][102898] Updated weights for policy 1, policy_version 23950 (0.0008) +[2023-10-08 12:43:45,308][102898] Updated weights for policy 1, policy_version 23960 (0.0009) +[2023-10-08 12:43:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 49053696. Throughput: 0: 1784.3, 1: 1790.0. Samples: 12272340. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 12:43:46,876][101941] Avg episode reward: [(0, '6.380'), (1, '6.740')] +[2023-10-08 12:43:48,338][102897] Updated weights for policy 0, policy_version 23940 (0.0010) +[2023-10-08 12:43:48,713][102897] Updated weights for policy 0, policy_version 23950 (0.0008) +[2023-10-08 12:43:49,077][102897] Updated weights for policy 0, policy_version 23960 (0.0010) +[2023-10-08 12:43:49,086][102898] Updated weights for policy 1, policy_version 23970 (0.0009) +[2023-10-08 12:43:49,449][102898] Updated weights for policy 1, policy_version 23980 (0.0009) +[2023-10-08 12:43:49,819][102898] Updated weights for policy 1, policy_version 23990 (0.0009) +[2023-10-08 12:43:50,184][102898] Updated weights for policy 1, policy_version 24000 (0.0009) +[2023-10-08 12:43:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49119232. Throughput: 0: 1785.4, 1: 1803.0. Samples: 12283006. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 12:43:51,875][101941] Avg episode reward: [(0, '6.200'), (1, '7.030')] +[2023-10-08 12:43:52,987][102897] Updated weights for policy 0, policy_version 23970 (0.0008) +[2023-10-08 12:43:53,358][102897] Updated weights for policy 0, policy_version 23980 (0.0007) +[2023-10-08 12:43:53,734][102897] Updated weights for policy 0, policy_version 23990 (0.0008) +[2023-10-08 12:43:53,855][102898] Updated weights for policy 1, policy_version 24010 (0.0008) +[2023-10-08 12:43:54,104][102897] Updated weights for policy 0, policy_version 24000 (0.0009) +[2023-10-08 12:43:54,223][102898] Updated weights for policy 1, policy_version 24020 (0.0008) +[2023-10-08 12:43:54,590][102898] Updated weights for policy 1, policy_version 24030 (0.0009) +[2023-10-08 12:43:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49184768. Throughput: 0: 1784.3, 1: 1794.3. Samples: 12304226. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 12:43:56,876][101941] Avg episode reward: [(0, '6.870'), (1, '7.250')] +[2023-10-08 12:43:57,918][102897] Updated weights for policy 0, policy_version 24010 (0.0007) +[2023-10-08 12:43:58,284][102897] Updated weights for policy 0, policy_version 24020 (0.0009) +[2023-10-08 12:43:58,379][102898] Updated weights for policy 1, policy_version 24040 (0.0008) +[2023-10-08 12:43:58,664][102897] Updated weights for policy 0, policy_version 24030 (0.0007) +[2023-10-08 12:43:58,740][102898] Updated weights for policy 1, policy_version 24050 (0.0008) +[2023-10-08 12:43:59,107][102898] Updated weights for policy 1, policy_version 24060 (0.0009) +[2023-10-08 12:44:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49250304. Throughput: 0: 1781.1, 1: 1792.1. Samples: 12326324. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 12:44:01,876][101941] Avg episode reward: [(0, '6.500'), (1, '7.350')] +[2023-10-08 12:44:02,551][102897] Updated weights for policy 0, policy_version 24040 (0.0007) +[2023-10-08 12:44:02,916][102897] Updated weights for policy 0, policy_version 24050 (0.0007) +[2023-10-08 12:44:02,948][102898] Updated weights for policy 1, policy_version 24070 (0.0010) +[2023-10-08 12:44:03,293][102897] Updated weights for policy 0, policy_version 24060 (0.0007) +[2023-10-08 12:44:03,312][102898] Updated weights for policy 1, policy_version 24080 (0.0008) +[2023-10-08 12:44:03,680][102898] Updated weights for policy 1, policy_version 24090 (0.0009) +[2023-10-08 12:44:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 49315840. Throughput: 0: 1779.9, 1: 1790.1. Samples: 12336000. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 12:44:06,876][101941] Avg episode reward: [(0, '5.710'), (1, '7.300')] +[2023-10-08 12:44:07,065][102897] Updated weights for policy 0, policy_version 24070 (0.0008) +[2023-10-08 12:44:07,425][102898] Updated weights for policy 1, policy_version 24100 (0.0009) +[2023-10-08 12:44:07,438][102897] Updated weights for policy 0, policy_version 24080 (0.0009) +[2023-10-08 12:44:07,800][102898] Updated weights for policy 1, policy_version 24110 (0.0007) +[2023-10-08 12:44:07,809][102897] Updated weights for policy 0, policy_version 24090 (0.0008) +[2023-10-08 12:44:08,162][102898] Updated weights for policy 1, policy_version 24120 (0.0008) +[2023-10-08 12:44:11,751][102897] Updated weights for policy 0, policy_version 24100 (0.0009) +[2023-10-08 12:44:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49381376. Throughput: 0: 1770.6, 1: 1782.8. Samples: 12358088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:44:11,876][101941] Avg episode reward: [(0, '5.970'), (1, '6.510')] +[2023-10-08 12:44:12,042][102898] Updated weights for policy 1, policy_version 24130 (0.0010) +[2023-10-08 12:44:12,116][102897] Updated weights for policy 0, policy_version 24110 (0.0007) +[2023-10-08 12:44:12,412][102898] Updated weights for policy 1, policy_version 24140 (0.0009) +[2023-10-08 12:44:12,490][102897] Updated weights for policy 0, policy_version 24120 (0.0007) +[2023-10-08 12:44:12,776][102898] Updated weights for policy 1, policy_version 24150 (0.0008) +[2023-10-08 12:44:13,136][102898] Updated weights for policy 1, policy_version 24160 (0.0010) +[2023-10-08 12:44:16,332][102897] Updated weights for policy 0, policy_version 24130 (0.0008) +[2023-10-08 12:44:16,710][102897] Updated weights for policy 0, policy_version 24140 (0.0009) +[2023-10-08 12:44:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49446912. Throughput: 0: 1792.6, 1: 1800.7. Samples: 12379816. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:44:16,875][101941] Avg episode reward: [(0, '6.400'), (1, '6.760')] +[2023-10-08 12:44:16,947][102898] Updated weights for policy 1, policy_version 24170 (0.0007) +[2023-10-08 12:44:17,089][102897] Updated weights for policy 0, policy_version 24150 (0.0008) +[2023-10-08 12:44:17,310][102898] Updated weights for policy 1, policy_version 24180 (0.0007) +[2023-10-08 12:44:17,458][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000024160_24739840.pth... +[2023-10-08 12:44:17,463][102897] Updated weights for policy 0, policy_version 24160 (0.0007) +[2023-10-08 12:44:17,490][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000022464_23003136.pth +[2023-10-08 12:44:17,676][102898] Updated weights for policy 1, policy_version 24190 (0.0010) +[2023-10-08 12:44:17,748][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000024192_24772608.pth... +[2023-10-08 12:44:17,785][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000022496_23035904.pth +[2023-10-08 12:44:21,259][102897] Updated weights for policy 0, policy_version 24170 (0.0007) +[2023-10-08 12:44:21,630][102897] Updated weights for policy 0, policy_version 24180 (0.0008) +[2023-10-08 12:44:21,670][102898] Updated weights for policy 1, policy_version 24200 (0.0008) +[2023-10-08 12:44:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 49512448. Throughput: 0: 1758.9, 1: 1781.2. Samples: 12389534. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:44:21,876][101941] Avg episode reward: [(0, '6.350'), (1, '7.050')] +[2023-10-08 12:44:21,997][102897] Updated weights for policy 0, policy_version 24190 (0.0008) +[2023-10-08 12:44:22,050][102898] Updated weights for policy 1, policy_version 24210 (0.0009) +[2023-10-08 12:44:22,425][102898] Updated weights for policy 1, policy_version 24220 (0.0008) +[2023-10-08 12:44:25,822][102897] Updated weights for policy 0, policy_version 24200 (0.0008) +[2023-10-08 12:44:26,194][102897] Updated weights for policy 0, policy_version 24210 (0.0008) +[2023-10-08 12:44:26,365][102898] Updated weights for policy 1, policy_version 24230 (0.0007) +[2023-10-08 12:44:26,564][102897] Updated weights for policy 0, policy_version 24220 (0.0009) +[2023-10-08 12:44:26,733][102898] Updated weights for policy 1, policy_version 24240 (0.0007) +[2023-10-08 12:44:26,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 49610752. Throughput: 0: 1795.0, 1: 1782.2. Samples: 12411570. Policy #0 lag: (min: 0.0, avg: 27.9, max: 32.0) +[2023-10-08 12:44:26,876][101941] Avg episode reward: [(0, '6.170'), (1, '6.480')] +[2023-10-08 12:44:27,106][102898] Updated weights for policy 1, policy_version 24250 (0.0011) +[2023-10-08 12:44:30,293][102897] Updated weights for policy 0, policy_version 24230 (0.0010) +[2023-10-08 12:44:30,664][102897] Updated weights for policy 0, policy_version 24240 (0.0009) +[2023-10-08 12:44:30,921][102898] Updated weights for policy 1, policy_version 24260 (0.0010) +[2023-10-08 12:44:31,040][102897] Updated weights for policy 0, policy_version 24250 (0.0007) +[2023-10-08 12:44:31,284][102898] Updated weights for policy 1, policy_version 24270 (0.0007) +[2023-10-08 12:44:31,646][102898] Updated weights for policy 1, policy_version 24280 (0.0008) +[2023-10-08 12:44:31,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 49676288. Throughput: 0: 1756.7, 1: 1780.6. Samples: 12431518. Policy #0 lag: (min: 0.0, avg: 27.9, max: 32.0) +[2023-10-08 12:44:31,875][101941] Avg episode reward: [(0, '5.490'), (1, '6.960')] +[2023-10-08 12:44:34,784][102897] Updated weights for policy 0, policy_version 24260 (0.0007) +[2023-10-08 12:44:35,165][102897] Updated weights for policy 0, policy_version 24270 (0.0008) +[2023-10-08 12:44:35,441][102898] Updated weights for policy 1, policy_version 24290 (0.0010) +[2023-10-08 12:44:35,541][102897] Updated weights for policy 0, policy_version 24280 (0.0008) +[2023-10-08 12:44:35,803][102898] Updated weights for policy 1, policy_version 24300 (0.0009) +[2023-10-08 12:44:36,171][102898] Updated weights for policy 1, policy_version 24310 (0.0008) +[2023-10-08 12:44:36,536][102898] Updated weights for policy 1, policy_version 24320 (0.0009) +[2023-10-08 12:44:36,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 49774592. Throughput: 0: 1791.8, 1: 1773.8. Samples: 12443458. Policy #0 lag: (min: 0.0, avg: 27.9, max: 32.0) +[2023-10-08 12:44:36,875][101941] Avg episode reward: [(0, '5.320'), (1, '7.060')] +[2023-10-08 12:44:39,073][102897] Updated weights for policy 0, policy_version 24290 (0.0007) +[2023-10-08 12:44:39,447][102897] Updated weights for policy 0, policy_version 24300 (0.0008) +[2023-10-08 12:44:39,816][102897] Updated weights for policy 0, policy_version 24310 (0.0009) +[2023-10-08 12:44:40,184][102897] Updated weights for policy 0, policy_version 24320 (0.0008) +[2023-10-08 12:44:40,332][102898] Updated weights for policy 1, policy_version 24330 (0.0011) +[2023-10-08 12:44:40,693][102898] Updated weights for policy 1, policy_version 24340 (0.0011) +[2023-10-08 12:44:41,062][102898] Updated weights for policy 1, policy_version 24350 (0.0008) +[2023-10-08 12:44:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 49840128. Throughput: 0: 1768.7, 1: 1776.2. Samples: 12463746. Policy #0 lag: (min: 0.0, avg: 27.9, max: 32.0) +[2023-10-08 12:44:41,876][101941] Avg episode reward: [(0, '5.490'), (1, '6.900')] +[2023-10-08 12:44:44,010][102897] Updated weights for policy 0, policy_version 24330 (0.0009) +[2023-10-08 12:44:44,375][102897] Updated weights for policy 0, policy_version 24340 (0.0008) +[2023-10-08 12:44:44,755][102897] Updated weights for policy 0, policy_version 24350 (0.0008) +[2023-10-08 12:44:44,985][102898] Updated weights for policy 1, policy_version 24360 (0.0009) +[2023-10-08 12:44:45,354][102898] Updated weights for policy 1, policy_version 24370 (0.0008) +[2023-10-08 12:44:45,727][102898] Updated weights for policy 1, policy_version 24380 (0.0009) +[2023-10-08 12:44:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49905664. Throughput: 0: 1768.5, 1: 1754.8. Samples: 12484872. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:44:46,876][101941] Avg episode reward: [(0, '6.130'), (1, '6.610')] +[2023-10-08 12:44:48,638][102897] Updated weights for policy 0, policy_version 24360 (0.0007) +[2023-10-08 12:44:49,013][102897] Updated weights for policy 0, policy_version 24370 (0.0010) +[2023-10-08 12:44:49,373][102897] Updated weights for policy 0, policy_version 24380 (0.0009) +[2023-10-08 12:44:49,468][102898] Updated weights for policy 1, policy_version 24390 (0.0008) +[2023-10-08 12:44:49,838][102898] Updated weights for policy 1, policy_version 24400 (0.0008) +[2023-10-08 12:44:50,209][102898] Updated weights for policy 1, policy_version 24410 (0.0007) +[2023-10-08 12:44:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 49971200. Throughput: 0: 1771.5, 1: 1783.3. Samples: 12495964. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:44:51,876][101941] Avg episode reward: [(0, '6.670'), (1, '6.660')] +[2023-10-08 12:44:53,208][102897] Updated weights for policy 0, policy_version 24390 (0.0008) +[2023-10-08 12:44:53,588][102897] Updated weights for policy 0, policy_version 24400 (0.0008) +[2023-10-08 12:44:53,825][102898] Updated weights for policy 1, policy_version 24420 (0.0008) +[2023-10-08 12:44:53,949][102897] Updated weights for policy 0, policy_version 24410 (0.0008) +[2023-10-08 12:44:54,189][102898] Updated weights for policy 1, policy_version 24430 (0.0007) +[2023-10-08 12:44:54,554][102898] Updated weights for policy 1, policy_version 24440 (0.0007) +[2023-10-08 12:44:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 50036736. Throughput: 0: 1775.6, 1: 1755.2. Samples: 12516976. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:44:56,876][101941] Avg episode reward: [(0, '7.300'), (1, '7.050')] +[2023-10-08 12:44:57,673][102897] Updated weights for policy 0, policy_version 24420 (0.0008) +[2023-10-08 12:44:58,043][102897] Updated weights for policy 0, policy_version 24430 (0.0009) +[2023-10-08 12:44:58,357][102898] Updated weights for policy 1, policy_version 24450 (0.0010) +[2023-10-08 12:44:58,414][102897] Updated weights for policy 0, policy_version 24440 (0.0008) +[2023-10-08 12:44:58,722][102898] Updated weights for policy 1, policy_version 24460 (0.0009) +[2023-10-08 12:44:59,092][102898] Updated weights for policy 1, policy_version 24470 (0.0007) +[2023-10-08 12:44:59,464][102898] Updated weights for policy 1, policy_version 24480 (0.0007) +[2023-10-08 12:45:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 50102272. Throughput: 0: 1790.4, 1: 1761.8. Samples: 12539662. Policy #0 lag: (min: 31.0, avg: 31.5, max: 46.0) +[2023-10-08 12:45:01,875][101941] Avg episode reward: [(0, '7.100'), (1, '6.780')] +[2023-10-08 12:45:02,026][102897] Updated weights for policy 0, policy_version 24450 (0.0009) +[2023-10-08 12:45:02,395][102897] Updated weights for policy 0, policy_version 24460 (0.0009) +[2023-10-08 12:45:02,779][102897] Updated weights for policy 0, policy_version 24470 (0.0008) +[2023-10-08 12:45:03,155][102897] Updated weights for policy 0, policy_version 24480 (0.0009) +[2023-10-08 12:45:03,233][102898] Updated weights for policy 1, policy_version 24490 (0.0008) +[2023-10-08 12:45:03,606][102898] Updated weights for policy 1, policy_version 24500 (0.0009) +[2023-10-08 12:45:03,977][102898] Updated weights for policy 1, policy_version 24510 (0.0009) +[2023-10-08 12:45:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 50167808. Throughput: 0: 1785.2, 1: 1764.0. Samples: 12549246. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 12:45:06,875][101941] Avg episode reward: [(0, '6.990'), (1, '6.770')] +[2023-10-08 12:45:07,132][102897] Updated weights for policy 0, policy_version 24490 (0.0007) +[2023-10-08 12:45:07,497][102897] Updated weights for policy 0, policy_version 24500 (0.0008) +[2023-10-08 12:45:07,841][102898] Updated weights for policy 1, policy_version 24520 (0.0009) +[2023-10-08 12:45:07,863][102897] Updated weights for policy 0, policy_version 24510 (0.0008) +[2023-10-08 12:45:08,213][102898] Updated weights for policy 1, policy_version 24530 (0.0009) +[2023-10-08 12:45:08,582][102898] Updated weights for policy 1, policy_version 24540 (0.0010) +[2023-10-08 12:45:11,673][102897] Updated weights for policy 0, policy_version 24520 (0.0011) +[2023-10-08 12:45:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 50233344. Throughput: 0: 1778.9, 1: 1770.8. Samples: 12571306. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 12:45:11,876][101941] Avg episode reward: [(0, '6.770'), (1, '6.610')] +[2023-10-08 12:45:12,042][102897] Updated weights for policy 0, policy_version 24530 (0.0010) +[2023-10-08 12:45:12,264][102898] Updated weights for policy 1, policy_version 24550 (0.0008) +[2023-10-08 12:45:12,410][102897] Updated weights for policy 0, policy_version 24540 (0.0008) +[2023-10-08 12:45:12,624][102898] Updated weights for policy 1, policy_version 24560 (0.0010) +[2023-10-08 12:45:12,991][102898] Updated weights for policy 1, policy_version 24570 (0.0009) +[2023-10-08 12:45:16,058][102897] Updated weights for policy 0, policy_version 24550 (0.0008) +[2023-10-08 12:45:16,438][102897] Updated weights for policy 0, policy_version 24560 (0.0008) +[2023-10-08 12:45:16,808][102897] Updated weights for policy 0, policy_version 24570 (0.0007) +[2023-10-08 12:45:16,822][102898] Updated weights for policy 1, policy_version 24580 (0.0008) +[2023-10-08 12:45:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 50298880. Throughput: 0: 1798.6, 1: 1787.6. Samples: 12592896. Policy #0 lag: (min: 31.0, avg: 31.1, max: 38.0) +[2023-10-08 12:45:16,876][101941] Avg episode reward: [(0, '6.050'), (1, '7.080')] +[2023-10-08 12:45:17,176][102898] Updated weights for policy 1, policy_version 24590 (0.0010) +[2023-10-08 12:45:17,552][102898] Updated weights for policy 1, policy_version 24600 (0.0009) +[2023-10-08 12:45:20,626][102897] Updated weights for policy 0, policy_version 24580 (0.0007) +[2023-10-08 12:45:20,989][102897] Updated weights for policy 0, policy_version 24590 (0.0010) +[2023-10-08 12:45:21,363][102897] Updated weights for policy 0, policy_version 24600 (0.0008) +[2023-10-08 12:45:21,601][102898] Updated weights for policy 1, policy_version 24610 (0.0009) +[2023-10-08 12:45:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 50397184. Throughput: 0: 1779.2, 1: 1772.6. Samples: 12603288. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 12:45:21,876][101941] Avg episode reward: [(0, '5.840'), (1, '7.460')] +[2023-10-08 12:45:21,969][102898] Updated weights for policy 1, policy_version 24620 (0.0010) +[2023-10-08 12:45:22,331][102898] Updated weights for policy 1, policy_version 24630 (0.0007) +[2023-10-08 12:45:22,698][102898] Updated weights for policy 1, policy_version 24640 (0.0009) +[2023-10-08 12:45:25,042][102897] Updated weights for policy 0, policy_version 24610 (0.0007) +[2023-10-08 12:45:25,410][102897] Updated weights for policy 0, policy_version 24620 (0.0007) +[2023-10-08 12:45:25,784][102897] Updated weights for policy 0, policy_version 24630 (0.0007) +[2023-10-08 12:45:26,146][102897] Updated weights for policy 0, policy_version 24640 (0.0009) +[2023-10-08 12:45:26,528][102898] Updated weights for policy 1, policy_version 24650 (0.0008) +[2023-10-08 12:45:26,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 50462720. Throughput: 0: 1800.4, 1: 1784.6. Samples: 12625070. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 12:45:26,876][101941] Avg episode reward: [(0, '6.510'), (1, '7.190')] +[2023-10-08 12:45:26,901][102898] Updated weights for policy 1, policy_version 24660 (0.0008) +[2023-10-08 12:45:27,278][102898] Updated weights for policy 1, policy_version 24670 (0.0008) +[2023-10-08 12:45:29,929][102897] Updated weights for policy 0, policy_version 24650 (0.0007) +[2023-10-08 12:45:30,306][102897] Updated weights for policy 0, policy_version 24660 (0.0010) +[2023-10-08 12:45:30,688][102897] Updated weights for policy 0, policy_version 24670 (0.0008) +[2023-10-08 12:45:31,009][102898] Updated weights for policy 1, policy_version 24680 (0.0010) +[2023-10-08 12:45:31,389][102898] Updated weights for policy 1, policy_version 24690 (0.0010) +[2023-10-08 12:45:31,750][102898] Updated weights for policy 1, policy_version 24700 (0.0008) +[2023-10-08 12:45:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 50528256. Throughput: 0: 1786.6, 1: 1782.9. Samples: 12645498. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 12:45:31,875][101941] Avg episode reward: [(0, '7.010'), (1, '6.660')] +[2023-10-08 12:45:34,316][102897] Updated weights for policy 0, policy_version 24680 (0.0009) +[2023-10-08 12:45:34,680][102897] Updated weights for policy 0, policy_version 24690 (0.0009) +[2023-10-08 12:45:35,049][102897] Updated weights for policy 0, policy_version 24700 (0.0008) +[2023-10-08 12:45:35,402][102898] Updated weights for policy 1, policy_version 24710 (0.0009) +[2023-10-08 12:45:35,779][102898] Updated weights for policy 1, policy_version 24720 (0.0011) +[2023-10-08 12:45:36,146][102898] Updated weights for policy 1, policy_version 24730 (0.0010) +[2023-10-08 12:45:36,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 50626560. Throughput: 0: 1806.3, 1: 1778.7. Samples: 12657290. Policy #0 lag: (min: 19.0, avg: 21.9, max: 51.0) +[2023-10-08 12:45:36,875][101941] Avg episode reward: [(0, '7.360'), (1, '6.750')] +[2023-10-08 12:45:38,814][102897] Updated weights for policy 0, policy_version 24710 (0.0009) +[2023-10-08 12:45:39,174][102897] Updated weights for policy 0, policy_version 24720 (0.0008) +[2023-10-08 12:45:39,541][102897] Updated weights for policy 0, policy_version 24730 (0.0009) +[2023-10-08 12:45:39,795][102898] Updated weights for policy 1, policy_version 24740 (0.0009) +[2023-10-08 12:45:40,165][102898] Updated weights for policy 1, policy_version 24750 (0.0011) +[2023-10-08 12:45:40,531][102898] Updated weights for policy 1, policy_version 24760 (0.0011) +[2023-10-08 12:45:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 50692096. Throughput: 0: 1787.6, 1: 1789.9. Samples: 12677962. Policy #0 lag: (min: 3.0, avg: 3.4, max: 18.0) +[2023-10-08 12:45:41,876][101941] Avg episode reward: [(0, '7.230'), (1, '6.770')] +[2023-10-08 12:45:43,254][102897] Updated weights for policy 0, policy_version 24740 (0.0008) +[2023-10-08 12:45:43,619][102897] Updated weights for policy 0, policy_version 24750 (0.0007) +[2023-10-08 12:45:43,999][102897] Updated weights for policy 0, policy_version 24760 (0.0010) +[2023-10-08 12:45:44,465][102898] Updated weights for policy 1, policy_version 24770 (0.0011) +[2023-10-08 12:45:44,833][102898] Updated weights for policy 1, policy_version 24780 (0.0009) +[2023-10-08 12:45:45,192][102898] Updated weights for policy 1, policy_version 24790 (0.0009) +[2023-10-08 12:45:45,555][102898] Updated weights for policy 1, policy_version 24800 (0.0008) +[2023-10-08 12:45:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 50757632. Throughput: 0: 1788.3, 1: 1767.4. Samples: 12699668. Policy #0 lag: (min: 3.0, avg: 3.4, max: 18.0) +[2023-10-08 12:45:46,876][101941] Avg episode reward: [(0, '6.710'), (1, '7.260')] +[2023-10-08 12:45:47,728][102897] Updated weights for policy 0, policy_version 24770 (0.0008) +[2023-10-08 12:45:48,096][102897] Updated weights for policy 0, policy_version 24780 (0.0008) +[2023-10-08 12:45:48,465][102897] Updated weights for policy 0, policy_version 24790 (0.0010) +[2023-10-08 12:45:48,833][102897] Updated weights for policy 0, policy_version 24800 (0.0007) +[2023-10-08 12:45:49,370][102898] Updated weights for policy 1, policy_version 24810 (0.0008) +[2023-10-08 12:45:49,726][102898] Updated weights for policy 1, policy_version 24820 (0.0009) +[2023-10-08 12:45:50,098][102898] Updated weights for policy 1, policy_version 24830 (0.0008) +[2023-10-08 12:45:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 50823168. Throughput: 0: 1788.3, 1: 1791.5. Samples: 12710342. Policy #0 lag: (min: 3.0, avg: 3.4, max: 18.0) +[2023-10-08 12:45:51,876][101941] Avg episode reward: [(0, '6.310'), (1, '7.590')] +[2023-10-08 12:45:51,878][102760] Saving new best policy, reward=7.590! +[2023-10-08 12:45:52,521][102897] Updated weights for policy 0, policy_version 24810 (0.0010) +[2023-10-08 12:45:52,885][102897] Updated weights for policy 0, policy_version 24820 (0.0010) +[2023-10-08 12:45:53,263][102897] Updated weights for policy 0, policy_version 24830 (0.0010) +[2023-10-08 12:45:53,865][102898] Updated weights for policy 1, policy_version 24840 (0.0009) +[2023-10-08 12:45:54,231][102898] Updated weights for policy 1, policy_version 24850 (0.0008) +[2023-10-08 12:45:54,595][102898] Updated weights for policy 1, policy_version 24860 (0.0007) +[2023-10-08 12:45:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 50888704. Throughput: 0: 1795.0, 1: 1774.9. Samples: 12731954. Policy #0 lag: (min: 3.0, avg: 3.4, max: 18.0) +[2023-10-08 12:45:56,876][101941] Avg episode reward: [(0, '6.350'), (1, '7.250')] +[2023-10-08 12:45:57,080][102897] Updated weights for policy 0, policy_version 24840 (0.0008) +[2023-10-08 12:45:57,447][102897] Updated weights for policy 0, policy_version 24850 (0.0009) +[2023-10-08 12:45:57,825][102897] Updated weights for policy 0, policy_version 24860 (0.0009) +[2023-10-08 12:45:58,501][102898] Updated weights for policy 1, policy_version 24870 (0.0008) +[2023-10-08 12:45:58,885][102898] Updated weights for policy 1, policy_version 24880 (0.0007) +[2023-10-08 12:45:59,255][102898] Updated weights for policy 1, policy_version 24890 (0.0008) +[2023-10-08 12:46:01,683][102897] Updated weights for policy 0, policy_version 24870 (0.0010) +[2023-10-08 12:46:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 50954240. Throughput: 0: 1807.9, 1: 1768.1. Samples: 12753816. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:46:01,876][101941] Avg episode reward: [(0, '6.970'), (1, '6.930')] +[2023-10-08 12:46:02,068][102897] Updated weights for policy 0, policy_version 24880 (0.0009) +[2023-10-08 12:46:02,448][102897] Updated weights for policy 0, policy_version 24890 (0.0007) +[2023-10-08 12:46:02,983][102898] Updated weights for policy 1, policy_version 24900 (0.0008) +[2023-10-08 12:46:03,354][102898] Updated weights for policy 1, policy_version 24910 (0.0007) +[2023-10-08 12:46:03,718][102898] Updated weights for policy 1, policy_version 24920 (0.0008) +[2023-10-08 12:46:06,097][102897] Updated weights for policy 0, policy_version 24900 (0.0008) +[2023-10-08 12:46:06,470][102897] Updated weights for policy 0, policy_version 24910 (0.0007) +[2023-10-08 12:46:06,840][102897] Updated weights for policy 0, policy_version 24920 (0.0007) +[2023-10-08 12:46:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 51019776. Throughput: 0: 1791.5, 1: 1769.9. Samples: 12763550. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:46:06,876][101941] Avg episode reward: [(0, '6.530'), (1, '6.560')] +[2023-10-08 12:46:07,468][102898] Updated weights for policy 1, policy_version 24930 (0.0008) +[2023-10-08 12:46:07,840][102898] Updated weights for policy 1, policy_version 24940 (0.0009) +[2023-10-08 12:46:08,202][102898] Updated weights for policy 1, policy_version 24950 (0.0010) +[2023-10-08 12:46:08,577][102898] Updated weights for policy 1, policy_version 24960 (0.0009) +[2023-10-08 12:46:10,709][102897] Updated weights for policy 0, policy_version 24930 (0.0007) +[2023-10-08 12:46:11,085][102897] Updated weights for policy 0, policy_version 24940 (0.0009) +[2023-10-08 12:46:11,465][102897] Updated weights for policy 0, policy_version 24950 (0.0010) +[2023-10-08 12:46:11,832][102897] Updated weights for policy 0, policy_version 24960 (0.0007) +[2023-10-08 12:46:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 51118080. Throughput: 0: 1797.7, 1: 1778.5. Samples: 12786002. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:46:11,876][101941] Avg episode reward: [(0, '6.040'), (1, '6.290')] +[2023-10-08 12:46:12,454][102898] Updated weights for policy 1, policy_version 24970 (0.0007) +[2023-10-08 12:46:12,819][102898] Updated weights for policy 1, policy_version 24980 (0.0008) +[2023-10-08 12:46:13,189][102898] Updated weights for policy 1, policy_version 24990 (0.0009) +[2023-10-08 12:46:15,661][102897] Updated weights for policy 0, policy_version 24970 (0.0008) +[2023-10-08 12:46:16,036][102897] Updated weights for policy 0, policy_version 24980 (0.0009) +[2023-10-08 12:46:16,409][102897] Updated weights for policy 0, policy_version 24990 (0.0008) +[2023-10-08 12:46:16,851][102898] Updated weights for policy 1, policy_version 25000 (0.0009) +[2023-10-08 12:46:16,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 51183616. Throughput: 0: 1791.3, 1: 1803.8. Samples: 12807278. Policy #0 lag: (min: 14.0, avg: 20.9, max: 46.0) +[2023-10-08 12:46:16,875][101941] Avg episode reward: [(0, '6.130'), (1, '7.090')] +[2023-10-08 12:46:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000024992_25591808.pth... +[2023-10-08 12:46:16,926][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000023328_23887872.pth +[2023-10-08 12:46:16,931][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000024992_25591808.pth +[2023-10-08 12:46:17,216][102898] Updated weights for policy 1, policy_version 25010 (0.0010) +[2023-10-08 12:46:17,584][102898] Updated weights for policy 1, policy_version 25020 (0.0010) +[2023-10-08 12:46:17,731][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000025024_25624576.pth... +[2023-10-08 12:46:17,768][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000023328_23887872.pth +[2023-10-08 12:46:17,773][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000025024_25624576.pth +[2023-10-08 12:46:19,975][102897] Updated weights for policy 0, policy_version 25000 (0.0007) +[2023-10-08 12:46:20,341][102897] Updated weights for policy 0, policy_version 25010 (0.0008) +[2023-10-08 12:46:20,713][102897] Updated weights for policy 0, policy_version 25020 (0.0011) +[2023-10-08 12:46:21,329][102898] Updated weights for policy 1, policy_version 25030 (0.0008) +[2023-10-08 12:46:21,697][102898] Updated weights for policy 1, policy_version 25040 (0.0010) +[2023-10-08 12:46:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 51249152. Throughput: 0: 1799.2, 1: 1780.6. Samples: 12818380. Policy #0 lag: (min: 14.0, avg: 20.9, max: 46.0) +[2023-10-08 12:46:21,876][101941] Avg episode reward: [(0, '6.400'), (1, '7.250')] +[2023-10-08 12:46:22,071][102898] Updated weights for policy 1, policy_version 25050 (0.0009) +[2023-10-08 12:46:24,532][102897] Updated weights for policy 0, policy_version 25030 (0.0009) +[2023-10-08 12:46:24,893][102897] Updated weights for policy 0, policy_version 25040 (0.0008) +[2023-10-08 12:46:25,266][102897] Updated weights for policy 0, policy_version 25050 (0.0008) +[2023-10-08 12:46:25,783][102898] Updated weights for policy 1, policy_version 25060 (0.0007) +[2023-10-08 12:46:26,162][102898] Updated weights for policy 1, policy_version 25070 (0.0009) +[2023-10-08 12:46:26,538][102898] Updated weights for policy 1, policy_version 25080 (0.0009) +[2023-10-08 12:46:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 51347456. Throughput: 0: 1786.3, 1: 1801.9. Samples: 12839428. Policy #0 lag: (min: 14.0, avg: 20.9, max: 46.0) +[2023-10-08 12:46:26,875][101941] Avg episode reward: [(0, '7.110'), (1, '7.130')] +[2023-10-08 12:46:29,174][102897] Updated weights for policy 0, policy_version 25060 (0.0008) +[2023-10-08 12:46:29,549][102897] Updated weights for policy 0, policy_version 25070 (0.0007) +[2023-10-08 12:46:29,920][102897] Updated weights for policy 0, policy_version 25080 (0.0007) +[2023-10-08 12:46:30,348][102898] Updated weights for policy 1, policy_version 25090 (0.0007) +[2023-10-08 12:46:30,713][102898] Updated weights for policy 1, policy_version 25100 (0.0008) +[2023-10-08 12:46:31,078][102898] Updated weights for policy 1, policy_version 25110 (0.0010) +[2023-10-08 12:46:31,440][102898] Updated weights for policy 1, policy_version 25120 (0.0008) +[2023-10-08 12:46:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 51412992. Throughput: 0: 1778.0, 1: 1791.0. Samples: 12860272. Policy #0 lag: (min: 14.0, avg: 20.9, max: 46.0) +[2023-10-08 12:46:31,876][101941] Avg episode reward: [(0, '6.910'), (1, '6.900')] +[2023-10-08 12:46:33,797][102897] Updated weights for policy 0, policy_version 25090 (0.0008) +[2023-10-08 12:46:34,167][102897] Updated weights for policy 0, policy_version 25100 (0.0009) +[2023-10-08 12:46:34,546][102897] Updated weights for policy 0, policy_version 25110 (0.0008) +[2023-10-08 12:46:34,916][102897] Updated weights for policy 0, policy_version 25120 (0.0009) +[2023-10-08 12:46:35,166][102898] Updated weights for policy 1, policy_version 25130 (0.0007) +[2023-10-08 12:46:35,528][102898] Updated weights for policy 1, policy_version 25140 (0.0008) +[2023-10-08 12:46:35,897][102898] Updated weights for policy 1, policy_version 25150 (0.0008) +[2023-10-08 12:46:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 51478528. Throughput: 0: 1793.7, 1: 1803.2. Samples: 12872200. Policy #0 lag: (min: 10.0, avg: 10.3, max: 21.0) +[2023-10-08 12:46:36,876][101941] Avg episode reward: [(0, '6.530'), (1, '6.620')] +[2023-10-08 12:46:38,817][102897] Updated weights for policy 0, policy_version 25130 (0.0008) +[2023-10-08 12:46:39,189][102897] Updated weights for policy 0, policy_version 25140 (0.0008) +[2023-10-08 12:46:39,561][102897] Updated weights for policy 0, policy_version 25150 (0.0009) +[2023-10-08 12:46:39,564][102898] Updated weights for policy 1, policy_version 25160 (0.0008) +[2023-10-08 12:46:39,933][102898] Updated weights for policy 1, policy_version 25170 (0.0007) +[2023-10-08 12:46:40,305][102898] Updated weights for policy 1, policy_version 25180 (0.0011) +[2023-10-08 12:46:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 51544064. Throughput: 0: 1774.4, 1: 1793.2. Samples: 12892492. Policy #0 lag: (min: 10.0, avg: 10.3, max: 21.0) +[2023-10-08 12:46:41,876][101941] Avg episode reward: [(0, '6.620'), (1, '6.970')] +[2023-10-08 12:46:43,266][102897] Updated weights for policy 0, policy_version 25160 (0.0007) +[2023-10-08 12:46:43,639][102897] Updated weights for policy 0, policy_version 25170 (0.0008) +[2023-10-08 12:46:43,997][102897] Updated weights for policy 0, policy_version 25180 (0.0008) +[2023-10-08 12:46:44,088][102898] Updated weights for policy 1, policy_version 25190 (0.0008) +[2023-10-08 12:46:44,458][102898] Updated weights for policy 1, policy_version 25200 (0.0008) +[2023-10-08 12:46:44,821][102898] Updated weights for policy 1, policy_version 25210 (0.0008) +[2023-10-08 12:46:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 51609600. Throughput: 0: 1778.6, 1: 1803.7. Samples: 12915020. Policy #0 lag: (min: 10.0, avg: 10.3, max: 21.0) +[2023-10-08 12:46:46,876][101941] Avg episode reward: [(0, '6.570'), (1, '6.980')] +[2023-10-08 12:46:47,746][102897] Updated weights for policy 0, policy_version 25190 (0.0010) +[2023-10-08 12:46:48,114][102897] Updated weights for policy 0, policy_version 25200 (0.0009) +[2023-10-08 12:46:48,495][102897] Updated weights for policy 0, policy_version 25210 (0.0008) +[2023-10-08 12:46:48,639][102898] Updated weights for policy 1, policy_version 25220 (0.0009) +[2023-10-08 12:46:49,007][102898] Updated weights for policy 1, policy_version 25230 (0.0008) +[2023-10-08 12:46:49,370][102898] Updated weights for policy 1, policy_version 25240 (0.0008) +[2023-10-08 12:46:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 51675136. Throughput: 0: 1780.5, 1: 1807.7. Samples: 12925018. Policy #0 lag: (min: 10.0, avg: 10.3, max: 21.0) +[2023-10-08 12:46:51,875][101941] Avg episode reward: [(0, '6.630'), (1, '6.390')] +[2023-10-08 12:46:52,177][102897] Updated weights for policy 0, policy_version 25220 (0.0009) +[2023-10-08 12:46:52,547][102897] Updated weights for policy 0, policy_version 25230 (0.0008) +[2023-10-08 12:46:52,914][102897] Updated weights for policy 0, policy_version 25240 (0.0009) +[2023-10-08 12:46:53,072][102898] Updated weights for policy 1, policy_version 25250 (0.0007) +[2023-10-08 12:46:53,441][102898] Updated weights for policy 1, policy_version 25260 (0.0008) +[2023-10-08 12:46:53,811][102898] Updated weights for policy 1, policy_version 25270 (0.0007) +[2023-10-08 12:46:54,175][102898] Updated weights for policy 1, policy_version 25280 (0.0008) +[2023-10-08 12:46:56,723][102897] Updated weights for policy 0, policy_version 25250 (0.0008) +[2023-10-08 12:46:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 51740672. Throughput: 0: 1781.7, 1: 1801.4. Samples: 12947240. Policy #0 lag: (min: 25.0, avg: 43.0, max: 57.0) +[2023-10-08 12:46:56,875][101941] Avg episode reward: [(0, '6.320'), (1, '6.690')] +[2023-10-08 12:46:57,097][102897] Updated weights for policy 0, policy_version 25260 (0.0010) +[2023-10-08 12:46:57,464][102897] Updated weights for policy 0, policy_version 25270 (0.0009) +[2023-10-08 12:46:57,758][102898] Updated weights for policy 1, policy_version 25290 (0.0007) +[2023-10-08 12:46:57,838][102897] Updated weights for policy 0, policy_version 25280 (0.0008) +[2023-10-08 12:46:58,134][102898] Updated weights for policy 1, policy_version 25300 (0.0008) +[2023-10-08 12:46:58,507][102898] Updated weights for policy 1, policy_version 25310 (0.0009) +[2023-10-08 12:47:01,638][102897] Updated weights for policy 0, policy_version 25290 (0.0007) +[2023-10-08 12:47:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 51806208. Throughput: 0: 1801.4, 1: 1800.0. Samples: 12969344. Policy #0 lag: (min: 25.0, avg: 43.0, max: 57.0) +[2023-10-08 12:47:01,875][101941] Avg episode reward: [(0, '5.950'), (1, '6.710')] +[2023-10-08 12:47:02,013][102897] Updated weights for policy 0, policy_version 25300 (0.0008) +[2023-10-08 12:47:02,302][102898] Updated weights for policy 1, policy_version 25320 (0.0009) +[2023-10-08 12:47:02,391][102897] Updated weights for policy 0, policy_version 25310 (0.0009) +[2023-10-08 12:47:02,674][102898] Updated weights for policy 1, policy_version 25330 (0.0009) +[2023-10-08 12:47:03,032][102898] Updated weights for policy 1, policy_version 25340 (0.0010) +[2023-10-08 12:47:06,053][102897] Updated weights for policy 0, policy_version 25320 (0.0008) +[2023-10-08 12:47:06,443][102897] Updated weights for policy 0, policy_version 25330 (0.0008) +[2023-10-08 12:47:06,753][102898] Updated weights for policy 1, policy_version 25350 (0.0010) +[2023-10-08 12:47:06,814][102897] Updated weights for policy 0, policy_version 25340 (0.0008) +[2023-10-08 12:47:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 51871744. Throughput: 0: 1775.3, 1: 1799.9. Samples: 12979264. Policy #0 lag: (min: 25.0, avg: 43.0, max: 57.0) +[2023-10-08 12:47:06,876][101941] Avg episode reward: [(0, '6.130'), (1, '7.120')] +[2023-10-08 12:47:07,120][102898] Updated weights for policy 1, policy_version 25360 (0.0007) +[2023-10-08 12:47:07,489][102898] Updated weights for policy 1, policy_version 25370 (0.0008) +[2023-10-08 12:47:10,541][102897] Updated weights for policy 0, policy_version 25350 (0.0010) +[2023-10-08 12:47:10,925][102897] Updated weights for policy 0, policy_version 25360 (0.0010) +[2023-10-08 12:47:11,290][102897] Updated weights for policy 0, policy_version 25370 (0.0008) +[2023-10-08 12:47:11,402][102898] Updated weights for policy 1, policy_version 25380 (0.0007) +[2023-10-08 12:47:11,768][102898] Updated weights for policy 1, policy_version 25390 (0.0007) +[2023-10-08 12:47:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 51970048. Throughput: 0: 1800.8, 1: 1799.1. Samples: 13001420. Policy #0 lag: (min: 18.0, avg: 20.2, max: 47.0) +[2023-10-08 12:47:11,876][101941] Avg episode reward: [(0, '6.290'), (1, '7.490')] +[2023-10-08 12:47:12,142][102898] Updated weights for policy 1, policy_version 25400 (0.0008) +[2023-10-08 12:47:15,093][102897] Updated weights for policy 0, policy_version 25380 (0.0009) +[2023-10-08 12:47:15,460][102897] Updated weights for policy 0, policy_version 25390 (0.0011) +[2023-10-08 12:47:15,831][102897] Updated weights for policy 0, policy_version 25400 (0.0010) +[2023-10-08 12:47:15,914][102898] Updated weights for policy 1, policy_version 25410 (0.0009) +[2023-10-08 12:47:16,275][102898] Updated weights for policy 1, policy_version 25420 (0.0007) +[2023-10-08 12:47:16,648][102898] Updated weights for policy 1, policy_version 25430 (0.0007) +[2023-10-08 12:47:16,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 52035584. Throughput: 0: 1773.1, 1: 1814.8. Samples: 13021728. Policy #0 lag: (min: 18.0, avg: 20.2, max: 47.0) +[2023-10-08 12:47:16,875][101941] Avg episode reward: [(0, '6.120'), (1, '7.410')] +[2023-10-08 12:47:17,017][102898] Updated weights for policy 1, policy_version 25440 (0.0010) +[2023-10-08 12:47:19,570][102897] Updated weights for policy 0, policy_version 25410 (0.0008) +[2023-10-08 12:47:19,949][102897] Updated weights for policy 0, policy_version 25420 (0.0008) +[2023-10-08 12:47:20,317][102897] Updated weights for policy 0, policy_version 25430 (0.0008) +[2023-10-08 12:47:20,535][102898] Updated weights for policy 1, policy_version 25450 (0.0008) +[2023-10-08 12:47:20,686][102897] Updated weights for policy 0, policy_version 25440 (0.0007) +[2023-10-08 12:47:20,912][102898] Updated weights for policy 1, policy_version 25460 (0.0007) +[2023-10-08 12:47:21,267][102898] Updated weights for policy 1, policy_version 25470 (0.0007) +[2023-10-08 12:47:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 52133888. Throughput: 0: 1794.1, 1: 1796.3. Samples: 13033768. Policy #0 lag: (min: 18.0, avg: 20.2, max: 47.0) +[2023-10-08 12:47:21,876][101941] Avg episode reward: [(0, '6.390'), (1, '7.440')] +[2023-10-08 12:47:24,515][102897] Updated weights for policy 0, policy_version 25450 (0.0007) +[2023-10-08 12:47:24,880][102897] Updated weights for policy 0, policy_version 25460 (0.0009) +[2023-10-08 12:47:25,065][102898] Updated weights for policy 1, policy_version 25480 (0.0007) +[2023-10-08 12:47:25,261][102897] Updated weights for policy 0, policy_version 25470 (0.0008) +[2023-10-08 12:47:25,430][102898] Updated weights for policy 1, policy_version 25490 (0.0007) +[2023-10-08 12:47:25,806][102898] Updated weights for policy 1, policy_version 25500 (0.0008) +[2023-10-08 12:47:26,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 52199424. Throughput: 0: 1778.3, 1: 1806.2. Samples: 13053796. Policy #0 lag: (min: 18.0, avg: 20.2, max: 47.0) +[2023-10-08 12:47:26,876][101941] Avg episode reward: [(0, '6.210'), (1, '7.970')] +[2023-10-08 12:47:26,878][102760] Saving new best policy, reward=7.970! +[2023-10-08 12:47:29,153][102897] Updated weights for policy 0, policy_version 25480 (0.0007) +[2023-10-08 12:47:29,524][102897] Updated weights for policy 0, policy_version 25490 (0.0007) +[2023-10-08 12:47:29,601][102898] Updated weights for policy 1, policy_version 25510 (0.0008) +[2023-10-08 12:47:29,903][102897] Updated weights for policy 0, policy_version 25500 (0.0007) +[2023-10-08 12:47:29,982][102898] Updated weights for policy 1, policy_version 25520 (0.0007) +[2023-10-08 12:47:30,344][102898] Updated weights for policy 1, policy_version 25530 (0.0007) +[2023-10-08 12:47:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 52264960. Throughput: 0: 1771.0, 1: 1783.6. Samples: 13074976. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:47:31,875][101941] Avg episode reward: [(0, '6.380'), (1, '7.570')] +[2023-10-08 12:47:33,614][102897] Updated weights for policy 0, policy_version 25510 (0.0010) +[2023-10-08 12:47:33,988][102897] Updated weights for policy 0, policy_version 25520 (0.0009) +[2023-10-08 12:47:34,048][102898] Updated weights for policy 1, policy_version 25540 (0.0007) +[2023-10-08 12:47:34,367][102897] Updated weights for policy 0, policy_version 25530 (0.0007) +[2023-10-08 12:47:34,413][102898] Updated weights for policy 1, policy_version 25550 (0.0007) +[2023-10-08 12:47:34,785][102898] Updated weights for policy 1, policy_version 25560 (0.0007) +[2023-10-08 12:47:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 52330496. Throughput: 0: 1774.1, 1: 1799.1. Samples: 13085814. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:47:36,876][101941] Avg episode reward: [(0, '6.820'), (1, '7.200')] +[2023-10-08 12:47:38,143][102897] Updated weights for policy 0, policy_version 25540 (0.0008) +[2023-10-08 12:47:38,518][102897] Updated weights for policy 0, policy_version 25550 (0.0007) +[2023-10-08 12:47:38,553][102898] Updated weights for policy 1, policy_version 25570 (0.0007) +[2023-10-08 12:47:38,894][102897] Updated weights for policy 0, policy_version 25560 (0.0007) +[2023-10-08 12:47:38,917][102898] Updated weights for policy 1, policy_version 25580 (0.0008) +[2023-10-08 12:47:39,286][102898] Updated weights for policy 1, policy_version 25590 (0.0008) +[2023-10-08 12:47:39,659][102898] Updated weights for policy 1, policy_version 25600 (0.0007) +[2023-10-08 12:47:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 52396032. Throughput: 0: 1771.1, 1: 1781.9. Samples: 13107128. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:47:41,876][101941] Avg episode reward: [(0, '6.930'), (1, '7.690')] +[2023-10-08 12:47:42,639][102897] Updated weights for policy 0, policy_version 25570 (0.0007) +[2023-10-08 12:47:43,012][102897] Updated weights for policy 0, policy_version 25580 (0.0007) +[2023-10-08 12:47:43,385][102897] Updated weights for policy 0, policy_version 25590 (0.0008) +[2023-10-08 12:47:43,738][102898] Updated weights for policy 1, policy_version 25610 (0.0009) +[2023-10-08 12:47:43,747][102897] Updated weights for policy 0, policy_version 25600 (0.0009) +[2023-10-08 12:47:44,097][102898] Updated weights for policy 1, policy_version 25620 (0.0007) +[2023-10-08 12:47:44,465][102898] Updated weights for policy 1, policy_version 25630 (0.0010) +[2023-10-08 12:47:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 52461568. Throughput: 0: 1778.4, 1: 1781.1. Samples: 13129522. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 12:47:46,876][101941] Avg episode reward: [(0, '6.260'), (1, '7.870')] +[2023-10-08 12:47:47,555][102897] Updated weights for policy 0, policy_version 25610 (0.0010) +[2023-10-08 12:47:47,934][102897] Updated weights for policy 0, policy_version 25620 (0.0007) +[2023-10-08 12:47:48,259][102898] Updated weights for policy 1, policy_version 25640 (0.0008) +[2023-10-08 12:47:48,312][102897] Updated weights for policy 0, policy_version 25630 (0.0009) +[2023-10-08 12:47:48,623][102898] Updated weights for policy 1, policy_version 25650 (0.0008) +[2023-10-08 12:47:48,996][102898] Updated weights for policy 1, policy_version 25660 (0.0009) +[2023-10-08 12:47:51,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 52527104. Throughput: 0: 1773.1, 1: 1783.3. Samples: 13139298. Policy #0 lag: (min: 17.0, avg: 31.5, max: 49.0) +[2023-10-08 12:47:51,875][101941] Avg episode reward: [(0, '6.550'), (1, '7.390')] +[2023-10-08 12:47:52,015][102897] Updated weights for policy 0, policy_version 25640 (0.0007) +[2023-10-08 12:47:52,385][102897] Updated weights for policy 0, policy_version 25650 (0.0007) +[2023-10-08 12:47:52,751][102897] Updated weights for policy 0, policy_version 25660 (0.0007) +[2023-10-08 12:47:52,789][102898] Updated weights for policy 1, policy_version 25670 (0.0009) +[2023-10-08 12:47:53,154][102898] Updated weights for policy 1, policy_version 25680 (0.0010) +[2023-10-08 12:47:53,525][102898] Updated weights for policy 1, policy_version 25690 (0.0009) +[2023-10-08 12:47:56,525][102897] Updated weights for policy 0, policy_version 25670 (0.0007) +[2023-10-08 12:47:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 52592640. Throughput: 0: 1780.5, 1: 1776.2. Samples: 13161472. Policy #0 lag: (min: 17.0, avg: 31.5, max: 49.0) +[2023-10-08 12:47:56,876][101941] Avg episode reward: [(0, '7.000'), (1, '7.870')] +[2023-10-08 12:47:56,901][102897] Updated weights for policy 0, policy_version 25680 (0.0008) +[2023-10-08 12:47:57,267][102897] Updated weights for policy 0, policy_version 25690 (0.0007) +[2023-10-08 12:47:57,301][102898] Updated weights for policy 1, policy_version 25700 (0.0009) +[2023-10-08 12:47:57,667][102898] Updated weights for policy 1, policy_version 25710 (0.0008) +[2023-10-08 12:47:58,038][102898] Updated weights for policy 1, policy_version 25720 (0.0009) +[2023-10-08 12:48:01,033][102897] Updated weights for policy 0, policy_version 25700 (0.0007) +[2023-10-08 12:48:01,410][102897] Updated weights for policy 0, policy_version 25710 (0.0007) +[2023-10-08 12:48:01,677][102898] Updated weights for policy 1, policy_version 25730 (0.0008) +[2023-10-08 12:48:01,788][102897] Updated weights for policy 0, policy_version 25720 (0.0008) +[2023-10-08 12:48:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 52658176. Throughput: 0: 1797.0, 1: 1792.0. Samples: 13183232. Policy #0 lag: (min: 17.0, avg: 31.5, max: 49.0) +[2023-10-08 12:48:01,875][101941] Avg episode reward: [(0, '7.220'), (1, '7.790')] +[2023-10-08 12:48:02,050][102898] Updated weights for policy 1, policy_version 25740 (0.0008) +[2023-10-08 12:48:02,421][102898] Updated weights for policy 1, policy_version 25750 (0.0008) +[2023-10-08 12:48:02,784][102898] Updated weights for policy 1, policy_version 25760 (0.0007) +[2023-10-08 12:48:05,513][102897] Updated weights for policy 0, policy_version 25730 (0.0010) +[2023-10-08 12:48:05,887][102897] Updated weights for policy 0, policy_version 25740 (0.0010) +[2023-10-08 12:48:06,253][102897] Updated weights for policy 0, policy_version 25750 (0.0008) +[2023-10-08 12:48:06,602][102898] Updated weights for policy 1, policy_version 25770 (0.0008) +[2023-10-08 12:48:06,623][102897] Updated weights for policy 0, policy_version 25760 (0.0007) +[2023-10-08 12:48:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 52756480. Throughput: 0: 1774.3, 1: 1775.0. Samples: 13193486. Policy #0 lag: (min: 17.0, avg: 26.6, max: 49.0) +[2023-10-08 12:48:06,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.030')] +[2023-10-08 12:48:06,967][102898] Updated weights for policy 1, policy_version 25780 (0.0010) +[2023-10-08 12:48:07,331][102898] Updated weights for policy 1, policy_version 25790 (0.0010) +[2023-10-08 12:48:10,272][102897] Updated weights for policy 0, policy_version 25770 (0.0009) +[2023-10-08 12:48:10,649][102897] Updated weights for policy 0, policy_version 25780 (0.0009) +[2023-10-08 12:48:10,987][102898] Updated weights for policy 1, policy_version 25800 (0.0009) +[2023-10-08 12:48:11,023][102897] Updated weights for policy 0, policy_version 25790 (0.0008) +[2023-10-08 12:48:11,355][102898] Updated weights for policy 1, policy_version 25810 (0.0009) +[2023-10-08 12:48:11,719][102898] Updated weights for policy 1, policy_version 25820 (0.0009) +[2023-10-08 12:48:11,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 52854784. Throughput: 0: 1799.7, 1: 1793.2. Samples: 13215474. Policy #0 lag: (min: 17.0, avg: 26.6, max: 49.0) +[2023-10-08 12:48:11,875][101941] Avg episode reward: [(0, '6.370'), (1, '7.340')] +[2023-10-08 12:48:15,048][102897] Updated weights for policy 0, policy_version 25800 (0.0008) +[2023-10-08 12:48:15,428][102897] Updated weights for policy 0, policy_version 25810 (0.0009) +[2023-10-08 12:48:15,630][102898] Updated weights for policy 1, policy_version 25830 (0.0007) +[2023-10-08 12:48:15,794][102897] Updated weights for policy 0, policy_version 25820 (0.0008) +[2023-10-08 12:48:16,018][102898] Updated weights for policy 1, policy_version 25840 (0.0009) +[2023-10-08 12:48:16,384][102898] Updated weights for policy 1, policy_version 25850 (0.0010) +[2023-10-08 12:48:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 52920320. Throughput: 0: 1780.2, 1: 1784.4. Samples: 13235384. Policy #0 lag: (min: 17.0, avg: 26.6, max: 49.0) +[2023-10-08 12:48:16,875][101941] Avg episode reward: [(0, '6.320'), (1, '7.270')] +[2023-10-08 12:48:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000025824_26443776.pth... +[2023-10-08 12:48:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000025856_26476544.pth... +[2023-10-08 12:48:16,914][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000024160_24739840.pth +[2023-10-08 12:48:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000024192_24772608.pth +[2023-10-08 12:48:19,608][102897] Updated weights for policy 0, policy_version 25830 (0.0008) +[2023-10-08 12:48:19,979][102897] Updated weights for policy 0, policy_version 25840 (0.0010) +[2023-10-08 12:48:20,190][102898] Updated weights for policy 1, policy_version 25860 (0.0008) +[2023-10-08 12:48:20,354][102897] Updated weights for policy 0, policy_version 25850 (0.0008) +[2023-10-08 12:48:20,561][102898] Updated weights for policy 1, policy_version 25870 (0.0008) +[2023-10-08 12:48:20,925][102898] Updated weights for policy 1, policy_version 25880 (0.0010) +[2023-10-08 12:48:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 52985856. Throughput: 0: 1806.6, 1: 1788.9. Samples: 13247614. Policy #0 lag: (min: 17.0, avg: 26.6, max: 49.0) +[2023-10-08 12:48:21,875][101941] Avg episode reward: [(0, '6.690'), (1, '7.230')] +[2023-10-08 12:48:24,075][102897] Updated weights for policy 0, policy_version 25860 (0.0010) +[2023-10-08 12:48:24,447][102897] Updated weights for policy 0, policy_version 25870 (0.0010) +[2023-10-08 12:48:24,786][102898] Updated weights for policy 1, policy_version 25890 (0.0010) +[2023-10-08 12:48:24,810][102897] Updated weights for policy 0, policy_version 25880 (0.0009) +[2023-10-08 12:48:25,153][102898] Updated weights for policy 1, policy_version 25900 (0.0009) +[2023-10-08 12:48:25,525][102898] Updated weights for policy 1, policy_version 25910 (0.0010) +[2023-10-08 12:48:25,888][102898] Updated weights for policy 1, policy_version 25920 (0.0007) +[2023-10-08 12:48:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 53051392. Throughput: 0: 1775.1, 1: 1783.3. Samples: 13267256. Policy #0 lag: (min: 20.0, avg: 21.0, max: 41.0) +[2023-10-08 12:48:26,876][101941] Avg episode reward: [(0, '6.230'), (1, '7.210')] +[2023-10-08 12:48:28,494][102897] Updated weights for policy 0, policy_version 25890 (0.0010) +[2023-10-08 12:48:28,862][102897] Updated weights for policy 0, policy_version 25900 (0.0010) +[2023-10-08 12:48:29,234][102897] Updated weights for policy 0, policy_version 25910 (0.0009) +[2023-10-08 12:48:29,603][102898] Updated weights for policy 1, policy_version 25930 (0.0008) +[2023-10-08 12:48:29,607][102897] Updated weights for policy 0, policy_version 25920 (0.0009) +[2023-10-08 12:48:29,972][102898] Updated weights for policy 1, policy_version 25940 (0.0007) +[2023-10-08 12:48:30,345][102898] Updated weights for policy 1, policy_version 25950 (0.0007) +[2023-10-08 12:48:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 53116928. Throughput: 0: 1778.3, 1: 1768.9. Samples: 13289148. Policy #0 lag: (min: 20.0, avg: 21.0, max: 41.0) +[2023-10-08 12:48:31,876][101941] Avg episode reward: [(0, '6.450'), (1, '6.480')] +[2023-10-08 12:48:33,440][102897] Updated weights for policy 0, policy_version 25930 (0.0009) +[2023-10-08 12:48:33,819][102897] Updated weights for policy 0, policy_version 25940 (0.0008) +[2023-10-08 12:48:34,184][102898] Updated weights for policy 1, policy_version 25960 (0.0008) +[2023-10-08 12:48:34,189][102897] Updated weights for policy 0, policy_version 25950 (0.0007) +[2023-10-08 12:48:34,551][102898] Updated weights for policy 1, policy_version 25970 (0.0008) +[2023-10-08 12:48:34,926][102898] Updated weights for policy 1, policy_version 25980 (0.0008) +[2023-10-08 12:48:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 53182464. Throughput: 0: 1775.6, 1: 1783.7. Samples: 13299470. Policy #0 lag: (min: 20.0, avg: 21.0, max: 41.0) +[2023-10-08 12:48:36,876][101941] Avg episode reward: [(0, '6.700'), (1, '6.790')] +[2023-10-08 12:48:37,930][102897] Updated weights for policy 0, policy_version 25960 (0.0008) +[2023-10-08 12:48:38,302][102897] Updated weights for policy 0, policy_version 25970 (0.0008) +[2023-10-08 12:48:38,674][102897] Updated weights for policy 0, policy_version 25980 (0.0009) +[2023-10-08 12:48:38,695][102898] Updated weights for policy 1, policy_version 25990 (0.0008) +[2023-10-08 12:48:39,062][102898] Updated weights for policy 1, policy_version 26000 (0.0007) +[2023-10-08 12:48:39,436][102898] Updated weights for policy 1, policy_version 26010 (0.0007) +[2023-10-08 12:48:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 53248000. Throughput: 0: 1774.2, 1: 1768.6. Samples: 13320900. Policy #0 lag: (min: 20.0, avg: 21.0, max: 41.0) +[2023-10-08 12:48:41,875][101941] Avg episode reward: [(0, '7.190'), (1, '7.500')] +[2023-10-08 12:48:42,521][102897] Updated weights for policy 0, policy_version 25990 (0.0009) +[2023-10-08 12:48:42,903][102897] Updated weights for policy 0, policy_version 26000 (0.0009) +[2023-10-08 12:48:43,199][102898] Updated weights for policy 1, policy_version 26020 (0.0008) +[2023-10-08 12:48:43,273][102897] Updated weights for policy 0, policy_version 26010 (0.0007) +[2023-10-08 12:48:43,563][102898] Updated weights for policy 1, policy_version 26030 (0.0007) +[2023-10-08 12:48:43,929][102898] Updated weights for policy 1, policy_version 26040 (0.0008) +[2023-10-08 12:48:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 53313536. Throughput: 0: 1787.4, 1: 1763.9. Samples: 13343042. Policy #0 lag: (min: 1.0, avg: 4.0, max: 33.0) +[2023-10-08 12:48:46,876][101941] Avg episode reward: [(0, '6.350'), (1, '7.680')] +[2023-10-08 12:48:47,126][102897] Updated weights for policy 0, policy_version 26020 (0.0008) +[2023-10-08 12:48:47,501][102897] Updated weights for policy 0, policy_version 26030 (0.0008) +[2023-10-08 12:48:47,867][102897] Updated weights for policy 0, policy_version 26040 (0.0009) +[2023-10-08 12:48:47,886][102898] Updated weights for policy 1, policy_version 26050 (0.0007) +[2023-10-08 12:48:48,262][102898] Updated weights for policy 1, policy_version 26060 (0.0007) +[2023-10-08 12:48:48,625][102898] Updated weights for policy 1, policy_version 26070 (0.0007) +[2023-10-08 12:48:48,998][102898] Updated weights for policy 1, policy_version 26080 (0.0008) +[2023-10-08 12:48:51,652][102897] Updated weights for policy 0, policy_version 26050 (0.0009) +[2023-10-08 12:48:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 53379072. Throughput: 0: 1773.7, 1: 1760.4. Samples: 13352524. Policy #0 lag: (min: 1.0, avg: 4.0, max: 33.0) +[2023-10-08 12:48:51,875][101941] Avg episode reward: [(0, '6.280'), (1, '7.650')] +[2023-10-08 12:48:52,017][102897] Updated weights for policy 0, policy_version 26060 (0.0010) +[2023-10-08 12:48:52,396][102897] Updated weights for policy 0, policy_version 26070 (0.0009) +[2023-10-08 12:48:52,761][102897] Updated weights for policy 0, policy_version 26080 (0.0010) +[2023-10-08 12:48:52,794][102898] Updated weights for policy 1, policy_version 26090 (0.0009) +[2023-10-08 12:48:53,169][102898] Updated weights for policy 1, policy_version 26100 (0.0011) +[2023-10-08 12:48:53,541][102898] Updated weights for policy 1, policy_version 26110 (0.0010) +[2023-10-08 12:48:56,678][102897] Updated weights for policy 0, policy_version 26090 (0.0008) +[2023-10-08 12:48:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 53444608. Throughput: 0: 1780.3, 1: 1759.4. Samples: 13374760. Policy #0 lag: (min: 1.0, avg: 4.0, max: 33.0) +[2023-10-08 12:48:56,876][101941] Avg episode reward: [(0, '5.870'), (1, '7.910')] +[2023-10-08 12:48:57,050][102897] Updated weights for policy 0, policy_version 26100 (0.0007) +[2023-10-08 12:48:57,225][102898] Updated weights for policy 1, policy_version 26120 (0.0009) +[2023-10-08 12:48:57,413][102897] Updated weights for policy 0, policy_version 26110 (0.0007) +[2023-10-08 12:48:57,582][102898] Updated weights for policy 1, policy_version 26130 (0.0008) +[2023-10-08 12:48:57,949][102898] Updated weights for policy 1, policy_version 26140 (0.0009) +[2023-10-08 12:49:01,101][102897] Updated weights for policy 0, policy_version 26120 (0.0007) +[2023-10-08 12:49:01,472][102897] Updated weights for policy 0, policy_version 26130 (0.0007) +[2023-10-08 12:49:01,804][102898] Updated weights for policy 1, policy_version 26150 (0.0008) +[2023-10-08 12:49:01,848][102897] Updated weights for policy 0, policy_version 26140 (0.0010) +[2023-10-08 12:49:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 53510144. Throughput: 0: 1786.6, 1: 1787.1. Samples: 13396198. Policy #0 lag: (min: 1.0, avg: 4.0, max: 33.0) +[2023-10-08 12:49:01,876][101941] Avg episode reward: [(0, '6.350'), (1, '7.320')] +[2023-10-08 12:49:02,171][102898] Updated weights for policy 1, policy_version 26160 (0.0009) +[2023-10-08 12:49:02,540][102898] Updated weights for policy 1, policy_version 26170 (0.0009) +[2023-10-08 12:49:05,365][102897] Updated weights for policy 0, policy_version 26150 (0.0007) +[2023-10-08 12:49:05,746][102897] Updated weights for policy 0, policy_version 26160 (0.0008) +[2023-10-08 12:49:06,118][102897] Updated weights for policy 0, policy_version 26170 (0.0007) +[2023-10-08 12:49:06,328][102898] Updated weights for policy 1, policy_version 26180 (0.0009) +[2023-10-08 12:49:06,704][102898] Updated weights for policy 1, policy_version 26190 (0.0009) +[2023-10-08 12:49:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 53608448. Throughput: 0: 1775.9, 1: 1759.8. Samples: 13406722. Policy #0 lag: (min: 28.0, avg: 32.4, max: 60.0) +[2023-10-08 12:49:06,876][101941] Avg episode reward: [(0, '6.770'), (1, '6.410')] +[2023-10-08 12:49:07,076][102898] Updated weights for policy 1, policy_version 26200 (0.0007) +[2023-10-08 12:49:09,974][102897] Updated weights for policy 0, policy_version 26180 (0.0008) +[2023-10-08 12:49:10,335][102897] Updated weights for policy 0, policy_version 26190 (0.0010) +[2023-10-08 12:49:10,702][102897] Updated weights for policy 0, policy_version 26200 (0.0010) +[2023-10-08 12:49:10,781][102898] Updated weights for policy 1, policy_version 26210 (0.0008) +[2023-10-08 12:49:11,147][102898] Updated weights for policy 1, policy_version 26220 (0.0010) +[2023-10-08 12:49:11,528][102898] Updated weights for policy 1, policy_version 26230 (0.0008) +[2023-10-08 12:49:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 13653.3, 300 sec: 14329.1). Total num frames: 53673984. Throughput: 0: 1792.9, 1: 1787.2. Samples: 13428364. Policy #0 lag: (min: 28.0, avg: 32.4, max: 60.0) +[2023-10-08 12:49:11,876][101941] Avg episode reward: [(0, '6.710'), (1, '6.790')] +[2023-10-08 12:49:11,894][102898] Updated weights for policy 1, policy_version 26240 (0.0010) +[2023-10-08 12:49:14,501][102897] Updated weights for policy 0, policy_version 26210 (0.0008) +[2023-10-08 12:49:14,883][102897] Updated weights for policy 0, policy_version 26220 (0.0007) +[2023-10-08 12:49:15,247][102897] Updated weights for policy 0, policy_version 26230 (0.0009) +[2023-10-08 12:49:15,619][102897] Updated weights for policy 0, policy_version 26240 (0.0008) +[2023-10-08 12:49:15,779][102898] Updated weights for policy 1, policy_version 26250 (0.0009) +[2023-10-08 12:49:16,150][102898] Updated weights for policy 1, policy_version 26260 (0.0009) +[2023-10-08 12:49:16,521][102898] Updated weights for policy 1, policy_version 26270 (0.0007) +[2023-10-08 12:49:16,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 53772288. Throughput: 0: 1772.5, 1: 1773.5. Samples: 13448714. Policy #0 lag: (min: 28.0, avg: 32.4, max: 60.0) +[2023-10-08 12:49:16,875][101941] Avg episode reward: [(0, '6.090'), (1, '7.680')] +[2023-10-08 12:49:19,445][102897] Updated weights for policy 0, policy_version 26250 (0.0008) +[2023-10-08 12:49:19,826][102897] Updated weights for policy 0, policy_version 26260 (0.0007) +[2023-10-08 12:49:20,201][102897] Updated weights for policy 0, policy_version 26270 (0.0007) +[2023-10-08 12:49:20,468][102898] Updated weights for policy 1, policy_version 26280 (0.0008) +[2023-10-08 12:49:20,832][102898] Updated weights for policy 1, policy_version 26290 (0.0009) +[2023-10-08 12:49:21,206][102898] Updated weights for policy 1, policy_version 26300 (0.0008) +[2023-10-08 12:49:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 53837824. Throughput: 0: 1796.1, 1: 1781.2. Samples: 13460446. Policy #0 lag: (min: 28.0, avg: 32.4, max: 60.0) +[2023-10-08 12:49:21,876][101941] Avg episode reward: [(0, '5.990'), (1, '7.090')] +[2023-10-08 12:49:23,933][102897] Updated weights for policy 0, policy_version 26280 (0.0007) +[2023-10-08 12:49:24,293][102897] Updated weights for policy 0, policy_version 26290 (0.0008) +[2023-10-08 12:49:24,674][102897] Updated weights for policy 0, policy_version 26300 (0.0008) +[2023-10-08 12:49:24,925][102898] Updated weights for policy 1, policy_version 26310 (0.0009) +[2023-10-08 12:49:25,294][102898] Updated weights for policy 1, policy_version 26320 (0.0008) +[2023-10-08 12:49:25,659][102898] Updated weights for policy 1, policy_version 26330 (0.0008) +[2023-10-08 12:49:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 53903360. Throughput: 0: 1774.3, 1: 1782.0. Samples: 13480934. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 12:49:26,876][101941] Avg episode reward: [(0, '6.560'), (1, '6.750')] +[2023-10-08 12:49:28,613][102897] Updated weights for policy 0, policy_version 26310 (0.0008) +[2023-10-08 12:49:28,985][102897] Updated weights for policy 0, policy_version 26320 (0.0008) +[2023-10-08 12:49:29,358][102897] Updated weights for policy 0, policy_version 26330 (0.0007) +[2023-10-08 12:49:29,380][102898] Updated weights for policy 1, policy_version 26340 (0.0007) +[2023-10-08 12:49:29,746][102898] Updated weights for policy 1, policy_version 26350 (0.0009) +[2023-10-08 12:49:30,116][102898] Updated weights for policy 1, policy_version 26360 (0.0008) +[2023-10-08 12:49:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 53968896. Throughput: 0: 1772.0, 1: 1771.5. Samples: 13502502. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 12:49:31,876][101941] Avg episode reward: [(0, '6.570'), (1, '7.410')] +[2023-10-08 12:49:32,934][102897] Updated weights for policy 0, policy_version 26340 (0.0007) +[2023-10-08 12:49:33,312][102897] Updated weights for policy 0, policy_version 26350 (0.0008) +[2023-10-08 12:49:33,670][102897] Updated weights for policy 0, policy_version 26360 (0.0007) +[2023-10-08 12:49:33,827][102898] Updated weights for policy 1, policy_version 26370 (0.0009) +[2023-10-08 12:49:34,197][102898] Updated weights for policy 1, policy_version 26380 (0.0008) +[2023-10-08 12:49:34,559][102898] Updated weights for policy 1, policy_version 26390 (0.0007) +[2023-10-08 12:49:34,937][102898] Updated weights for policy 1, policy_version 26400 (0.0008) +[2023-10-08 12:49:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 54034432. Throughput: 0: 1772.3, 1: 1789.9. Samples: 13512822. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 12:49:36,876][101941] Avg episode reward: [(0, '6.180'), (1, '6.870')] +[2023-10-08 12:49:37,329][102897] Updated weights for policy 0, policy_version 26370 (0.0007) +[2023-10-08 12:49:37,706][102897] Updated weights for policy 0, policy_version 26380 (0.0008) +[2023-10-08 12:49:38,075][102897] Updated weights for policy 0, policy_version 26390 (0.0008) +[2023-10-08 12:49:38,451][102897] Updated weights for policy 0, policy_version 26400 (0.0009) +[2023-10-08 12:49:38,820][102898] Updated weights for policy 1, policy_version 26410 (0.0009) +[2023-10-08 12:49:39,187][102898] Updated weights for policy 1, policy_version 26420 (0.0007) +[2023-10-08 12:49:39,560][102898] Updated weights for policy 1, policy_version 26430 (0.0011) +[2023-10-08 12:49:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 54099968. Throughput: 0: 1785.1, 1: 1775.7. Samples: 13534998. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 12:49:41,876][101941] Avg episode reward: [(0, '6.390'), (1, '5.950')] +[2023-10-08 12:49:42,052][102897] Updated weights for policy 0, policy_version 26410 (0.0010) +[2023-10-08 12:49:42,428][102897] Updated weights for policy 0, policy_version 26420 (0.0008) +[2023-10-08 12:49:42,812][102897] Updated weights for policy 0, policy_version 26430 (0.0007) +[2023-10-08 12:49:43,333][102898] Updated weights for policy 1, policy_version 26440 (0.0008) +[2023-10-08 12:49:43,705][102898] Updated weights for policy 1, policy_version 26450 (0.0007) +[2023-10-08 12:49:44,073][102898] Updated weights for policy 1, policy_version 26460 (0.0008) +[2023-10-08 12:49:46,622][102897] Updated weights for policy 0, policy_version 26440 (0.0007) +[2023-10-08 12:49:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 54165504. Throughput: 0: 1802.1, 1: 1779.9. Samples: 13557388. Policy #0 lag: (min: 31.0, avg: 34.5, max: 63.0) +[2023-10-08 12:49:46,875][101941] Avg episode reward: [(0, '6.490'), (1, '6.550')] +[2023-10-08 12:49:47,005][102897] Updated weights for policy 0, policy_version 26450 (0.0008) +[2023-10-08 12:49:47,382][102897] Updated weights for policy 0, policy_version 26460 (0.0009) +[2023-10-08 12:49:47,941][102898] Updated weights for policy 1, policy_version 26470 (0.0009) +[2023-10-08 12:49:48,303][102898] Updated weights for policy 1, policy_version 26480 (0.0007) +[2023-10-08 12:49:48,675][102898] Updated weights for policy 1, policy_version 26490 (0.0010) +[2023-10-08 12:49:51,127][102897] Updated weights for policy 0, policy_version 26470 (0.0009) +[2023-10-08 12:49:51,498][102897] Updated weights for policy 0, policy_version 26480 (0.0008) +[2023-10-08 12:49:51,861][102897] Updated weights for policy 0, policy_version 26490 (0.0009) +[2023-10-08 12:49:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 54231040. Throughput: 0: 1785.3, 1: 1780.1. Samples: 13567160. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:49:51,876][101941] Avg episode reward: [(0, '6.350'), (1, '6.640')] +[2023-10-08 12:49:52,354][102898] Updated weights for policy 1, policy_version 26500 (0.0009) +[2023-10-08 12:49:52,716][102898] Updated weights for policy 1, policy_version 26510 (0.0011) +[2023-10-08 12:49:53,082][102898] Updated weights for policy 1, policy_version 26520 (0.0008) +[2023-10-08 12:49:55,711][102897] Updated weights for policy 0, policy_version 26500 (0.0009) +[2023-10-08 12:49:56,083][102897] Updated weights for policy 0, policy_version 26510 (0.0008) +[2023-10-08 12:49:56,463][102897] Updated weights for policy 0, policy_version 26520 (0.0009) +[2023-10-08 12:49:56,872][102898] Updated weights for policy 1, policy_version 26530 (0.0009) +[2023-10-08 12:49:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 54329344. Throughput: 0: 1805.0, 1: 1774.8. Samples: 13589452. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:49:56,875][101941] Avg episode reward: [(0, '6.040'), (1, '7.320')] +[2023-10-08 12:49:57,234][102898] Updated weights for policy 1, policy_version 26540 (0.0007) +[2023-10-08 12:49:57,602][102898] Updated weights for policy 1, policy_version 26550 (0.0007) +[2023-10-08 12:49:57,973][102898] Updated weights for policy 1, policy_version 26560 (0.0008) +[2023-10-08 12:50:00,223][102897] Updated weights for policy 0, policy_version 26530 (0.0008) +[2023-10-08 12:50:00,584][102897] Updated weights for policy 0, policy_version 26540 (0.0008) +[2023-10-08 12:50:00,962][102897] Updated weights for policy 0, policy_version 26550 (0.0008) +[2023-10-08 12:50:01,333][102897] Updated weights for policy 0, policy_version 26560 (0.0007) +[2023-10-08 12:50:01,791][102898] Updated weights for policy 1, policy_version 26570 (0.0010) +[2023-10-08 12:50:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 54394880. Throughput: 0: 1787.5, 1: 1801.0. Samples: 13610196. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:50:01,876][101941] Avg episode reward: [(0, '6.470'), (1, '7.270')] +[2023-10-08 12:50:02,154][102898] Updated weights for policy 1, policy_version 26580 (0.0010) +[2023-10-08 12:50:02,528][102898] Updated weights for policy 1, policy_version 26590 (0.0007) +[2023-10-08 12:50:04,959][102897] Updated weights for policy 0, policy_version 26570 (0.0008) +[2023-10-08 12:50:05,338][102897] Updated weights for policy 0, policy_version 26580 (0.0008) +[2023-10-08 12:50:05,716][102897] Updated weights for policy 0, policy_version 26590 (0.0008) +[2023-10-08 12:50:06,312][102898] Updated weights for policy 1, policy_version 26600 (0.0011) +[2023-10-08 12:50:06,684][102898] Updated weights for policy 1, policy_version 26610 (0.0008) +[2023-10-08 12:50:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 54460416. Throughput: 0: 1799.7, 1: 1777.6. Samples: 13621426. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:50:06,876][101941] Avg episode reward: [(0, '6.490'), (1, '7.080')] +[2023-10-08 12:50:07,054][102898] Updated weights for policy 1, policy_version 26620 (0.0007) +[2023-10-08 12:50:09,667][102897] Updated weights for policy 0, policy_version 26600 (0.0009) +[2023-10-08 12:50:10,038][102897] Updated weights for policy 0, policy_version 26610 (0.0009) +[2023-10-08 12:50:10,416][102897] Updated weights for policy 0, policy_version 26620 (0.0010) +[2023-10-08 12:50:10,683][102898] Updated weights for policy 1, policy_version 26630 (0.0007) +[2023-10-08 12:50:11,047][102898] Updated weights for policy 1, policy_version 26640 (0.0007) +[2023-10-08 12:50:11,429][102898] Updated weights for policy 1, policy_version 26650 (0.0009) +[2023-10-08 12:50:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 54558720. Throughput: 0: 1794.6, 1: 1797.9. Samples: 13642596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:50:11,876][101941] Avg episode reward: [(0, '6.900'), (1, '6.510')] +[2023-10-08 12:50:14,218][102897] Updated weights for policy 0, policy_version 26630 (0.0009) +[2023-10-08 12:50:14,587][102897] Updated weights for policy 0, policy_version 26640 (0.0007) +[2023-10-08 12:50:14,968][102897] Updated weights for policy 0, policy_version 26650 (0.0009) +[2023-10-08 12:50:15,210][102898] Updated weights for policy 1, policy_version 26660 (0.0008) +[2023-10-08 12:50:15,581][102898] Updated weights for policy 1, policy_version 26670 (0.0009) +[2023-10-08 12:50:15,957][102898] Updated weights for policy 1, policy_version 26680 (0.0009) +[2023-10-08 12:50:16,876][101941] Fps is (10 sec: 16383.4, 60 sec: 14199.3, 300 sec: 14329.0). Total num frames: 54624256. Throughput: 0: 1789.2, 1: 1778.6. Samples: 13663054. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:50:16,877][101941] Avg episode reward: [(0, '7.020'), (1, '6.470')] +[2023-10-08 12:50:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000026656_27295744.pth... +[2023-10-08 12:50:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000026688_27328512.pth... +[2023-10-08 12:50:16,917][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000024992_25591808.pth +[2023-10-08 12:50:16,922][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000025024_25624576.pth +[2023-10-08 12:50:18,706][102897] Updated weights for policy 0, policy_version 26660 (0.0009) +[2023-10-08 12:50:19,082][102897] Updated weights for policy 0, policy_version 26670 (0.0008) +[2023-10-08 12:50:19,457][102897] Updated weights for policy 0, policy_version 26680 (0.0009) +[2023-10-08 12:50:19,885][102898] Updated weights for policy 1, policy_version 26690 (0.0007) +[2023-10-08 12:50:20,260][102898] Updated weights for policy 1, policy_version 26700 (0.0007) +[2023-10-08 12:50:20,617][102898] Updated weights for policy 1, policy_version 26710 (0.0008) +[2023-10-08 12:50:20,987][102898] Updated weights for policy 1, policy_version 26720 (0.0010) +[2023-10-08 12:50:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 54689792. Throughput: 0: 1803.9, 1: 1794.1. Samples: 13674730. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:50:21,876][101941] Avg episode reward: [(0, '6.780'), (1, '6.310')] +[2023-10-08 12:50:23,340][102897] Updated weights for policy 0, policy_version 26690 (0.0010) +[2023-10-08 12:50:23,706][102897] Updated weights for policy 0, policy_version 26700 (0.0007) +[2023-10-08 12:50:24,088][102897] Updated weights for policy 0, policy_version 26710 (0.0008) +[2023-10-08 12:50:24,454][102897] Updated weights for policy 0, policy_version 26720 (0.0008) +[2023-10-08 12:50:24,776][102898] Updated weights for policy 1, policy_version 26730 (0.0008) +[2023-10-08 12:50:25,144][102898] Updated weights for policy 1, policy_version 26740 (0.0009) +[2023-10-08 12:50:25,514][102898] Updated weights for policy 1, policy_version 26750 (0.0009) +[2023-10-08 12:50:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 54755328. Throughput: 0: 1775.3, 1: 1783.7. Samples: 13695152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:50:26,876][101941] Avg episode reward: [(0, '6.570'), (1, '6.430')] +[2023-10-08 12:50:28,216][102897] Updated weights for policy 0, policy_version 26730 (0.0007) +[2023-10-08 12:50:28,593][102897] Updated weights for policy 0, policy_version 26740 (0.0007) +[2023-10-08 12:50:28,967][102897] Updated weights for policy 0, policy_version 26750 (0.0007) +[2023-10-08 12:50:29,292][102898] Updated weights for policy 1, policy_version 26760 (0.0008) +[2023-10-08 12:50:29,668][102898] Updated weights for policy 1, policy_version 26770 (0.0008) +[2023-10-08 12:50:30,032][102898] Updated weights for policy 1, policy_version 26780 (0.0007) +[2023-10-08 12:50:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 54820864. Throughput: 0: 1774.9, 1: 1774.1. Samples: 13717094. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:50:31,876][101941] Avg episode reward: [(0, '6.420'), (1, '6.530')] +[2023-10-08 12:50:32,892][102897] Updated weights for policy 0, policy_version 26760 (0.0009) +[2023-10-08 12:50:33,257][102897] Updated weights for policy 0, policy_version 26770 (0.0010) +[2023-10-08 12:50:33,626][102897] Updated weights for policy 0, policy_version 26780 (0.0010) +[2023-10-08 12:50:33,790][102898] Updated weights for policy 1, policy_version 26790 (0.0008) +[2023-10-08 12:50:34,167][102898] Updated weights for policy 1, policy_version 26800 (0.0009) +[2023-10-08 12:50:34,536][102898] Updated weights for policy 1, policy_version 26810 (0.0007) +[2023-10-08 12:50:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 54886400. Throughput: 0: 1767.2, 1: 1785.4. Samples: 13727024. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:50:36,875][101941] Avg episode reward: [(0, '6.250'), (1, '6.700')] +[2023-10-08 12:50:37,340][102897] Updated weights for policy 0, policy_version 26790 (0.0007) +[2023-10-08 12:50:37,711][102897] Updated weights for policy 0, policy_version 26800 (0.0007) +[2023-10-08 12:50:38,084][102897] Updated weights for policy 0, policy_version 26810 (0.0008) +[2023-10-08 12:50:38,324][102898] Updated weights for policy 1, policy_version 26820 (0.0008) +[2023-10-08 12:50:38,693][102898] Updated weights for policy 1, policy_version 26830 (0.0007) +[2023-10-08 12:50:39,056][102898] Updated weights for policy 1, policy_version 26840 (0.0007) +[2023-10-08 12:50:41,819][102897] Updated weights for policy 0, policy_version 26820 (0.0007) +[2023-10-08 12:50:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 54951936. Throughput: 0: 1769.4, 1: 1779.2. Samples: 13749136. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:50:41,876][101941] Avg episode reward: [(0, '6.730'), (1, '7.300')] +[2023-10-08 12:50:42,190][102897] Updated weights for policy 0, policy_version 26830 (0.0009) +[2023-10-08 12:50:42,559][102897] Updated weights for policy 0, policy_version 26840 (0.0008) +[2023-10-08 12:50:42,747][102898] Updated weights for policy 1, policy_version 26850 (0.0008) +[2023-10-08 12:50:43,107][102898] Updated weights for policy 1, policy_version 26860 (0.0007) +[2023-10-08 12:50:43,473][102898] Updated weights for policy 1, policy_version 26870 (0.0007) +[2023-10-08 12:50:43,848][102898] Updated weights for policy 1, policy_version 26880 (0.0008) +[2023-10-08 12:50:46,397][102897] Updated weights for policy 0, policy_version 26850 (0.0008) +[2023-10-08 12:50:46,769][102897] Updated weights for policy 0, policy_version 26860 (0.0007) +[2023-10-08 12:50:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 55017472. Throughput: 0: 1801.6, 1: 1784.8. Samples: 13771580. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:50:46,876][101941] Avg episode reward: [(0, '7.140'), (1, '6.870')] +[2023-10-08 12:50:47,152][102897] Updated weights for policy 0, policy_version 26870 (0.0008) +[2023-10-08 12:50:47,522][102897] Updated weights for policy 0, policy_version 26880 (0.0009) +[2023-10-08 12:50:47,646][102898] Updated weights for policy 1, policy_version 26890 (0.0007) +[2023-10-08 12:50:48,017][102898] Updated weights for policy 1, policy_version 26900 (0.0009) +[2023-10-08 12:50:48,390][102898] Updated weights for policy 1, policy_version 26910 (0.0008) +[2023-10-08 12:50:51,443][102897] Updated weights for policy 0, policy_version 26890 (0.0007) +[2023-10-08 12:50:51,818][102897] Updated weights for policy 0, policy_version 26900 (0.0007) +[2023-10-08 12:50:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 55083008. Throughput: 0: 1770.4, 1: 1783.3. Samples: 13781344. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 12:50:51,875][101941] Avg episode reward: [(0, '7.360'), (1, '6.320')] +[2023-10-08 12:50:52,101][102898] Updated weights for policy 1, policy_version 26920 (0.0007) +[2023-10-08 12:50:52,184][102897] Updated weights for policy 0, policy_version 26910 (0.0009) +[2023-10-08 12:50:52,477][102898] Updated weights for policy 1, policy_version 26930 (0.0008) +[2023-10-08 12:50:52,857][102898] Updated weights for policy 1, policy_version 26940 (0.0009) +[2023-10-08 12:50:55,882][102897] Updated weights for policy 0, policy_version 26920 (0.0010) +[2023-10-08 12:50:56,259][102897] Updated weights for policy 0, policy_version 26930 (0.0010) +[2023-10-08 12:50:56,618][102898] Updated weights for policy 1, policy_version 26950 (0.0007) +[2023-10-08 12:50:56,635][102897] Updated weights for policy 0, policy_version 26940 (0.0008) +[2023-10-08 12:50:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 55181312. Throughput: 0: 1799.5, 1: 1783.3. Samples: 13803826. Policy #0 lag: (min: 5.0, avg: 5.2, max: 15.0) +[2023-10-08 12:50:56,876][101941] Avg episode reward: [(0, '7.090'), (1, '7.420')] +[2023-10-08 12:50:56,985][102898] Updated weights for policy 1, policy_version 26960 (0.0009) +[2023-10-08 12:50:57,357][102898] Updated weights for policy 1, policy_version 26970 (0.0009) +[2023-10-08 12:51:00,326][102897] Updated weights for policy 0, policy_version 26950 (0.0011) +[2023-10-08 12:51:00,697][102897] Updated weights for policy 0, policy_version 26960 (0.0010) +[2023-10-08 12:51:01,070][102897] Updated weights for policy 0, policy_version 26970 (0.0007) +[2023-10-08 12:51:01,175][102898] Updated weights for policy 1, policy_version 26980 (0.0010) +[2023-10-08 12:51:01,543][102898] Updated weights for policy 1, policy_version 26990 (0.0008) +[2023-10-08 12:51:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 55246848. Throughput: 0: 1770.8, 1: 1801.3. Samples: 13823794. Policy #0 lag: (min: 5.0, avg: 5.2, max: 15.0) +[2023-10-08 12:51:01,876][101941] Avg episode reward: [(0, '6.470'), (1, '8.030')] +[2023-10-08 12:51:01,907][102898] Updated weights for policy 1, policy_version 27000 (0.0009) +[2023-10-08 12:51:02,203][102760] Saving new best policy, reward=8.030! +[2023-10-08 12:51:04,859][102897] Updated weights for policy 0, policy_version 26980 (0.0007) +[2023-10-08 12:51:05,241][102897] Updated weights for policy 0, policy_version 26990 (0.0008) +[2023-10-08 12:51:05,585][102898] Updated weights for policy 1, policy_version 27010 (0.0008) +[2023-10-08 12:51:05,608][102897] Updated weights for policy 0, policy_version 27000 (0.0009) +[2023-10-08 12:51:05,951][102898] Updated weights for policy 1, policy_version 27020 (0.0009) +[2023-10-08 12:51:06,318][102898] Updated weights for policy 1, policy_version 27030 (0.0009) +[2023-10-08 12:51:06,696][102898] Updated weights for policy 1, policy_version 27040 (0.0008) +[2023-10-08 12:51:06,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 55345152. Throughput: 0: 1795.0, 1: 1782.8. Samples: 13835730. Policy #0 lag: (min: 5.0, avg: 5.2, max: 15.0) +[2023-10-08 12:51:06,875][101941] Avg episode reward: [(0, '6.560'), (1, '6.900')] +[2023-10-08 12:51:09,313][102897] Updated weights for policy 0, policy_version 27010 (0.0009) +[2023-10-08 12:51:09,695][102897] Updated weights for policy 0, policy_version 27020 (0.0008) +[2023-10-08 12:51:10,075][102897] Updated weights for policy 0, policy_version 27030 (0.0008) +[2023-10-08 12:51:10,307][102898] Updated weights for policy 1, policy_version 27050 (0.0007) +[2023-10-08 12:51:10,437][102897] Updated weights for policy 0, policy_version 27040 (0.0008) +[2023-10-08 12:51:10,684][102898] Updated weights for policy 1, policy_version 27060 (0.0009) +[2023-10-08 12:51:11,041][102898] Updated weights for policy 1, policy_version 27070 (0.0008) +[2023-10-08 12:51:11,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 55410688. Throughput: 0: 1782.0, 1: 1797.3. Samples: 13856224. Policy #0 lag: (min: 5.0, avg: 5.2, max: 15.0) +[2023-10-08 12:51:11,876][101941] Avg episode reward: [(0, '7.000'), (1, '6.490')] +[2023-10-08 12:51:14,124][102897] Updated weights for policy 0, policy_version 27050 (0.0010) +[2023-10-08 12:51:14,498][102897] Updated weights for policy 0, policy_version 27060 (0.0011) +[2023-10-08 12:51:14,847][102898] Updated weights for policy 1, policy_version 27080 (0.0007) +[2023-10-08 12:51:14,876][102897] Updated weights for policy 0, policy_version 27070 (0.0007) +[2023-10-08 12:51:15,217][102898] Updated weights for policy 1, policy_version 27090 (0.0009) +[2023-10-08 12:51:15,581][102898] Updated weights for policy 1, policy_version 27100 (0.0010) +[2023-10-08 12:51:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 55476224. Throughput: 0: 1778.9, 1: 1787.1. Samples: 13877566. Policy #0 lag: (min: 12.0, avg: 13.9, max: 40.0) +[2023-10-08 12:51:16,875][101941] Avg episode reward: [(0, '6.800'), (1, '7.030')] +[2023-10-08 12:51:18,708][102897] Updated weights for policy 0, policy_version 27080 (0.0009) +[2023-10-08 12:51:19,089][102897] Updated weights for policy 0, policy_version 27090 (0.0009) +[2023-10-08 12:51:19,407][102898] Updated weights for policy 1, policy_version 27110 (0.0008) +[2023-10-08 12:51:19,456][102897] Updated weights for policy 0, policy_version 27100 (0.0008) +[2023-10-08 12:51:19,773][102898] Updated weights for policy 1, policy_version 27120 (0.0009) +[2023-10-08 12:51:20,150][102898] Updated weights for policy 1, policy_version 27130 (0.0009) +[2023-10-08 12:51:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 55541760. Throughput: 0: 1786.4, 1: 1808.4. Samples: 13888792. Policy #0 lag: (min: 12.0, avg: 13.9, max: 40.0) +[2023-10-08 12:51:21,876][101941] Avg episode reward: [(0, '6.980'), (1, '7.100')] +[2023-10-08 12:51:23,203][102897] Updated weights for policy 0, policy_version 27110 (0.0007) +[2023-10-08 12:51:23,571][102897] Updated weights for policy 0, policy_version 27120 (0.0007) +[2023-10-08 12:51:23,949][102897] Updated weights for policy 0, policy_version 27130 (0.0008) +[2023-10-08 12:51:23,955][102898] Updated weights for policy 1, policy_version 27140 (0.0009) +[2023-10-08 12:51:24,326][102898] Updated weights for policy 1, policy_version 27150 (0.0009) +[2023-10-08 12:51:24,692][102898] Updated weights for policy 1, policy_version 27160 (0.0009) +[2023-10-08 12:51:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 55607296. Throughput: 0: 1776.0, 1: 1786.3. Samples: 13909440. Policy #0 lag: (min: 12.0, avg: 13.9, max: 40.0) +[2023-10-08 12:51:26,876][101941] Avg episode reward: [(0, '6.560'), (1, '7.170')] +[2023-10-08 12:51:27,559][102897] Updated weights for policy 0, policy_version 27140 (0.0008) +[2023-10-08 12:51:27,926][102897] Updated weights for policy 0, policy_version 27150 (0.0008) +[2023-10-08 12:51:28,300][102897] Updated weights for policy 0, policy_version 27160 (0.0008) +[2023-10-08 12:51:28,628][102898] Updated weights for policy 1, policy_version 27170 (0.0010) +[2023-10-08 12:51:28,987][102898] Updated weights for policy 1, policy_version 27180 (0.0008) +[2023-10-08 12:51:29,359][102898] Updated weights for policy 1, policy_version 27190 (0.0008) +[2023-10-08 12:51:29,736][102898] Updated weights for policy 1, policy_version 27200 (0.0008) +[2023-10-08 12:51:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 55672832. Throughput: 0: 1778.3, 1: 1778.8. Samples: 13931650. Policy #0 lag: (min: 12.0, avg: 13.9, max: 40.0) +[2023-10-08 12:51:31,876][101941] Avg episode reward: [(0, '6.170'), (1, '6.570')] +[2023-10-08 12:51:32,103][102897] Updated weights for policy 0, policy_version 27170 (0.0008) +[2023-10-08 12:51:32,470][102897] Updated weights for policy 0, policy_version 27180 (0.0007) +[2023-10-08 12:51:32,847][102897] Updated weights for policy 0, policy_version 27190 (0.0009) +[2023-10-08 12:51:33,217][102897] Updated weights for policy 0, policy_version 27200 (0.0007) +[2023-10-08 12:51:33,601][102898] Updated weights for policy 1, policy_version 27210 (0.0008) +[2023-10-08 12:51:33,972][102898] Updated weights for policy 1, policy_version 27220 (0.0009) +[2023-10-08 12:51:34,347][102898] Updated weights for policy 1, policy_version 27230 (0.0009) +[2023-10-08 12:51:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 55738368. Throughput: 0: 1778.1, 1: 1776.8. Samples: 13941316. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:51:36,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.020')] +[2023-10-08 12:51:37,051][102897] Updated weights for policy 0, policy_version 27210 (0.0008) +[2023-10-08 12:51:37,427][102897] Updated weights for policy 0, policy_version 27220 (0.0007) +[2023-10-08 12:51:37,791][102897] Updated weights for policy 0, policy_version 27230 (0.0007) +[2023-10-08 12:51:37,953][102898] Updated weights for policy 1, policy_version 27240 (0.0008) +[2023-10-08 12:51:38,317][102898] Updated weights for policy 1, policy_version 27250 (0.0009) +[2023-10-08 12:51:38,683][102898] Updated weights for policy 1, policy_version 27260 (0.0009) +[2023-10-08 12:51:41,630][102897] Updated weights for policy 0, policy_version 27240 (0.0008) +[2023-10-08 12:51:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 55803904. Throughput: 0: 1780.6, 1: 1776.7. Samples: 13963904. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:51:41,875][101941] Avg episode reward: [(0, '6.590'), (1, '7.160')] +[2023-10-08 12:51:42,015][102897] Updated weights for policy 0, policy_version 27250 (0.0009) +[2023-10-08 12:51:42,370][102897] Updated weights for policy 0, policy_version 27260 (0.0009) +[2023-10-08 12:51:42,516][102898] Updated weights for policy 1, policy_version 27270 (0.0007) +[2023-10-08 12:51:42,886][102898] Updated weights for policy 1, policy_version 27280 (0.0007) +[2023-10-08 12:51:43,247][102898] Updated weights for policy 1, policy_version 27290 (0.0007) +[2023-10-08 12:51:45,897][102897] Updated weights for policy 0, policy_version 27270 (0.0008) +[2023-10-08 12:51:46,273][102897] Updated weights for policy 0, policy_version 27280 (0.0009) +[2023-10-08 12:51:46,652][102897] Updated weights for policy 0, policy_version 27290 (0.0008) +[2023-10-08 12:51:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 55902208. Throughput: 0: 1804.8, 1: 1794.4. Samples: 13985758. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:51:46,876][101941] Avg episode reward: [(0, '6.470'), (1, '6.780')] +[2023-10-08 12:51:46,952][102898] Updated weights for policy 1, policy_version 27300 (0.0008) +[2023-10-08 12:51:47,319][102898] Updated weights for policy 1, policy_version 27310 (0.0009) +[2023-10-08 12:51:47,691][102898] Updated weights for policy 1, policy_version 27320 (0.0009) +[2023-10-08 12:51:50,375][102897] Updated weights for policy 0, policy_version 27300 (0.0008) +[2023-10-08 12:51:50,739][102897] Updated weights for policy 0, policy_version 27310 (0.0010) +[2023-10-08 12:51:51,097][102897] Updated weights for policy 0, policy_version 27320 (0.0010) +[2023-10-08 12:51:51,373][102898] Updated weights for policy 1, policy_version 27330 (0.0009) +[2023-10-08 12:51:51,734][102898] Updated weights for policy 1, policy_version 27340 (0.0008) +[2023-10-08 12:51:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 55967744. Throughput: 0: 1787.1, 1: 1781.4. Samples: 13996312. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:51:51,876][101941] Avg episode reward: [(0, '6.490'), (1, '6.870')] +[2023-10-08 12:51:52,097][102898] Updated weights for policy 1, policy_version 27350 (0.0011) +[2023-10-08 12:51:52,466][102898] Updated weights for policy 1, policy_version 27360 (0.0011) +[2023-10-08 12:51:54,828][102897] Updated weights for policy 0, policy_version 27330 (0.0009) +[2023-10-08 12:51:55,205][102897] Updated weights for policy 0, policy_version 27340 (0.0007) +[2023-10-08 12:51:55,572][102897] Updated weights for policy 0, policy_version 27350 (0.0008) +[2023-10-08 12:51:55,942][102897] Updated weights for policy 0, policy_version 27360 (0.0007) +[2023-10-08 12:51:56,366][102898] Updated weights for policy 1, policy_version 27370 (0.0007) +[2023-10-08 12:51:56,730][102898] Updated weights for policy 1, policy_version 27380 (0.0007) +[2023-10-08 12:51:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 56033280. Throughput: 0: 1801.8, 1: 1791.8. Samples: 14017936. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:51:56,876][101941] Avg episode reward: [(0, '6.570'), (1, '6.830')] +[2023-10-08 12:51:57,094][102898] Updated weights for policy 1, policy_version 27390 (0.0007) +[2023-10-08 12:51:59,649][102897] Updated weights for policy 0, policy_version 27370 (0.0007) +[2023-10-08 12:52:00,027][102897] Updated weights for policy 0, policy_version 27380 (0.0007) +[2023-10-08 12:52:00,398][102897] Updated weights for policy 0, policy_version 27390 (0.0008) +[2023-10-08 12:52:00,842][102898] Updated weights for policy 1, policy_version 27400 (0.0009) +[2023-10-08 12:52:01,207][102898] Updated weights for policy 1, policy_version 27410 (0.0007) +[2023-10-08 12:52:01,579][102898] Updated weights for policy 1, policy_version 27420 (0.0008) +[2023-10-08 12:52:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 56131584. Throughput: 0: 1793.9, 1: 1785.3. Samples: 14038632. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:52:01,876][101941] Avg episode reward: [(0, '6.510'), (1, '6.710')] +[2023-10-08 12:52:04,159][102897] Updated weights for policy 0, policy_version 27400 (0.0008) +[2023-10-08 12:52:04,530][102897] Updated weights for policy 0, policy_version 27410 (0.0008) +[2023-10-08 12:52:04,909][102897] Updated weights for policy 0, policy_version 27420 (0.0010) +[2023-10-08 12:52:05,323][102898] Updated weights for policy 1, policy_version 27430 (0.0009) +[2023-10-08 12:52:05,699][102898] Updated weights for policy 1, policy_version 27440 (0.0008) +[2023-10-08 12:52:06,065][102898] Updated weights for policy 1, policy_version 27450 (0.0007) +[2023-10-08 12:52:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 56197120. Throughput: 0: 1810.0, 1: 1779.8. Samples: 14050332. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:52:06,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.000')] +[2023-10-08 12:52:08,818][102897] Updated weights for policy 0, policy_version 27430 (0.0008) +[2023-10-08 12:52:09,183][102897] Updated weights for policy 0, policy_version 27440 (0.0008) +[2023-10-08 12:52:09,555][102897] Updated weights for policy 0, policy_version 27450 (0.0009) +[2023-10-08 12:52:09,691][102898] Updated weights for policy 1, policy_version 27460 (0.0007) +[2023-10-08 12:52:10,060][102898] Updated weights for policy 1, policy_version 27470 (0.0009) +[2023-10-08 12:52:10,427][102898] Updated weights for policy 1, policy_version 27480 (0.0008) +[2023-10-08 12:52:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 56262656. Throughput: 0: 1795.2, 1: 1784.9. Samples: 14070548. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:52:11,876][101941] Avg episode reward: [(0, '6.020'), (1, '7.080')] +[2023-10-08 12:52:13,194][102897] Updated weights for policy 0, policy_version 27460 (0.0007) +[2023-10-08 12:52:13,571][102897] Updated weights for policy 0, policy_version 27470 (0.0007) +[2023-10-08 12:52:13,943][102897] Updated weights for policy 0, policy_version 27480 (0.0007) +[2023-10-08 12:52:14,102][102898] Updated weights for policy 1, policy_version 27490 (0.0008) +[2023-10-08 12:52:14,476][102898] Updated weights for policy 1, policy_version 27500 (0.0009) +[2023-10-08 12:52:14,841][102898] Updated weights for policy 1, policy_version 27510 (0.0008) +[2023-10-08 12:52:15,206][102898] Updated weights for policy 1, policy_version 27520 (0.0009) +[2023-10-08 12:52:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 56328192. Throughput: 0: 1798.3, 1: 1781.5. Samples: 14092740. Policy #0 lag: (min: 31.0, avg: 36.5, max: 63.0) +[2023-10-08 12:52:16,875][101941] Avg episode reward: [(0, '6.330'), (1, '6.740')] +[2023-10-08 12:52:16,882][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000027488_28147712.pth... +[2023-10-08 12:52:16,882][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000027520_28180480.pth... +[2023-10-08 12:52:16,913][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000025856_26476544.pth +[2023-10-08 12:52:16,923][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000025824_26443776.pth +[2023-10-08 12:52:17,676][102897] Updated weights for policy 0, policy_version 27490 (0.0009) +[2023-10-08 12:52:18,056][102897] Updated weights for policy 0, policy_version 27500 (0.0007) +[2023-10-08 12:52:18,422][102897] Updated weights for policy 0, policy_version 27510 (0.0007) +[2023-10-08 12:52:18,792][102897] Updated weights for policy 0, policy_version 27520 (0.0007) +[2023-10-08 12:52:18,865][102898] Updated weights for policy 1, policy_version 27530 (0.0008) +[2023-10-08 12:52:19,224][102898] Updated weights for policy 1, policy_version 27540 (0.0010) +[2023-10-08 12:52:19,591][102898] Updated weights for policy 1, policy_version 27550 (0.0007) +[2023-10-08 12:52:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 56393728. Throughput: 0: 1797.9, 1: 1797.7. Samples: 14103120. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 12:52:21,875][101941] Avg episode reward: [(0, '6.140'), (1, '7.730')] +[2023-10-08 12:52:22,697][102897] Updated weights for policy 0, policy_version 27530 (0.0008) +[2023-10-08 12:52:23,066][102897] Updated weights for policy 0, policy_version 27540 (0.0008) +[2023-10-08 12:52:23,439][102897] Updated weights for policy 0, policy_version 27550 (0.0008) +[2023-10-08 12:52:23,476][102898] Updated weights for policy 1, policy_version 27560 (0.0008) +[2023-10-08 12:52:23,840][102898] Updated weights for policy 1, policy_version 27570 (0.0010) +[2023-10-08 12:52:24,210][102898] Updated weights for policy 1, policy_version 27580 (0.0010) +[2023-10-08 12:52:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 56459264. Throughput: 0: 1788.3, 1: 1786.1. Samples: 14124750. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 12:52:26,876][101941] Avg episode reward: [(0, '6.210'), (1, '7.890')] +[2023-10-08 12:52:27,152][102897] Updated weights for policy 0, policy_version 27560 (0.0008) +[2023-10-08 12:52:27,518][102897] Updated weights for policy 0, policy_version 27570 (0.0008) +[2023-10-08 12:52:27,897][102897] Updated weights for policy 0, policy_version 27580 (0.0008) +[2023-10-08 12:52:28,058][102898] Updated weights for policy 1, policy_version 27590 (0.0010) +[2023-10-08 12:52:28,423][102898] Updated weights for policy 1, policy_version 27600 (0.0009) +[2023-10-08 12:52:28,788][102898] Updated weights for policy 1, policy_version 27610 (0.0008) +[2023-10-08 12:52:31,564][102897] Updated weights for policy 0, policy_version 27590 (0.0008) +[2023-10-08 12:52:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 56524800. Throughput: 0: 1806.5, 1: 1782.4. Samples: 14147260. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 12:52:31,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.300')] +[2023-10-08 12:52:31,936][102897] Updated weights for policy 0, policy_version 27600 (0.0008) +[2023-10-08 12:52:32,323][102897] Updated weights for policy 0, policy_version 27610 (0.0010) +[2023-10-08 12:52:32,797][102898] Updated weights for policy 1, policy_version 27620 (0.0008) +[2023-10-08 12:52:33,172][102898] Updated weights for policy 1, policy_version 27630 (0.0007) +[2023-10-08 12:52:33,547][102898] Updated weights for policy 1, policy_version 27640 (0.0011) +[2023-10-08 12:52:35,949][102897] Updated weights for policy 0, policy_version 27620 (0.0009) +[2023-10-08 12:52:36,324][102897] Updated weights for policy 0, policy_version 27630 (0.0009) +[2023-10-08 12:52:36,695][102897] Updated weights for policy 0, policy_version 27640 (0.0007) +[2023-10-08 12:52:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 56590336. Throughput: 0: 1788.8, 1: 1783.3. Samples: 14157056. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 12:52:36,875][101941] Avg episode reward: [(0, '6.430'), (1, '6.870')] +[2023-10-08 12:52:37,448][102898] Updated weights for policy 1, policy_version 27650 (0.0009) +[2023-10-08 12:52:37,819][102898] Updated weights for policy 1, policy_version 27660 (0.0011) +[2023-10-08 12:52:38,188][102898] Updated weights for policy 1, policy_version 27670 (0.0009) +[2023-10-08 12:52:38,545][102898] Updated weights for policy 1, policy_version 27680 (0.0009) +[2023-10-08 12:52:40,458][102897] Updated weights for policy 0, policy_version 27650 (0.0008) +[2023-10-08 12:52:40,827][102897] Updated weights for policy 0, policy_version 27660 (0.0009) +[2023-10-08 12:52:41,204][102897] Updated weights for policy 0, policy_version 27670 (0.0007) +[2023-10-08 12:52:41,566][102897] Updated weights for policy 0, policy_version 27680 (0.0008) +[2023-10-08 12:52:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 56688640. Throughput: 0: 1807.1, 1: 1779.6. Samples: 14179338. Policy #0 lag: (min: 20.0, avg: 27.5, max: 52.0) +[2023-10-08 12:52:41,875][101941] Avg episode reward: [(0, '6.610'), (1, '6.420')] +[2023-10-08 12:52:42,276][102898] Updated weights for policy 1, policy_version 27690 (0.0007) +[2023-10-08 12:52:42,633][102898] Updated weights for policy 1, policy_version 27700 (0.0010) +[2023-10-08 12:52:43,001][102898] Updated weights for policy 1, policy_version 27710 (0.0011) +[2023-10-08 12:52:45,420][102897] Updated weights for policy 0, policy_version 27690 (0.0008) +[2023-10-08 12:52:45,797][102897] Updated weights for policy 0, policy_version 27700 (0.0008) +[2023-10-08 12:52:46,168][102897] Updated weights for policy 0, policy_version 27710 (0.0009) +[2023-10-08 12:52:46,711][102898] Updated weights for policy 1, policy_version 27720 (0.0011) +[2023-10-08 12:52:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 56754176. Throughput: 0: 1782.5, 1: 1806.1. Samples: 14200118. Policy #0 lag: (min: 20.0, avg: 27.5, max: 52.0) +[2023-10-08 12:52:46,875][101941] Avg episode reward: [(0, '6.810'), (1, '6.730')] +[2023-10-08 12:52:47,077][102898] Updated weights for policy 1, policy_version 27730 (0.0011) +[2023-10-08 12:52:47,446][102898] Updated weights for policy 1, policy_version 27740 (0.0008) +[2023-10-08 12:52:49,986][102897] Updated weights for policy 0, policy_version 27720 (0.0010) +[2023-10-08 12:52:50,358][102897] Updated weights for policy 0, policy_version 27730 (0.0009) +[2023-10-08 12:52:50,725][102897] Updated weights for policy 0, policy_version 27740 (0.0010) +[2023-10-08 12:52:51,360][102898] Updated weights for policy 1, policy_version 27750 (0.0009) +[2023-10-08 12:52:51,743][102898] Updated weights for policy 1, policy_version 27760 (0.0011) +[2023-10-08 12:52:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 56819712. Throughput: 0: 1794.5, 1: 1778.5. Samples: 14211116. Policy #0 lag: (min: 20.0, avg: 27.5, max: 52.0) +[2023-10-08 12:52:51,875][101941] Avg episode reward: [(0, '6.270'), (1, '6.420')] +[2023-10-08 12:52:52,107][102898] Updated weights for policy 1, policy_version 27770 (0.0009) +[2023-10-08 12:52:54,376][102897] Updated weights for policy 0, policy_version 27750 (0.0009) +[2023-10-08 12:52:54,756][102897] Updated weights for policy 0, policy_version 27760 (0.0007) +[2023-10-08 12:52:55,135][102897] Updated weights for policy 0, policy_version 27770 (0.0007) +[2023-10-08 12:52:55,963][102898] Updated weights for policy 1, policy_version 27780 (0.0010) +[2023-10-08 12:52:56,334][102898] Updated weights for policy 1, policy_version 27790 (0.0010) +[2023-10-08 12:52:56,695][102898] Updated weights for policy 1, policy_version 27800 (0.0008) +[2023-10-08 12:52:56,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 56885248. Throughput: 0: 1783.7, 1: 1803.0. Samples: 14231948. Policy #0 lag: (min: 20.0, avg: 27.5, max: 52.0) +[2023-10-08 12:52:56,876][101941] Avg episode reward: [(0, '6.310'), (1, '6.360')] +[2023-10-08 12:52:59,086][102897] Updated weights for policy 0, policy_version 27780 (0.0008) +[2023-10-08 12:52:59,469][102897] Updated weights for policy 0, policy_version 27790 (0.0010) +[2023-10-08 12:52:59,844][102897] Updated weights for policy 0, policy_version 27800 (0.0008) +[2023-10-08 12:53:00,515][102898] Updated weights for policy 1, policy_version 27810 (0.0008) +[2023-10-08 12:53:00,887][102898] Updated weights for policy 1, policy_version 27820 (0.0009) +[2023-10-08 12:53:01,259][102898] Updated weights for policy 1, policy_version 27830 (0.0010) +[2023-10-08 12:53:01,621][102898] Updated weights for policy 1, policy_version 27840 (0.0008) +[2023-10-08 12:53:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 56983552. Throughput: 0: 1774.5, 1: 1782.0. Samples: 14252780. Policy #0 lag: (min: 20.0, avg: 27.5, max: 52.0) +[2023-10-08 12:53:01,876][101941] Avg episode reward: [(0, '5.840'), (1, '7.680')] +[2023-10-08 12:53:03,693][102897] Updated weights for policy 0, policy_version 27810 (0.0010) +[2023-10-08 12:53:04,061][102897] Updated weights for policy 0, policy_version 27820 (0.0007) +[2023-10-08 12:53:04,431][102897] Updated weights for policy 0, policy_version 27830 (0.0007) +[2023-10-08 12:53:04,805][102897] Updated weights for policy 0, policy_version 27840 (0.0007) +[2023-10-08 12:53:05,322][102898] Updated weights for policy 1, policy_version 27850 (0.0010) +[2023-10-08 12:53:05,692][102898] Updated weights for policy 1, policy_version 27860 (0.0009) +[2023-10-08 12:53:06,074][102898] Updated weights for policy 1, policy_version 27870 (0.0009) +[2023-10-08 12:53:06,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 57049088. Throughput: 0: 1783.7, 1: 1797.3. Samples: 14264266. Policy #0 lag: (min: 4.0, avg: 4.2, max: 14.0) +[2023-10-08 12:53:06,876][101941] Avg episode reward: [(0, '5.660'), (1, '7.970')] +[2023-10-08 12:53:08,438][102897] Updated weights for policy 0, policy_version 27850 (0.0008) +[2023-10-08 12:53:08,806][102897] Updated weights for policy 0, policy_version 27860 (0.0008) +[2023-10-08 12:53:09,173][102897] Updated weights for policy 0, policy_version 27870 (0.0008) +[2023-10-08 12:53:09,704][102898] Updated weights for policy 1, policy_version 27880 (0.0008) +[2023-10-08 12:53:10,069][102898] Updated weights for policy 1, policy_version 27890 (0.0007) +[2023-10-08 12:53:10,432][102898] Updated weights for policy 1, policy_version 27900 (0.0009) +[2023-10-08 12:53:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 57114624. Throughput: 0: 1785.3, 1: 1780.8. Samples: 14285222. Policy #0 lag: (min: 4.0, avg: 4.2, max: 14.0) +[2023-10-08 12:53:11,876][101941] Avg episode reward: [(0, '6.360'), (1, '8.120')] +[2023-10-08 12:53:11,878][102760] Saving new best policy, reward=8.120! +[2023-10-08 12:53:12,863][102897] Updated weights for policy 0, policy_version 27880 (0.0010) +[2023-10-08 12:53:13,242][102897] Updated weights for policy 0, policy_version 27890 (0.0010) +[2023-10-08 12:53:13,623][102897] Updated weights for policy 0, policy_version 27900 (0.0009) +[2023-10-08 12:53:14,091][102898] Updated weights for policy 1, policy_version 27910 (0.0007) +[2023-10-08 12:53:14,456][102898] Updated weights for policy 1, policy_version 27920 (0.0008) +[2023-10-08 12:53:14,827][102898] Updated weights for policy 1, policy_version 27930 (0.0008) +[2023-10-08 12:53:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 57180160. Throughput: 0: 1784.3, 1: 1773.6. Samples: 14307366. Policy #0 lag: (min: 4.0, avg: 4.2, max: 14.0) +[2023-10-08 12:53:16,876][101941] Avg episode reward: [(0, '6.830'), (1, '7.740')] +[2023-10-08 12:53:17,303][102897] Updated weights for policy 0, policy_version 27910 (0.0007) +[2023-10-08 12:53:17,677][102897] Updated weights for policy 0, policy_version 27920 (0.0010) +[2023-10-08 12:53:18,048][102897] Updated weights for policy 0, policy_version 27930 (0.0007) +[2023-10-08 12:53:18,720][102898] Updated weights for policy 1, policy_version 27940 (0.0010) +[2023-10-08 12:53:19,092][102898] Updated weights for policy 1, policy_version 27950 (0.0008) +[2023-10-08 12:53:19,462][102898] Updated weights for policy 1, policy_version 27960 (0.0008) +[2023-10-08 12:53:21,723][102897] Updated weights for policy 0, policy_version 27940 (0.0008) +[2023-10-08 12:53:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 57245696. Throughput: 0: 1781.7, 1: 1782.8. Samples: 14317458. Policy #0 lag: (min: 4.0, avg: 4.2, max: 14.0) +[2023-10-08 12:53:21,875][101941] Avg episode reward: [(0, '7.190'), (1, '6.830')] +[2023-10-08 12:53:22,090][102897] Updated weights for policy 0, policy_version 27950 (0.0007) +[2023-10-08 12:53:22,459][102897] Updated weights for policy 0, policy_version 27960 (0.0007) +[2023-10-08 12:53:23,181][102898] Updated weights for policy 1, policy_version 27970 (0.0008) +[2023-10-08 12:53:23,549][102898] Updated weights for policy 1, policy_version 27980 (0.0007) +[2023-10-08 12:53:23,922][102898] Updated weights for policy 1, policy_version 27990 (0.0008) +[2023-10-08 12:53:24,287][102898] Updated weights for policy 1, policy_version 28000 (0.0009) +[2023-10-08 12:53:26,226][102897] Updated weights for policy 0, policy_version 27970 (0.0007) +[2023-10-08 12:53:26,608][102897] Updated weights for policy 0, policy_version 27980 (0.0009) +[2023-10-08 12:53:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 57311232. Throughput: 0: 1778.7, 1: 1778.6. Samples: 14339416. Policy #0 lag: (min: 4.0, avg: 4.2, max: 14.0) +[2023-10-08 12:53:26,875][101941] Avg episode reward: [(0, '7.290'), (1, '6.710')] +[2023-10-08 12:53:26,966][102897] Updated weights for policy 0, policy_version 27990 (0.0007) +[2023-10-08 12:53:27,337][102897] Updated weights for policy 0, policy_version 28000 (0.0008) +[2023-10-08 12:53:27,856][102898] Updated weights for policy 1, policy_version 28010 (0.0010) +[2023-10-08 12:53:28,221][102898] Updated weights for policy 1, policy_version 28020 (0.0011) +[2023-10-08 12:53:28,585][102898] Updated weights for policy 1, policy_version 28030 (0.0009) +[2023-10-08 12:53:30,999][102897] Updated weights for policy 0, policy_version 28010 (0.0008) +[2023-10-08 12:53:31,372][102897] Updated weights for policy 0, policy_version 28020 (0.0007) +[2023-10-08 12:53:31,753][102897] Updated weights for policy 0, policy_version 28030 (0.0008) +[2023-10-08 12:53:31,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 57409536. Throughput: 0: 1801.5, 1: 1778.1. Samples: 14361202. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 12:53:31,876][101941] Avg episode reward: [(0, '7.570'), (1, '6.940')] +[2023-10-08 12:53:31,886][102634] Saving new best policy, reward=7.570! +[2023-10-08 12:53:32,469][102898] Updated weights for policy 1, policy_version 28040 (0.0010) +[2023-10-08 12:53:32,833][102898] Updated weights for policy 1, policy_version 28050 (0.0007) +[2023-10-08 12:53:33,203][102898] Updated weights for policy 1, policy_version 28060 (0.0007) +[2023-10-08 12:53:35,725][102897] Updated weights for policy 0, policy_version 28040 (0.0009) +[2023-10-08 12:53:36,110][102897] Updated weights for policy 0, policy_version 28050 (0.0010) +[2023-10-08 12:53:36,488][102897] Updated weights for policy 0, policy_version 28060 (0.0009) +[2023-10-08 12:53:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 57475072. Throughput: 0: 1790.6, 1: 1781.5. Samples: 14371860. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 12:53:36,876][101941] Avg episode reward: [(0, '7.500'), (1, '7.080')] +[2023-10-08 12:53:37,093][102898] Updated weights for policy 1, policy_version 28070 (0.0008) +[2023-10-08 12:53:37,461][102898] Updated weights for policy 1, policy_version 28080 (0.0009) +[2023-10-08 12:53:37,826][102898] Updated weights for policy 1, policy_version 28090 (0.0011) +[2023-10-08 12:53:40,174][102897] Updated weights for policy 0, policy_version 28070 (0.0007) +[2023-10-08 12:53:40,548][102897] Updated weights for policy 0, policy_version 28080 (0.0007) +[2023-10-08 12:53:40,918][102897] Updated weights for policy 0, policy_version 28090 (0.0008) +[2023-10-08 12:53:41,617][102898] Updated weights for policy 1, policy_version 28100 (0.0010) +[2023-10-08 12:53:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 57540608. Throughput: 0: 1810.4, 1: 1781.2. Samples: 14393568. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 12:53:41,875][101941] Avg episode reward: [(0, '7.140'), (1, '7.340')] +[2023-10-08 12:53:41,985][102898] Updated weights for policy 1, policy_version 28110 (0.0010) +[2023-10-08 12:53:42,355][102898] Updated weights for policy 1, policy_version 28120 (0.0008) +[2023-10-08 12:53:44,725][102897] Updated weights for policy 0, policy_version 28100 (0.0009) +[2023-10-08 12:53:45,094][102897] Updated weights for policy 0, policy_version 28110 (0.0010) +[2023-10-08 12:53:45,471][102897] Updated weights for policy 0, policy_version 28120 (0.0008) +[2023-10-08 12:53:46,042][102898] Updated weights for policy 1, policy_version 28130 (0.0009) +[2023-10-08 12:53:46,415][102898] Updated weights for policy 1, policy_version 28140 (0.0007) +[2023-10-08 12:53:46,783][102898] Updated weights for policy 1, policy_version 28150 (0.0009) +[2023-10-08 12:53:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 57606144. Throughput: 0: 1802.1, 1: 1800.0. Samples: 14414876. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:53:46,875][101941] Avg episode reward: [(0, '6.940'), (1, '7.550')] +[2023-10-08 12:53:47,151][102898] Updated weights for policy 1, policy_version 28160 (0.0010) +[2023-10-08 12:53:49,136][102897] Updated weights for policy 0, policy_version 28130 (0.0008) +[2023-10-08 12:53:49,509][102897] Updated weights for policy 0, policy_version 28140 (0.0010) +[2023-10-08 12:53:49,877][102897] Updated weights for policy 0, policy_version 28150 (0.0009) +[2023-10-08 12:53:50,245][102897] Updated weights for policy 0, policy_version 28160 (0.0010) +[2023-10-08 12:53:51,009][102898] Updated weights for policy 1, policy_version 28170 (0.0009) +[2023-10-08 12:53:51,376][102898] Updated weights for policy 1, policy_version 28180 (0.0007) +[2023-10-08 12:53:51,743][102898] Updated weights for policy 1, policy_version 28190 (0.0009) +[2023-10-08 12:53:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 57704448. Throughput: 0: 1814.0, 1: 1781.4. Samples: 14426062. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:53:51,876][101941] Avg episode reward: [(0, '6.610'), (1, '7.700')] +[2023-10-08 12:53:54,122][102897] Updated weights for policy 0, policy_version 28170 (0.0007) +[2023-10-08 12:53:54,492][102897] Updated weights for policy 0, policy_version 28180 (0.0008) +[2023-10-08 12:53:54,864][102897] Updated weights for policy 0, policy_version 28190 (0.0007) +[2023-10-08 12:53:55,518][102898] Updated weights for policy 1, policy_version 28200 (0.0009) +[2023-10-08 12:53:55,889][102898] Updated weights for policy 1, policy_version 28210 (0.0008) +[2023-10-08 12:53:56,253][102898] Updated weights for policy 1, policy_version 28220 (0.0008) +[2023-10-08 12:53:56,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 57769984. Throughput: 0: 1794.0, 1: 1803.3. Samples: 14447102. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:53:56,876][101941] Avg episode reward: [(0, '6.760'), (1, '7.060')] +[2023-10-08 12:53:58,539][102897] Updated weights for policy 0, policy_version 28200 (0.0007) +[2023-10-08 12:53:58,911][102897] Updated weights for policy 0, policy_version 28210 (0.0010) +[2023-10-08 12:53:59,280][102897] Updated weights for policy 0, policy_version 28220 (0.0009) +[2023-10-08 12:54:00,037][102898] Updated weights for policy 1, policy_version 28230 (0.0009) +[2023-10-08 12:54:00,407][102898] Updated weights for policy 1, policy_version 28240 (0.0009) +[2023-10-08 12:54:00,780][102898] Updated weights for policy 1, policy_version 28250 (0.0010) +[2023-10-08 12:54:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 57835520. Throughput: 0: 1792.4, 1: 1786.4. Samples: 14468412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:01,876][101941] Avg episode reward: [(0, '6.590'), (1, '6.740')] +[2023-10-08 12:54:03,185][102897] Updated weights for policy 0, policy_version 28230 (0.0008) +[2023-10-08 12:54:03,558][102897] Updated weights for policy 0, policy_version 28240 (0.0007) +[2023-10-08 12:54:03,928][102897] Updated weights for policy 0, policy_version 28250 (0.0008) +[2023-10-08 12:54:04,480][102898] Updated weights for policy 1, policy_version 28260 (0.0007) +[2023-10-08 12:54:04,848][102898] Updated weights for policy 1, policy_version 28270 (0.0010) +[2023-10-08 12:54:05,220][102898] Updated weights for policy 1, policy_version 28280 (0.0009) +[2023-10-08 12:54:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 57901056. Throughput: 0: 1790.0, 1: 1807.7. Samples: 14479356. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:06,875][101941] Avg episode reward: [(0, '7.410'), (1, '7.070')] +[2023-10-08 12:54:07,538][102897] Updated weights for policy 0, policy_version 28260 (0.0008) +[2023-10-08 12:54:07,911][102897] Updated weights for policy 0, policy_version 28270 (0.0007) +[2023-10-08 12:54:08,278][102897] Updated weights for policy 0, policy_version 28280 (0.0007) +[2023-10-08 12:54:09,134][102898] Updated weights for policy 1, policy_version 28290 (0.0008) +[2023-10-08 12:54:09,505][102898] Updated weights for policy 1, policy_version 28300 (0.0007) +[2023-10-08 12:54:09,865][102898] Updated weights for policy 1, policy_version 28310 (0.0008) +[2023-10-08 12:54:10,232][102898] Updated weights for policy 1, policy_version 28320 (0.0008) +[2023-10-08 12:54:11,862][102897] Updated weights for policy 0, policy_version 28290 (0.0008) +[2023-10-08 12:54:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 57966592. Throughput: 0: 1800.6, 1: 1787.2. Samples: 14500870. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:54:11,876][101941] Avg episode reward: [(0, '7.250'), (1, '7.230')] +[2023-10-08 12:54:12,240][102897] Updated weights for policy 0, policy_version 28300 (0.0008) +[2023-10-08 12:54:12,611][102897] Updated weights for policy 0, policy_version 28310 (0.0008) +[2023-10-08 12:54:12,984][102897] Updated weights for policy 0, policy_version 28320 (0.0008) +[2023-10-08 12:54:14,027][102898] Updated weights for policy 1, policy_version 28330 (0.0007) +[2023-10-08 12:54:14,385][102898] Updated weights for policy 1, policy_version 28340 (0.0007) +[2023-10-08 12:54:14,751][102898] Updated weights for policy 1, policy_version 28350 (0.0007) +[2023-10-08 12:54:16,732][102897] Updated weights for policy 0, policy_version 28330 (0.0007) +[2023-10-08 12:54:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 58032128. Throughput: 0: 1810.5, 1: 1783.3. Samples: 14522924. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:54:16,876][101941] Avg episode reward: [(0, '7.100'), (1, '6.580')] +[2023-10-08 12:54:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000028352_29032448.pth... +[2023-10-08 12:54:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000026688_27328512.pth +[2023-10-08 12:54:17,097][102897] Updated weights for policy 0, policy_version 28340 (0.0007) +[2023-10-08 12:54:17,473][102897] Updated weights for policy 0, policy_version 28350 (0.0007) +[2023-10-08 12:54:17,543][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000028352_29032448.pth... +[2023-10-08 12:54:17,582][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000026656_27295744.pth +[2023-10-08 12:54:18,343][102898] Updated weights for policy 1, policy_version 28360 (0.0009) +[2023-10-08 12:54:18,709][102898] Updated weights for policy 1, policy_version 28370 (0.0007) +[2023-10-08 12:54:19,072][102898] Updated weights for policy 1, policy_version 28380 (0.0008) +[2023-10-08 12:54:21,432][102897] Updated weights for policy 0, policy_version 28360 (0.0007) +[2023-10-08 12:54:21,810][102897] Updated weights for policy 0, policy_version 28370 (0.0008) +[2023-10-08 12:54:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 58097664. Throughput: 0: 1791.3, 1: 1787.9. Samples: 14532924. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:54:21,876][101941] Avg episode reward: [(0, '6.740'), (1, '6.660')] +[2023-10-08 12:54:22,175][102897] Updated weights for policy 0, policy_version 28380 (0.0009) +[2023-10-08 12:54:22,683][102898] Updated weights for policy 1, policy_version 28390 (0.0007) +[2023-10-08 12:54:23,053][102898] Updated weights for policy 1, policy_version 28400 (0.0007) +[2023-10-08 12:54:23,417][102898] Updated weights for policy 1, policy_version 28410 (0.0007) +[2023-10-08 12:54:26,033][102897] Updated weights for policy 0, policy_version 28390 (0.0009) +[2023-10-08 12:54:26,401][102897] Updated weights for policy 0, policy_version 28400 (0.0011) +[2023-10-08 12:54:26,769][102897] Updated weights for policy 0, policy_version 28410 (0.0009) +[2023-10-08 12:54:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 58163200. Throughput: 0: 1797.6, 1: 1793.3. Samples: 14555162. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 12:54:26,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.040')] +[2023-10-08 12:54:27,165][102898] Updated weights for policy 1, policy_version 28420 (0.0008) +[2023-10-08 12:54:27,555][102898] Updated weights for policy 1, policy_version 28430 (0.0010) +[2023-10-08 12:54:27,922][102898] Updated weights for policy 1, policy_version 28440 (0.0007) +[2023-10-08 12:54:30,669][102897] Updated weights for policy 0, policy_version 28420 (0.0007) +[2023-10-08 12:54:31,042][102897] Updated weights for policy 0, policy_version 28430 (0.0009) +[2023-10-08 12:54:31,423][102897] Updated weights for policy 0, policy_version 28440 (0.0008) +[2023-10-08 12:54:31,607][102898] Updated weights for policy 1, policy_version 28450 (0.0008) +[2023-10-08 12:54:31,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 58261504. Throughput: 0: 1784.9, 1: 1800.4. Samples: 14576216. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:31,875][101941] Avg episode reward: [(0, '6.180'), (1, '6.900')] +[2023-10-08 12:54:31,979][102898] Updated weights for policy 1, policy_version 28460 (0.0009) +[2023-10-08 12:54:32,346][102898] Updated weights for policy 1, policy_version 28470 (0.0007) +[2023-10-08 12:54:32,707][102898] Updated weights for policy 1, policy_version 28480 (0.0008) +[2023-10-08 12:54:35,111][102897] Updated weights for policy 0, policy_version 28450 (0.0010) +[2023-10-08 12:54:35,481][102897] Updated weights for policy 0, policy_version 28460 (0.0010) +[2023-10-08 12:54:35,851][102897] Updated weights for policy 0, policy_version 28470 (0.0009) +[2023-10-08 12:54:36,224][102897] Updated weights for policy 0, policy_version 28480 (0.0008) +[2023-10-08 12:54:36,632][102898] Updated weights for policy 1, policy_version 28490 (0.0007) +[2023-10-08 12:54:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 58327040. Throughput: 0: 1787.5, 1: 1788.5. Samples: 14586980. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:36,876][101941] Avg episode reward: [(0, '6.990'), (1, '6.350')] +[2023-10-08 12:54:36,995][102898] Updated weights for policy 1, policy_version 28500 (0.0007) +[2023-10-08 12:54:37,352][102898] Updated weights for policy 1, policy_version 28510 (0.0007) +[2023-10-08 12:54:39,978][102897] Updated weights for policy 0, policy_version 28490 (0.0007) +[2023-10-08 12:54:40,352][102897] Updated weights for policy 0, policy_version 28500 (0.0008) +[2023-10-08 12:54:40,725][102897] Updated weights for policy 0, policy_version 28510 (0.0008) +[2023-10-08 12:54:41,100][102898] Updated weights for policy 1, policy_version 28520 (0.0007) +[2023-10-08 12:54:41,470][102898] Updated weights for policy 1, policy_version 28530 (0.0007) +[2023-10-08 12:54:41,838][102898] Updated weights for policy 1, policy_version 28540 (0.0009) +[2023-10-08 12:54:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 58392576. Throughput: 0: 1792.9, 1: 1795.7. Samples: 14608590. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:41,875][101941] Avg episode reward: [(0, '7.000'), (1, '6.860')] +[2023-10-08 12:54:44,414][102897] Updated weights for policy 0, policy_version 28520 (0.0008) +[2023-10-08 12:54:44,792][102897] Updated weights for policy 0, policy_version 28530 (0.0007) +[2023-10-08 12:54:45,166][102897] Updated weights for policy 0, policy_version 28540 (0.0007) +[2023-10-08 12:54:45,597][102898] Updated weights for policy 1, policy_version 28550 (0.0010) +[2023-10-08 12:54:45,963][102898] Updated weights for policy 1, policy_version 28560 (0.0010) +[2023-10-08 12:54:46,340][102898] Updated weights for policy 1, policy_version 28570 (0.0007) +[2023-10-08 12:54:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 58490880. Throughput: 0: 1782.4, 1: 1791.6. Samples: 14629242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:46,876][101941] Avg episode reward: [(0, '7.680'), (1, '7.570')] +[2023-10-08 12:54:46,885][102634] Saving new best policy, reward=7.680! +[2023-10-08 12:54:48,897][102897] Updated weights for policy 0, policy_version 28550 (0.0009) +[2023-10-08 12:54:49,267][102897] Updated weights for policy 0, policy_version 28560 (0.0010) +[2023-10-08 12:54:49,637][102897] Updated weights for policy 0, policy_version 28570 (0.0010) +[2023-10-08 12:54:50,232][102898] Updated weights for policy 1, policy_version 28580 (0.0008) +[2023-10-08 12:54:50,602][102898] Updated weights for policy 1, policy_version 28590 (0.0009) +[2023-10-08 12:54:50,959][102898] Updated weights for policy 1, policy_version 28600 (0.0010) +[2023-10-08 12:54:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 58556416. Throughput: 0: 1797.9, 1: 1789.5. Samples: 14640788. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:54:51,876][101941] Avg episode reward: [(0, '6.810'), (1, '7.270')] +[2023-10-08 12:54:53,241][102897] Updated weights for policy 0, policy_version 28580 (0.0009) +[2023-10-08 12:54:53,620][102897] Updated weights for policy 0, policy_version 28590 (0.0008) +[2023-10-08 12:54:53,989][102897] Updated weights for policy 0, policy_version 28600 (0.0008) +[2023-10-08 12:54:54,768][102898] Updated weights for policy 1, policy_version 28610 (0.0009) +[2023-10-08 12:54:55,147][102898] Updated weights for policy 1, policy_version 28620 (0.0008) +[2023-10-08 12:54:55,511][102898] Updated weights for policy 1, policy_version 28630 (0.0009) +[2023-10-08 12:54:55,880][102898] Updated weights for policy 1, policy_version 28640 (0.0009) +[2023-10-08 12:54:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 58621952. Throughput: 0: 1772.3, 1: 1801.8. Samples: 14661706. Policy #0 lag: (min: 17.0, avg: 34.1, max: 49.0) +[2023-10-08 12:54:56,876][101941] Avg episode reward: [(0, '6.980'), (1, '7.200')] +[2023-10-08 12:54:57,764][102897] Updated weights for policy 0, policy_version 28610 (0.0009) +[2023-10-08 12:54:58,130][102897] Updated weights for policy 0, policy_version 28620 (0.0008) +[2023-10-08 12:54:58,506][102897] Updated weights for policy 0, policy_version 28630 (0.0007) +[2023-10-08 12:54:58,877][102897] Updated weights for policy 0, policy_version 28640 (0.0008) +[2023-10-08 12:54:59,594][102898] Updated weights for policy 1, policy_version 28650 (0.0007) +[2023-10-08 12:54:59,964][102898] Updated weights for policy 1, policy_version 28660 (0.0011) +[2023-10-08 12:55:00,339][102898] Updated weights for policy 1, policy_version 28670 (0.0008) +[2023-10-08 12:55:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 58687488. Throughput: 0: 1779.1, 1: 1793.6. Samples: 14683698. Policy #0 lag: (min: 17.0, avg: 34.1, max: 49.0) +[2023-10-08 12:55:01,876][101941] Avg episode reward: [(0, '6.660'), (1, '7.390')] +[2023-10-08 12:55:02,690][102897] Updated weights for policy 0, policy_version 28650 (0.0008) +[2023-10-08 12:55:03,064][102897] Updated weights for policy 0, policy_version 28660 (0.0007) +[2023-10-08 12:55:03,432][102897] Updated weights for policy 0, policy_version 28670 (0.0007) +[2023-10-08 12:55:04,049][102898] Updated weights for policy 1, policy_version 28680 (0.0009) +[2023-10-08 12:55:04,411][102898] Updated weights for policy 1, policy_version 28690 (0.0010) +[2023-10-08 12:55:04,765][102898] Updated weights for policy 1, policy_version 28700 (0.0010) +[2023-10-08 12:55:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 58753024. Throughput: 0: 1777.8, 1: 1802.7. Samples: 14694046. Policy #0 lag: (min: 17.0, avg: 34.1, max: 49.0) +[2023-10-08 12:55:06,875][101941] Avg episode reward: [(0, '6.700'), (1, '6.700')] +[2023-10-08 12:55:07,158][102897] Updated weights for policy 0, policy_version 28680 (0.0007) +[2023-10-08 12:55:07,527][102897] Updated weights for policy 0, policy_version 28690 (0.0009) +[2023-10-08 12:55:07,915][102897] Updated weights for policy 0, policy_version 28700 (0.0009) +[2023-10-08 12:55:08,522][102898] Updated weights for policy 1, policy_version 28710 (0.0009) +[2023-10-08 12:55:08,885][102898] Updated weights for policy 1, policy_version 28720 (0.0007) +[2023-10-08 12:55:09,249][102898] Updated weights for policy 1, policy_version 28730 (0.0010) +[2023-10-08 12:55:11,783][102897] Updated weights for policy 0, policy_version 28710 (0.0010) +[2023-10-08 12:55:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 58818560. Throughput: 0: 1781.7, 1: 1783.7. Samples: 14715604. Policy #0 lag: (min: 17.0, avg: 34.1, max: 49.0) +[2023-10-08 12:55:11,875][101941] Avg episode reward: [(0, '6.560'), (1, '6.220')] +[2023-10-08 12:55:12,158][102897] Updated weights for policy 0, policy_version 28720 (0.0009) +[2023-10-08 12:55:12,522][102897] Updated weights for policy 0, policy_version 28730 (0.0007) +[2023-10-08 12:55:13,124][102898] Updated weights for policy 1, policy_version 28740 (0.0010) +[2023-10-08 12:55:13,518][102898] Updated weights for policy 1, policy_version 28750 (0.0009) +[2023-10-08 12:55:13,876][102898] Updated weights for policy 1, policy_version 28760 (0.0009) +[2023-10-08 12:55:16,217][102897] Updated weights for policy 0, policy_version 28740 (0.0008) +[2023-10-08 12:55:16,591][102897] Updated weights for policy 0, policy_version 28750 (0.0009) +[2023-10-08 12:55:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 58884096. Throughput: 0: 1798.0, 1: 1785.1. Samples: 14737456. Policy #0 lag: (min: 17.0, avg: 34.1, max: 49.0) +[2023-10-08 12:55:16,876][101941] Avg episode reward: [(0, '6.810'), (1, '6.180')] +[2023-10-08 12:55:16,965][102897] Updated weights for policy 0, policy_version 28760 (0.0008) +[2023-10-08 12:55:17,558][102898] Updated weights for policy 1, policy_version 28770 (0.0007) +[2023-10-08 12:55:17,936][102898] Updated weights for policy 1, policy_version 28780 (0.0008) +[2023-10-08 12:55:18,297][102898] Updated weights for policy 1, policy_version 28790 (0.0008) +[2023-10-08 12:55:18,664][102898] Updated weights for policy 1, policy_version 28800 (0.0008) +[2023-10-08 12:55:20,693][102897] Updated weights for policy 0, policy_version 28770 (0.0008) +[2023-10-08 12:55:21,065][102897] Updated weights for policy 0, policy_version 28780 (0.0009) +[2023-10-08 12:55:21,433][102897] Updated weights for policy 0, policy_version 28790 (0.0008) +[2023-10-08 12:55:21,806][102897] Updated weights for policy 0, policy_version 28800 (0.0008) +[2023-10-08 12:55:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 58982400. Throughput: 0: 1782.7, 1: 1788.6. Samples: 14747686. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:55:21,875][101941] Avg episode reward: [(0, '6.460'), (1, '6.810')] +[2023-10-08 12:55:22,462][102898] Updated weights for policy 1, policy_version 28810 (0.0009) +[2023-10-08 12:55:22,823][102898] Updated weights for policy 1, policy_version 28820 (0.0008) +[2023-10-08 12:55:23,186][102898] Updated weights for policy 1, policy_version 28830 (0.0009) +[2023-10-08 12:55:25,726][102897] Updated weights for policy 0, policy_version 28810 (0.0010) +[2023-10-08 12:55:26,095][102897] Updated weights for policy 0, policy_version 28820 (0.0007) +[2023-10-08 12:55:26,458][102897] Updated weights for policy 0, policy_version 28830 (0.0008) +[2023-10-08 12:55:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 59047936. Throughput: 0: 1797.6, 1: 1782.6. Samples: 14769700. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:55:26,876][101941] Avg episode reward: [(0, '6.470'), (1, '7.380')] +[2023-10-08 12:55:26,880][102898] Updated weights for policy 1, policy_version 28840 (0.0009) +[2023-10-08 12:55:27,239][102898] Updated weights for policy 1, policy_version 28850 (0.0007) +[2023-10-08 12:55:27,604][102898] Updated weights for policy 1, policy_version 28860 (0.0007) +[2023-10-08 12:55:30,089][102897] Updated weights for policy 0, policy_version 28840 (0.0009) +[2023-10-08 12:55:30,459][102897] Updated weights for policy 0, policy_version 28850 (0.0007) +[2023-10-08 12:55:30,832][102897] Updated weights for policy 0, policy_version 28860 (0.0008) +[2023-10-08 12:55:31,451][102898] Updated weights for policy 1, policy_version 28870 (0.0009) +[2023-10-08 12:55:31,817][102898] Updated weights for policy 1, policy_version 28880 (0.0010) +[2023-10-08 12:55:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 59113472. Throughput: 0: 1777.5, 1: 1810.8. Samples: 14790716. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:55:31,876][101941] Avg episode reward: [(0, '6.680'), (1, '7.030')] +[2023-10-08 12:55:32,193][102898] Updated weights for policy 1, policy_version 28890 (0.0011) +[2023-10-08 12:55:34,512][102897] Updated weights for policy 0, policy_version 28870 (0.0009) +[2023-10-08 12:55:34,879][102897] Updated weights for policy 0, policy_version 28880 (0.0007) +[2023-10-08 12:55:35,253][102897] Updated weights for policy 0, policy_version 28890 (0.0008) +[2023-10-08 12:55:35,965][102898] Updated weights for policy 1, policy_version 28900 (0.0009) +[2023-10-08 12:55:36,346][102898] Updated weights for policy 1, policy_version 28910 (0.0008) +[2023-10-08 12:55:36,716][102898] Updated weights for policy 1, policy_version 28920 (0.0009) +[2023-10-08 12:55:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 59179008. Throughput: 0: 1797.4, 1: 1791.3. Samples: 14802280. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 12:55:36,876][101941] Avg episode reward: [(0, '6.910'), (1, '6.910')] +[2023-10-08 12:55:38,856][102897] Updated weights for policy 0, policy_version 28900 (0.0010) +[2023-10-08 12:55:39,226][102897] Updated weights for policy 0, policy_version 28910 (0.0009) +[2023-10-08 12:55:39,607][102897] Updated weights for policy 0, policy_version 28920 (0.0008) +[2023-10-08 12:55:40,324][102898] Updated weights for policy 1, policy_version 28930 (0.0009) +[2023-10-08 12:55:40,683][102898] Updated weights for policy 1, policy_version 28940 (0.0009) +[2023-10-08 12:55:41,046][102898] Updated weights for policy 1, policy_version 28950 (0.0010) +[2023-10-08 12:55:41,418][102898] Updated weights for policy 1, policy_version 28960 (0.0009) +[2023-10-08 12:55:41,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 59277312. Throughput: 0: 1787.3, 1: 1800.7. Samples: 14823164. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:55:41,876][101941] Avg episode reward: [(0, '7.350'), (1, '7.220')] +[2023-10-08 12:55:43,314][102897] Updated weights for policy 0, policy_version 28930 (0.0010) +[2023-10-08 12:55:43,677][102897] Updated weights for policy 0, policy_version 28940 (0.0010) +[2023-10-08 12:55:44,044][102897] Updated weights for policy 0, policy_version 28950 (0.0010) +[2023-10-08 12:55:44,431][102897] Updated weights for policy 0, policy_version 28960 (0.0011) +[2023-10-08 12:55:45,112][102898] Updated weights for policy 1, policy_version 28970 (0.0009) +[2023-10-08 12:55:45,475][102898] Updated weights for policy 1, policy_version 28980 (0.0009) +[2023-10-08 12:55:45,843][102898] Updated weights for policy 1, policy_version 28990 (0.0009) +[2023-10-08 12:55:46,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 59342848. Throughput: 0: 1787.8, 1: 1782.6. Samples: 14844366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:55:46,875][101941] Avg episode reward: [(0, '6.620'), (1, '7.170')] +[2023-10-08 12:55:48,295][102897] Updated weights for policy 0, policy_version 28970 (0.0009) +[2023-10-08 12:55:48,671][102897] Updated weights for policy 0, policy_version 28980 (0.0007) +[2023-10-08 12:55:49,041][102897] Updated weights for policy 0, policy_version 28990 (0.0008) +[2023-10-08 12:55:49,709][102898] Updated weights for policy 1, policy_version 29000 (0.0007) +[2023-10-08 12:55:50,077][102898] Updated weights for policy 1, policy_version 29010 (0.0007) +[2023-10-08 12:55:50,449][102898] Updated weights for policy 1, policy_version 29020 (0.0008) +[2023-10-08 12:55:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 59408384. Throughput: 0: 1788.0, 1: 1798.4. Samples: 14855436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:55:51,875][101941] Avg episode reward: [(0, '6.900'), (1, '6.890')] +[2023-10-08 12:55:52,814][102897] Updated weights for policy 0, policy_version 29000 (0.0007) +[2023-10-08 12:55:53,187][102897] Updated weights for policy 0, policy_version 29010 (0.0007) +[2023-10-08 12:55:53,554][102897] Updated weights for policy 0, policy_version 29020 (0.0007) +[2023-10-08 12:55:54,305][102898] Updated weights for policy 1, policy_version 29030 (0.0007) +[2023-10-08 12:55:54,680][102898] Updated weights for policy 1, policy_version 29040 (0.0007) +[2023-10-08 12:55:55,055][102898] Updated weights for policy 1, policy_version 29050 (0.0007) +[2023-10-08 12:55:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 59473920. Throughput: 0: 1789.0, 1: 1779.0. Samples: 14876164. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:55:56,876][101941] Avg episode reward: [(0, '7.280'), (1, '7.160')] +[2023-10-08 12:55:57,494][102897] Updated weights for policy 0, policy_version 29030 (0.0008) +[2023-10-08 12:55:57,875][102897] Updated weights for policy 0, policy_version 29040 (0.0010) +[2023-10-08 12:55:58,252][102897] Updated weights for policy 0, policy_version 29050 (0.0009) +[2023-10-08 12:55:58,852][102898] Updated weights for policy 1, policy_version 29060 (0.0009) +[2023-10-08 12:55:59,244][102898] Updated weights for policy 1, policy_version 29070 (0.0010) +[2023-10-08 12:55:59,603][102898] Updated weights for policy 1, policy_version 29080 (0.0010) +[2023-10-08 12:56:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 59539456. Throughput: 0: 1796.0, 1: 1783.4. Samples: 14898530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:56:01,876][101941] Avg episode reward: [(0, '7.200'), (1, '7.190')] +[2023-10-08 12:56:02,145][102897] Updated weights for policy 0, policy_version 29060 (0.0009) +[2023-10-08 12:56:02,521][102897] Updated weights for policy 0, policy_version 29070 (0.0011) +[2023-10-08 12:56:02,888][102897] Updated weights for policy 0, policy_version 29080 (0.0010) +[2023-10-08 12:56:03,220][102898] Updated weights for policy 1, policy_version 29090 (0.0009) +[2023-10-08 12:56:03,589][102898] Updated weights for policy 1, policy_version 29100 (0.0007) +[2023-10-08 12:56:03,955][102898] Updated weights for policy 1, policy_version 29110 (0.0009) +[2023-10-08 12:56:04,322][102898] Updated weights for policy 1, policy_version 29120 (0.0010) +[2023-10-08 12:56:06,795][102897] Updated weights for policy 0, policy_version 29090 (0.0009) +[2023-10-08 12:56:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 59604992. Throughput: 0: 1786.2, 1: 1783.7. Samples: 14908334. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 12:56:06,875][101941] Avg episode reward: [(0, '7.060'), (1, '6.840')] +[2023-10-08 12:56:07,166][102897] Updated weights for policy 0, policy_version 29100 (0.0009) +[2023-10-08 12:56:07,536][102897] Updated weights for policy 0, policy_version 29110 (0.0007) +[2023-10-08 12:56:07,903][102897] Updated weights for policy 0, policy_version 29120 (0.0008) +[2023-10-08 12:56:08,122][102898] Updated weights for policy 1, policy_version 29130 (0.0009) +[2023-10-08 12:56:08,479][102898] Updated weights for policy 1, policy_version 29140 (0.0008) +[2023-10-08 12:56:08,852][102898] Updated weights for policy 1, policy_version 29150 (0.0010) +[2023-10-08 12:56:11,558][102897] Updated weights for policy 0, policy_version 29130 (0.0007) +[2023-10-08 12:56:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 59670528. Throughput: 0: 1787.7, 1: 1784.4. Samples: 14930444. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 12:56:11,875][101941] Avg episode reward: [(0, '6.860'), (1, '6.660')] +[2023-10-08 12:56:11,943][102897] Updated weights for policy 0, policy_version 29140 (0.0009) +[2023-10-08 12:56:12,315][102897] Updated weights for policy 0, policy_version 29150 (0.0008) +[2023-10-08 12:56:12,675][102898] Updated weights for policy 1, policy_version 29160 (0.0009) +[2023-10-08 12:56:13,050][102898] Updated weights for policy 1, policy_version 29170 (0.0008) +[2023-10-08 12:56:13,412][102898] Updated weights for policy 1, policy_version 29180 (0.0009) +[2023-10-08 12:56:15,922][102897] Updated weights for policy 0, policy_version 29160 (0.0007) +[2023-10-08 12:56:16,306][102897] Updated weights for policy 0, policy_version 29170 (0.0011) +[2023-10-08 12:56:16,674][102897] Updated weights for policy 0, policy_version 29180 (0.0007) +[2023-10-08 12:56:16,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 59768832. Throughput: 0: 1796.3, 1: 1786.8. Samples: 14951954. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 12:56:16,876][101941] Avg episode reward: [(0, '6.710'), (1, '6.110')] +[2023-10-08 12:56:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000029184_29884416.pth... +[2023-10-08 12:56:16,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000027488_28147712.pth +[2023-10-08 12:56:17,150][102898] Updated weights for policy 1, policy_version 29190 (0.0009) +[2023-10-08 12:56:17,516][102898] Updated weights for policy 1, policy_version 29200 (0.0009) +[2023-10-08 12:56:17,880][102898] Updated weights for policy 1, policy_version 29210 (0.0008) +[2023-10-08 12:56:18,100][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000029216_29917184.pth... +[2023-10-08 12:56:18,135][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000027520_28180480.pth +[2023-10-08 12:56:20,643][102897] Updated weights for policy 0, policy_version 29190 (0.0008) +[2023-10-08 12:56:21,014][102897] Updated weights for policy 0, policy_version 29200 (0.0009) +[2023-10-08 12:56:21,382][102897] Updated weights for policy 0, policy_version 29210 (0.0009) +[2023-10-08 12:56:21,819][102898] Updated weights for policy 1, policy_version 29220 (0.0010) +[2023-10-08 12:56:21,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 59834368. Throughput: 0: 1782.3, 1: 1778.2. Samples: 14962500. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 12:56:21,877][101941] Avg episode reward: [(0, '6.970'), (1, '6.840')] +[2023-10-08 12:56:22,182][102898] Updated weights for policy 1, policy_version 29230 (0.0011) +[2023-10-08 12:56:22,554][102898] Updated weights for policy 1, policy_version 29240 (0.0008) +[2023-10-08 12:56:25,100][102897] Updated weights for policy 0, policy_version 29220 (0.0009) +[2023-10-08 12:56:25,480][102897] Updated weights for policy 0, policy_version 29230 (0.0009) +[2023-10-08 12:56:25,849][102897] Updated weights for policy 0, policy_version 29240 (0.0007) +[2023-10-08 12:56:26,305][102898] Updated weights for policy 1, policy_version 29250 (0.0009) +[2023-10-08 12:56:26,671][102898] Updated weights for policy 1, policy_version 29260 (0.0010) +[2023-10-08 12:56:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 59899904. Throughput: 0: 1797.9, 1: 1779.6. Samples: 14984152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:56:26,875][101941] Avg episode reward: [(0, '6.490'), (1, '7.140')] +[2023-10-08 12:56:27,040][102898] Updated weights for policy 1, policy_version 29270 (0.0007) +[2023-10-08 12:56:27,405][102898] Updated weights for policy 1, policy_version 29280 (0.0007) +[2023-10-08 12:56:29,502][102897] Updated weights for policy 0, policy_version 29250 (0.0008) +[2023-10-08 12:56:29,877][102897] Updated weights for policy 0, policy_version 29260 (0.0007) +[2023-10-08 12:56:30,259][102897] Updated weights for policy 0, policy_version 29270 (0.0007) +[2023-10-08 12:56:30,627][102897] Updated weights for policy 0, policy_version 29280 (0.0007) +[2023-10-08 12:56:31,160][102898] Updated weights for policy 1, policy_version 29290 (0.0008) +[2023-10-08 12:56:31,529][102898] Updated weights for policy 1, policy_version 29300 (0.0008) +[2023-10-08 12:56:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 59965440. Throughput: 0: 1777.0, 1: 1793.1. Samples: 15005018. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:56:31,876][101941] Avg episode reward: [(0, '6.810'), (1, '7.270')] +[2023-10-08 12:56:31,898][102898] Updated weights for policy 1, policy_version 29310 (0.0009) +[2023-10-08 12:56:34,404][102897] Updated weights for policy 0, policy_version 29290 (0.0008) +[2023-10-08 12:56:34,772][102897] Updated weights for policy 0, policy_version 29300 (0.0009) +[2023-10-08 12:56:35,142][102897] Updated weights for policy 0, policy_version 29310 (0.0009) +[2023-10-08 12:56:35,699][102898] Updated weights for policy 1, policy_version 29320 (0.0009) +[2023-10-08 12:56:36,083][102898] Updated weights for policy 1, policy_version 29330 (0.0010) +[2023-10-08 12:56:36,448][102898] Updated weights for policy 1, policy_version 29340 (0.0010) +[2023-10-08 12:56:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 60063744. Throughput: 0: 1799.2, 1: 1777.7. Samples: 15016398. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:56:36,876][101941] Avg episode reward: [(0, '6.510'), (1, '7.480')] +[2023-10-08 12:56:38,914][102897] Updated weights for policy 0, policy_version 29320 (0.0009) +[2023-10-08 12:56:39,281][102897] Updated weights for policy 0, policy_version 29330 (0.0008) +[2023-10-08 12:56:39,652][102897] Updated weights for policy 0, policy_version 29340 (0.0009) +[2023-10-08 12:56:40,373][102898] Updated weights for policy 1, policy_version 29350 (0.0010) +[2023-10-08 12:56:40,744][102898] Updated weights for policy 1, policy_version 29360 (0.0009) +[2023-10-08 12:56:41,115][102898] Updated weights for policy 1, policy_version 29370 (0.0009) +[2023-10-08 12:56:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 60129280. Throughput: 0: 1775.4, 1: 1800.8. Samples: 15037096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:56:41,876][101941] Avg episode reward: [(0, '6.470'), (1, '6.830')] +[2023-10-08 12:56:43,593][102897] Updated weights for policy 0, policy_version 29350 (0.0011) +[2023-10-08 12:56:43,983][102897] Updated weights for policy 0, policy_version 29360 (0.0009) +[2023-10-08 12:56:44,360][102897] Updated weights for policy 0, policy_version 29370 (0.0008) +[2023-10-08 12:56:45,010][102898] Updated weights for policy 1, policy_version 29380 (0.0009) +[2023-10-08 12:56:45,391][102898] Updated weights for policy 1, policy_version 29390 (0.0010) +[2023-10-08 12:56:45,766][102898] Updated weights for policy 1, policy_version 29400 (0.0010) +[2023-10-08 12:56:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 60194816. Throughput: 0: 1777.0, 1: 1769.6. Samples: 15058126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:56:46,876][101941] Avg episode reward: [(0, '6.980'), (1, '7.040')] +[2023-10-08 12:56:47,965][102897] Updated weights for policy 0, policy_version 29380 (0.0008) +[2023-10-08 12:56:48,332][102897] Updated weights for policy 0, policy_version 29390 (0.0009) +[2023-10-08 12:56:48,708][102897] Updated weights for policy 0, policy_version 29400 (0.0007) +[2023-10-08 12:56:49,511][102898] Updated weights for policy 1, policy_version 29410 (0.0008) +[2023-10-08 12:56:49,877][102898] Updated weights for policy 1, policy_version 29420 (0.0010) +[2023-10-08 12:56:50,257][102898] Updated weights for policy 1, policy_version 29430 (0.0010) +[2023-10-08 12:56:50,614][102898] Updated weights for policy 1, policy_version 29440 (0.0010) +[2023-10-08 12:56:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 60260352. Throughput: 0: 1778.5, 1: 1799.9. Samples: 15069364. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 12:56:51,876][101941] Avg episode reward: [(0, '7.060'), (1, '6.720')] +[2023-10-08 12:56:52,632][102897] Updated weights for policy 0, policy_version 29410 (0.0010) +[2023-10-08 12:56:52,994][102897] Updated weights for policy 0, policy_version 29420 (0.0008) +[2023-10-08 12:56:53,360][102897] Updated weights for policy 0, policy_version 29430 (0.0007) +[2023-10-08 12:56:53,733][102897] Updated weights for policy 0, policy_version 29440 (0.0007) +[2023-10-08 12:56:54,476][102898] Updated weights for policy 1, policy_version 29450 (0.0008) +[2023-10-08 12:56:54,834][102898] Updated weights for policy 1, policy_version 29460 (0.0007) +[2023-10-08 12:56:55,203][102898] Updated weights for policy 1, policy_version 29470 (0.0009) +[2023-10-08 12:56:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 60325888. Throughput: 0: 1780.7, 1: 1766.1. Samples: 15090052. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 12:56:56,876][101941] Avg episode reward: [(0, '6.250'), (1, '6.570')] +[2023-10-08 12:56:57,518][102897] Updated weights for policy 0, policy_version 29450 (0.0008) +[2023-10-08 12:56:57,891][102897] Updated weights for policy 0, policy_version 29460 (0.0007) +[2023-10-08 12:56:58,262][102897] Updated weights for policy 0, policy_version 29470 (0.0008) +[2023-10-08 12:56:58,713][102898] Updated weights for policy 1, policy_version 29480 (0.0008) +[2023-10-08 12:56:59,083][102898] Updated weights for policy 1, policy_version 29490 (0.0008) +[2023-10-08 12:56:59,450][102898] Updated weights for policy 1, policy_version 29500 (0.0008) +[2023-10-08 12:57:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 60391424. Throughput: 0: 1799.8, 1: 1770.3. Samples: 15112610. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 12:57:01,876][101941] Avg episode reward: [(0, '6.220'), (1, '7.050')] +[2023-10-08 12:57:01,971][102897] Updated weights for policy 0, policy_version 29480 (0.0008) +[2023-10-08 12:57:02,346][102897] Updated weights for policy 0, policy_version 29490 (0.0008) +[2023-10-08 12:57:02,715][102897] Updated weights for policy 0, policy_version 29500 (0.0009) +[2023-10-08 12:57:03,180][102898] Updated weights for policy 1, policy_version 29510 (0.0008) +[2023-10-08 12:57:03,554][102898] Updated weights for policy 1, policy_version 29520 (0.0008) +[2023-10-08 12:57:03,918][102898] Updated weights for policy 1, policy_version 29530 (0.0010) +[2023-10-08 12:57:06,435][102897] Updated weights for policy 0, policy_version 29510 (0.0007) +[2023-10-08 12:57:06,809][102897] Updated weights for policy 0, policy_version 29520 (0.0007) +[2023-10-08 12:57:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 60456960. Throughput: 0: 1782.7, 1: 1770.4. Samples: 15122388. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 12:57:06,876][101941] Avg episode reward: [(0, '6.360'), (1, '7.120')] +[2023-10-08 12:57:07,174][102897] Updated weights for policy 0, policy_version 29530 (0.0007) +[2023-10-08 12:57:07,825][102898] Updated weights for policy 1, policy_version 29540 (0.0009) +[2023-10-08 12:57:08,189][102898] Updated weights for policy 1, policy_version 29550 (0.0009) +[2023-10-08 12:57:08,552][102898] Updated weights for policy 1, policy_version 29560 (0.0009) +[2023-10-08 12:57:10,926][102897] Updated weights for policy 0, policy_version 29540 (0.0008) +[2023-10-08 12:57:11,303][102897] Updated weights for policy 0, policy_version 29550 (0.0009) +[2023-10-08 12:57:11,673][102897] Updated weights for policy 0, policy_version 29560 (0.0008) +[2023-10-08 12:57:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 60522496. Throughput: 0: 1792.2, 1: 1773.0. Samples: 15144584. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 12:57:11,876][101941] Avg episode reward: [(0, '6.790'), (1, '6.340')] +[2023-10-08 12:57:12,295][102898] Updated weights for policy 1, policy_version 29570 (0.0008) +[2023-10-08 12:57:12,673][102898] Updated weights for policy 1, policy_version 29580 (0.0007) +[2023-10-08 12:57:13,035][102898] Updated weights for policy 1, policy_version 29590 (0.0007) +[2023-10-08 12:57:13,401][102898] Updated weights for policy 1, policy_version 29600 (0.0007) +[2023-10-08 12:57:15,459][102897] Updated weights for policy 0, policy_version 29570 (0.0007) +[2023-10-08 12:57:15,832][102897] Updated weights for policy 0, policy_version 29580 (0.0008) +[2023-10-08 12:57:16,210][102897] Updated weights for policy 0, policy_version 29590 (0.0007) +[2023-10-08 12:57:16,580][102897] Updated weights for policy 0, policy_version 29600 (0.0008) +[2023-10-08 12:57:16,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 60620800. Throughput: 0: 1782.8, 1: 1786.8. Samples: 15165650. Policy #0 lag: (min: 31.0, avg: 31.9, max: 51.0) +[2023-10-08 12:57:16,876][101941] Avg episode reward: [(0, '6.330'), (1, '6.350')] +[2023-10-08 12:57:17,139][102898] Updated weights for policy 1, policy_version 29610 (0.0009) +[2023-10-08 12:57:17,506][102898] Updated weights for policy 1, policy_version 29620 (0.0007) +[2023-10-08 12:57:17,874][102898] Updated weights for policy 1, policy_version 29630 (0.0008) +[2023-10-08 12:57:20,265][102897] Updated weights for policy 0, policy_version 29610 (0.0008) +[2023-10-08 12:57:20,632][102897] Updated weights for policy 0, policy_version 29620 (0.0011) +[2023-10-08 12:57:21,008][102897] Updated weights for policy 0, policy_version 29630 (0.0010) +[2023-10-08 12:57:21,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 60686336. Throughput: 0: 1792.3, 1: 1769.5. Samples: 15176676. Policy #0 lag: (min: 31.0, avg: 31.9, max: 51.0) +[2023-10-08 12:57:21,875][101941] Avg episode reward: [(0, '6.160'), (1, '6.680')] +[2023-10-08 12:57:21,926][102898] Updated weights for policy 1, policy_version 29640 (0.0009) +[2023-10-08 12:57:22,294][102898] Updated weights for policy 1, policy_version 29650 (0.0008) +[2023-10-08 12:57:22,655][102898] Updated weights for policy 1, policy_version 29660 (0.0007) +[2023-10-08 12:57:24,821][102897] Updated weights for policy 0, policy_version 29640 (0.0007) +[2023-10-08 12:57:25,189][102897] Updated weights for policy 0, policy_version 29650 (0.0007) +[2023-10-08 12:57:25,563][102897] Updated weights for policy 0, policy_version 29660 (0.0007) +[2023-10-08 12:57:26,303][102898] Updated weights for policy 1, policy_version 29670 (0.0009) +[2023-10-08 12:57:26,671][102898] Updated weights for policy 1, policy_version 29680 (0.0009) +[2023-10-08 12:57:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 60751872. Throughput: 0: 1795.2, 1: 1787.1. Samples: 15198300. Policy #0 lag: (min: 31.0, avg: 31.9, max: 51.0) +[2023-10-08 12:57:26,875][101941] Avg episode reward: [(0, '6.140'), (1, '6.310')] +[2023-10-08 12:57:27,045][102898] Updated weights for policy 1, policy_version 29690 (0.0007) +[2023-10-08 12:57:29,159][102897] Updated weights for policy 0, policy_version 29670 (0.0008) +[2023-10-08 12:57:29,553][102897] Updated weights for policy 0, policy_version 29680 (0.0008) +[2023-10-08 12:57:29,930][102897] Updated weights for policy 0, policy_version 29690 (0.0009) +[2023-10-08 12:57:30,839][102898] Updated weights for policy 1, policy_version 29700 (0.0009) +[2023-10-08 12:57:31,243][102898] Updated weights for policy 1, policy_version 29710 (0.0010) +[2023-10-08 12:57:31,597][102898] Updated weights for policy 1, policy_version 29720 (0.0009) +[2023-10-08 12:57:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 60817408. Throughput: 0: 1789.2, 1: 1793.3. Samples: 15219338. Policy #0 lag: (min: 31.0, avg: 31.9, max: 51.0) +[2023-10-08 12:57:31,876][101941] Avg episode reward: [(0, '5.730'), (1, '6.920')] +[2023-10-08 12:57:33,439][102897] Updated weights for policy 0, policy_version 29700 (0.0008) +[2023-10-08 12:57:33,803][102897] Updated weights for policy 0, policy_version 29710 (0.0010) +[2023-10-08 12:57:34,170][102897] Updated weights for policy 0, policy_version 29720 (0.0010) +[2023-10-08 12:57:35,260][102898] Updated weights for policy 1, policy_version 29730 (0.0010) +[2023-10-08 12:57:35,625][102898] Updated weights for policy 1, policy_version 29740 (0.0011) +[2023-10-08 12:57:35,999][102898] Updated weights for policy 1, policy_version 29750 (0.0010) +[2023-10-08 12:57:36,363][102898] Updated weights for policy 1, policy_version 29760 (0.0010) +[2023-10-08 12:57:36,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 60915712. Throughput: 0: 1791.0, 1: 1783.6. Samples: 15230220. Policy #0 lag: (min: 31.0, avg: 42.2, max: 63.0) +[2023-10-08 12:57:36,876][101941] Avg episode reward: [(0, '6.390'), (1, '6.840')] +[2023-10-08 12:57:38,071][102897] Updated weights for policy 0, policy_version 29730 (0.0009) +[2023-10-08 12:57:38,449][102897] Updated weights for policy 0, policy_version 29740 (0.0009) +[2023-10-08 12:57:38,813][102897] Updated weights for policy 0, policy_version 29750 (0.0009) +[2023-10-08 12:57:39,180][102897] Updated weights for policy 0, policy_version 29760 (0.0010) +[2023-10-08 12:57:40,143][102898] Updated weights for policy 1, policy_version 29770 (0.0010) +[2023-10-08 12:57:40,515][102898] Updated weights for policy 1, policy_version 29780 (0.0007) +[2023-10-08 12:57:40,875][102898] Updated weights for policy 1, policy_version 29790 (0.0008) +[2023-10-08 12:57:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 60981248. Throughput: 0: 1788.4, 1: 1799.7. Samples: 15251518. Policy #0 lag: (min: 31.0, avg: 42.2, max: 63.0) +[2023-10-08 12:57:41,876][101941] Avg episode reward: [(0, '6.590'), (1, '6.960')] +[2023-10-08 12:57:42,925][102897] Updated weights for policy 0, policy_version 29770 (0.0009) +[2023-10-08 12:57:43,308][102897] Updated weights for policy 0, policy_version 29780 (0.0011) +[2023-10-08 12:57:43,670][102897] Updated weights for policy 0, policy_version 29790 (0.0010) +[2023-10-08 12:57:44,502][102898] Updated weights for policy 1, policy_version 29800 (0.0008) +[2023-10-08 12:57:44,865][102898] Updated weights for policy 1, policy_version 29810 (0.0008) +[2023-10-08 12:57:45,235][102898] Updated weights for policy 1, policy_version 29820 (0.0007) +[2023-10-08 12:57:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 61046784. Throughput: 0: 1789.0, 1: 1780.4. Samples: 15273234. Policy #0 lag: (min: 31.0, avg: 42.2, max: 63.0) +[2023-10-08 12:57:46,875][101941] Avg episode reward: [(0, '6.660'), (1, '6.680')] +[2023-10-08 12:57:47,451][102897] Updated weights for policy 0, policy_version 29800 (0.0008) +[2023-10-08 12:57:47,824][102897] Updated weights for policy 0, policy_version 29810 (0.0009) +[2023-10-08 12:57:48,195][102897] Updated weights for policy 0, policy_version 29820 (0.0008) +[2023-10-08 12:57:48,942][102898] Updated weights for policy 1, policy_version 29830 (0.0008) +[2023-10-08 12:57:49,313][102898] Updated weights for policy 1, policy_version 29840 (0.0007) +[2023-10-08 12:57:49,673][102898] Updated weights for policy 1, policy_version 29850 (0.0008) +[2023-10-08 12:57:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 61112320. Throughput: 0: 1788.0, 1: 1798.0. Samples: 15283760. Policy #0 lag: (min: 31.0, avg: 42.2, max: 63.0) +[2023-10-08 12:57:51,876][101941] Avg episode reward: [(0, '6.240'), (1, '7.340')] +[2023-10-08 12:57:51,993][102897] Updated weights for policy 0, policy_version 29830 (0.0009) +[2023-10-08 12:57:52,358][102897] Updated weights for policy 0, policy_version 29840 (0.0008) +[2023-10-08 12:57:52,731][102897] Updated weights for policy 0, policy_version 29850 (0.0010) +[2023-10-08 12:57:53,468][102898] Updated weights for policy 1, policy_version 29860 (0.0007) +[2023-10-08 12:57:53,833][102898] Updated weights for policy 1, policy_version 29870 (0.0008) +[2023-10-08 12:57:54,200][102898] Updated weights for policy 1, policy_version 29880 (0.0010) +[2023-10-08 12:57:56,477][102897] Updated weights for policy 0, policy_version 29860 (0.0007) +[2023-10-08 12:57:56,851][102897] Updated weights for policy 0, policy_version 29870 (0.0008) +[2023-10-08 12:57:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 61177856. Throughput: 0: 1789.4, 1: 1784.8. Samples: 15305420. Policy #0 lag: (min: 31.0, avg: 42.2, max: 63.0) +[2023-10-08 12:57:56,875][101941] Avg episode reward: [(0, '5.710'), (1, '7.560')] +[2023-10-08 12:57:57,221][102897] Updated weights for policy 0, policy_version 29880 (0.0009) +[2023-10-08 12:57:57,961][102898] Updated weights for policy 1, policy_version 29890 (0.0010) +[2023-10-08 12:57:58,322][102898] Updated weights for policy 1, policy_version 29900 (0.0010) +[2023-10-08 12:57:58,700][102898] Updated weights for policy 1, policy_version 29910 (0.0011) +[2023-10-08 12:57:59,061][102898] Updated weights for policy 1, policy_version 29920 (0.0010) +[2023-10-08 12:58:01,026][102897] Updated weights for policy 0, policy_version 29890 (0.0007) +[2023-10-08 12:58:01,397][102897] Updated weights for policy 0, policy_version 29900 (0.0007) +[2023-10-08 12:58:01,770][102897] Updated weights for policy 0, policy_version 29910 (0.0007) +[2023-10-08 12:58:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 61243392. Throughput: 0: 1806.6, 1: 1786.7. Samples: 15327348. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:58:01,876][101941] Avg episode reward: [(0, '6.360'), (1, '7.040')] +[2023-10-08 12:58:02,137][102897] Updated weights for policy 0, policy_version 29920 (0.0007) +[2023-10-08 12:58:02,869][102898] Updated weights for policy 1, policy_version 29930 (0.0009) +[2023-10-08 12:58:03,248][102898] Updated weights for policy 1, policy_version 29940 (0.0009) +[2023-10-08 12:58:03,612][102898] Updated weights for policy 1, policy_version 29950 (0.0008) +[2023-10-08 12:58:05,798][102897] Updated weights for policy 0, policy_version 29930 (0.0011) +[2023-10-08 12:58:06,167][102897] Updated weights for policy 0, policy_version 29940 (0.0007) +[2023-10-08 12:58:06,549][102897] Updated weights for policy 0, policy_version 29950 (0.0008) +[2023-10-08 12:58:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 61341696. Throughput: 0: 1788.5, 1: 1790.4. Samples: 15337728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:58:06,876][101941] Avg episode reward: [(0, '6.460'), (1, '6.960')] +[2023-10-08 12:58:07,398][102898] Updated weights for policy 1, policy_version 29960 (0.0007) +[2023-10-08 12:58:07,766][102898] Updated weights for policy 1, policy_version 29970 (0.0008) +[2023-10-08 12:58:08,130][102898] Updated weights for policy 1, policy_version 29980 (0.0007) +[2023-10-08 12:58:10,403][102897] Updated weights for policy 0, policy_version 29960 (0.0008) +[2023-10-08 12:58:10,775][102897] Updated weights for policy 0, policy_version 29970 (0.0009) +[2023-10-08 12:58:11,156][102897] Updated weights for policy 0, policy_version 29980 (0.0009) +[2023-10-08 12:58:11,856][102898] Updated weights for policy 1, policy_version 29990 (0.0008) +[2023-10-08 12:58:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 61407232. Throughput: 0: 1800.3, 1: 1786.9. Samples: 15359728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:58:11,876][101941] Avg episode reward: [(0, '6.640'), (1, '7.170')] +[2023-10-08 12:58:12,229][102898] Updated weights for policy 1, policy_version 30000 (0.0008) +[2023-10-08 12:58:12,603][102898] Updated weights for policy 1, policy_version 30010 (0.0008) +[2023-10-08 12:58:14,983][102897] Updated weights for policy 0, policy_version 29990 (0.0007) +[2023-10-08 12:58:15,351][102897] Updated weights for policy 0, policy_version 30000 (0.0007) +[2023-10-08 12:58:15,725][102897] Updated weights for policy 0, policy_version 30010 (0.0007) +[2023-10-08 12:58:16,422][102898] Updated weights for policy 1, policy_version 30020 (0.0008) +[2023-10-08 12:58:16,825][102898] Updated weights for policy 1, policy_version 30030 (0.0007) +[2023-10-08 12:58:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 61472768. Throughput: 0: 1787.3, 1: 1803.5. Samples: 15380924. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:58:16,876][101941] Avg episode reward: [(0, '7.300'), (1, '6.670')] +[2023-10-08 12:58:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000030016_30736384.pth... +[2023-10-08 12:58:16,924][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000028352_29032448.pth +[2023-10-08 12:58:17,197][102898] Updated weights for policy 1, policy_version 30040 (0.0007) +[2023-10-08 12:58:17,484][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000030048_30769152.pth... +[2023-10-08 12:58:17,513][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000028352_29032448.pth +[2023-10-08 12:58:19,432][102897] Updated weights for policy 0, policy_version 30020 (0.0008) +[2023-10-08 12:58:19,799][102897] Updated weights for policy 0, policy_version 30030 (0.0011) +[2023-10-08 12:58:20,169][102897] Updated weights for policy 0, policy_version 30040 (0.0010) +[2023-10-08 12:58:20,870][102898] Updated weights for policy 1, policy_version 30050 (0.0008) +[2023-10-08 12:58:21,241][102898] Updated weights for policy 1, policy_version 30060 (0.0011) +[2023-10-08 12:58:21,607][102898] Updated weights for policy 1, policy_version 30070 (0.0008) +[2023-10-08 12:58:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 61538304. Throughput: 0: 1812.0, 1: 1786.5. Samples: 15392154. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:58:21,875][101941] Avg episode reward: [(0, '6.880'), (1, '6.810')] +[2023-10-08 12:58:21,977][102898] Updated weights for policy 1, policy_version 30080 (0.0010) +[2023-10-08 12:58:23,986][102897] Updated weights for policy 0, policy_version 30050 (0.0009) +[2023-10-08 12:58:24,351][102897] Updated weights for policy 0, policy_version 30060 (0.0008) +[2023-10-08 12:58:24,726][102897] Updated weights for policy 0, policy_version 30070 (0.0009) +[2023-10-08 12:58:25,095][102897] Updated weights for policy 0, policy_version 30080 (0.0008) +[2023-10-08 12:58:25,700][102898] Updated weights for policy 1, policy_version 30090 (0.0010) +[2023-10-08 12:58:26,071][102898] Updated weights for policy 1, policy_version 30100 (0.0011) +[2023-10-08 12:58:26,432][102898] Updated weights for policy 1, policy_version 30110 (0.0007) +[2023-10-08 12:58:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 61636608. Throughput: 0: 1781.6, 1: 1804.9. Samples: 15412908. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:58:26,876][101941] Avg episode reward: [(0, '6.460'), (1, '7.340')] +[2023-10-08 12:58:28,705][102897] Updated weights for policy 0, policy_version 30090 (0.0008) +[2023-10-08 12:58:29,076][102897] Updated weights for policy 0, policy_version 30100 (0.0007) +[2023-10-08 12:58:29,453][102897] Updated weights for policy 0, policy_version 30110 (0.0009) +[2023-10-08 12:58:30,180][102898] Updated weights for policy 1, policy_version 30120 (0.0008) +[2023-10-08 12:58:30,547][102898] Updated weights for policy 1, policy_version 30130 (0.0008) +[2023-10-08 12:58:30,916][102898] Updated weights for policy 1, policy_version 30140 (0.0009) +[2023-10-08 12:58:31,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 61702144. Throughput: 0: 1784.2, 1: 1791.9. Samples: 15434156. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:58:31,876][101941] Avg episode reward: [(0, '6.210'), (1, '7.010')] +[2023-10-08 12:58:33,350][102897] Updated weights for policy 0, policy_version 30120 (0.0008) +[2023-10-08 12:58:33,715][102897] Updated weights for policy 0, policy_version 30130 (0.0007) +[2023-10-08 12:58:34,093][102897] Updated weights for policy 0, policy_version 30140 (0.0007) +[2023-10-08 12:58:34,715][102898] Updated weights for policy 1, policy_version 30150 (0.0008) +[2023-10-08 12:58:35,073][102898] Updated weights for policy 1, policy_version 30160 (0.0009) +[2023-10-08 12:58:35,444][102898] Updated weights for policy 1, policy_version 30170 (0.0009) +[2023-10-08 12:58:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 61767680. Throughput: 0: 1780.3, 1: 1811.7. Samples: 15445400. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:58:36,876][101941] Avg episode reward: [(0, '6.470'), (1, '6.210')] +[2023-10-08 12:58:37,672][102897] Updated weights for policy 0, policy_version 30150 (0.0009) +[2023-10-08 12:58:38,031][102897] Updated weights for policy 0, policy_version 30160 (0.0010) +[2023-10-08 12:58:38,406][102897] Updated weights for policy 0, policy_version 30170 (0.0009) +[2023-10-08 12:58:39,009][102898] Updated weights for policy 1, policy_version 30180 (0.0007) +[2023-10-08 12:58:39,372][102898] Updated weights for policy 1, policy_version 30190 (0.0007) +[2023-10-08 12:58:39,740][102898] Updated weights for policy 1, policy_version 30200 (0.0009) +[2023-10-08 12:58:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 61833216. Throughput: 0: 1782.2, 1: 1799.6. Samples: 15466600. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 12:58:41,876][101941] Avg episode reward: [(0, '6.410'), (1, '7.010')] +[2023-10-08 12:58:42,233][102897] Updated weights for policy 0, policy_version 30180 (0.0007) +[2023-10-08 12:58:42,603][102897] Updated weights for policy 0, policy_version 30190 (0.0007) +[2023-10-08 12:58:42,972][102897] Updated weights for policy 0, policy_version 30200 (0.0009) +[2023-10-08 12:58:43,512][102898] Updated weights for policy 1, policy_version 30210 (0.0008) +[2023-10-08 12:58:43,883][102898] Updated weights for policy 1, policy_version 30220 (0.0009) +[2023-10-08 12:58:44,250][102898] Updated weights for policy 1, policy_version 30230 (0.0008) +[2023-10-08 12:58:44,618][102898] Updated weights for policy 1, policy_version 30240 (0.0008) +[2023-10-08 12:58:46,700][102897] Updated weights for policy 0, policy_version 30210 (0.0007) +[2023-10-08 12:58:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 61898752. Throughput: 0: 1790.4, 1: 1800.4. Samples: 15488934. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 12:58:46,876][101941] Avg episode reward: [(0, '6.770'), (1, '6.680')] +[2023-10-08 12:58:47,067][102897] Updated weights for policy 0, policy_version 30220 (0.0007) +[2023-10-08 12:58:47,442][102897] Updated weights for policy 0, policy_version 30230 (0.0007) +[2023-10-08 12:58:47,810][102897] Updated weights for policy 0, policy_version 30240 (0.0008) +[2023-10-08 12:58:48,443][102898] Updated weights for policy 1, policy_version 30250 (0.0009) +[2023-10-08 12:58:48,814][102898] Updated weights for policy 1, policy_version 30260 (0.0008) +[2023-10-08 12:58:49,181][102898] Updated weights for policy 1, policy_version 30270 (0.0008) +[2023-10-08 12:58:51,623][102897] Updated weights for policy 0, policy_version 30250 (0.0009) +[2023-10-08 12:58:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 61964288. Throughput: 0: 1778.7, 1: 1799.5. Samples: 15498746. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 12:58:51,876][101941] Avg episode reward: [(0, '6.670'), (1, '6.870')] +[2023-10-08 12:58:51,995][102897] Updated weights for policy 0, policy_version 30260 (0.0007) +[2023-10-08 12:58:52,359][102897] Updated weights for policy 0, policy_version 30270 (0.0009) +[2023-10-08 12:58:52,852][102898] Updated weights for policy 1, policy_version 30280 (0.0010) +[2023-10-08 12:58:53,226][102898] Updated weights for policy 1, policy_version 30290 (0.0010) +[2023-10-08 12:58:53,587][102898] Updated weights for policy 1, policy_version 30300 (0.0008) +[2023-10-08 12:58:56,259][102897] Updated weights for policy 0, policy_version 30280 (0.0009) +[2023-10-08 12:58:56,635][102897] Updated weights for policy 0, policy_version 30290 (0.0008) +[2023-10-08 12:58:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 62029824. Throughput: 0: 1788.0, 1: 1795.9. Samples: 15521002. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 12:58:56,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.780')] +[2023-10-08 12:58:56,998][102897] Updated weights for policy 0, policy_version 30300 (0.0008) +[2023-10-08 12:58:57,376][102898] Updated weights for policy 1, policy_version 30310 (0.0010) +[2023-10-08 12:58:57,749][102898] Updated weights for policy 1, policy_version 30320 (0.0007) +[2023-10-08 12:58:58,108][102898] Updated weights for policy 1, policy_version 30330 (0.0008) +[2023-10-08 12:59:00,959][102897] Updated weights for policy 0, policy_version 30310 (0.0008) +[2023-10-08 12:59:01,338][102897] Updated weights for policy 0, policy_version 30320 (0.0009) +[2023-10-08 12:59:01,703][102897] Updated weights for policy 0, policy_version 30330 (0.0010) +[2023-10-08 12:59:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 62095360. Throughput: 0: 1789.6, 1: 1800.6. Samples: 15542482. Policy #0 lag: (min: 26.0, avg: 26.0, max: 26.0) +[2023-10-08 12:59:01,876][101941] Avg episode reward: [(0, '6.600'), (1, '7.080')] +[2023-10-08 12:59:02,020][102898] Updated weights for policy 1, policy_version 30340 (0.0007) +[2023-10-08 12:59:02,409][102898] Updated weights for policy 1, policy_version 30350 (0.0008) +[2023-10-08 12:59:02,779][102898] Updated weights for policy 1, policy_version 30360 (0.0008) +[2023-10-08 12:59:05,488][102897] Updated weights for policy 0, policy_version 30340 (0.0009) +[2023-10-08 12:59:05,856][102897] Updated weights for policy 0, policy_version 30350 (0.0010) +[2023-10-08 12:59:06,223][102897] Updated weights for policy 0, policy_version 30360 (0.0008) +[2023-10-08 12:59:06,537][102898] Updated weights for policy 1, policy_version 30370 (0.0008) +[2023-10-08 12:59:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 62193664. Throughput: 0: 1778.8, 1: 1793.8. Samples: 15552922. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:59:06,875][101941] Avg episode reward: [(0, '6.410'), (1, '6.840')] +[2023-10-08 12:59:06,907][102898] Updated weights for policy 1, policy_version 30380 (0.0008) +[2023-10-08 12:59:07,286][102898] Updated weights for policy 1, policy_version 30390 (0.0008) +[2023-10-08 12:59:07,652][102898] Updated weights for policy 1, policy_version 30400 (0.0007) +[2023-10-08 12:59:09,882][102897] Updated weights for policy 0, policy_version 30370 (0.0007) +[2023-10-08 12:59:10,252][102897] Updated weights for policy 0, policy_version 30380 (0.0007) +[2023-10-08 12:59:10,627][102897] Updated weights for policy 0, policy_version 30390 (0.0007) +[2023-10-08 12:59:10,993][102897] Updated weights for policy 0, policy_version 30400 (0.0007) +[2023-10-08 12:59:11,360][102898] Updated weights for policy 1, policy_version 30410 (0.0008) +[2023-10-08 12:59:11,735][102898] Updated weights for policy 1, policy_version 30420 (0.0009) +[2023-10-08 12:59:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 62259200. Throughput: 0: 1795.6, 1: 1797.4. Samples: 15574592. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:59:11,875][101941] Avg episode reward: [(0, '6.700'), (1, '6.700')] +[2023-10-08 12:59:12,092][102898] Updated weights for policy 1, policy_version 30430 (0.0010) +[2023-10-08 12:59:14,874][102897] Updated weights for policy 0, policy_version 30410 (0.0008) +[2023-10-08 12:59:15,244][102897] Updated weights for policy 0, policy_version 30420 (0.0010) +[2023-10-08 12:59:15,614][102897] Updated weights for policy 0, policy_version 30430 (0.0009) +[2023-10-08 12:59:15,943][102898] Updated weights for policy 1, policy_version 30440 (0.0011) +[2023-10-08 12:59:16,309][102898] Updated weights for policy 1, policy_version 30450 (0.0011) +[2023-10-08 12:59:16,686][102898] Updated weights for policy 1, policy_version 30460 (0.0008) +[2023-10-08 12:59:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 62357504. Throughput: 0: 1777.7, 1: 1803.6. Samples: 15595312. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:59:16,876][101941] Avg episode reward: [(0, '6.510'), (1, '6.720')] +[2023-10-08 12:59:19,289][102897] Updated weights for policy 0, policy_version 30440 (0.0007) +[2023-10-08 12:59:19,663][102897] Updated weights for policy 0, policy_version 30450 (0.0007) +[2023-10-08 12:59:20,025][102897] Updated weights for policy 0, policy_version 30460 (0.0008) +[2023-10-08 12:59:20,510][102898] Updated weights for policy 1, policy_version 30470 (0.0009) +[2023-10-08 12:59:20,878][102898] Updated weights for policy 1, policy_version 30480 (0.0011) +[2023-10-08 12:59:21,257][102898] Updated weights for policy 1, policy_version 30490 (0.0010) +[2023-10-08 12:59:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 62423040. Throughput: 0: 1807.8, 1: 1786.9. Samples: 15607162. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:59:21,876][101941] Avg episode reward: [(0, '6.170'), (1, '6.990')] +[2023-10-08 12:59:23,723][102897] Updated weights for policy 0, policy_version 30470 (0.0009) +[2023-10-08 12:59:24,096][102897] Updated weights for policy 0, policy_version 30480 (0.0008) +[2023-10-08 12:59:24,467][102897] Updated weights for policy 0, policy_version 30490 (0.0007) +[2023-10-08 12:59:25,227][102898] Updated weights for policy 1, policy_version 30500 (0.0009) +[2023-10-08 12:59:25,590][102898] Updated weights for policy 1, policy_version 30510 (0.0009) +[2023-10-08 12:59:25,950][102898] Updated weights for policy 1, policy_version 30520 (0.0009) +[2023-10-08 12:59:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 62488576. Throughput: 0: 1786.7, 1: 1799.5. Samples: 15627978. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 12:59:26,875][101941] Avg episode reward: [(0, '6.540'), (1, '6.760')] +[2023-10-08 12:59:28,044][102897] Updated weights for policy 0, policy_version 30500 (0.0008) +[2023-10-08 12:59:28,412][102897] Updated weights for policy 0, policy_version 30510 (0.0007) +[2023-10-08 12:59:28,782][102897] Updated weights for policy 0, policy_version 30520 (0.0010) +[2023-10-08 12:59:29,566][102898] Updated weights for policy 1, policy_version 30530 (0.0007) +[2023-10-08 12:59:29,932][102898] Updated weights for policy 1, policy_version 30540 (0.0008) +[2023-10-08 12:59:30,295][102898] Updated weights for policy 1, policy_version 30550 (0.0007) +[2023-10-08 12:59:30,662][102898] Updated weights for policy 1, policy_version 30560 (0.0008) +[2023-10-08 12:59:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 62554112. Throughput: 0: 1796.4, 1: 1780.4. Samples: 15649892. Policy #0 lag: (min: 44.0, avg: 47.9, max: 48.0) +[2023-10-08 12:59:31,876][101941] Avg episode reward: [(0, '6.690'), (1, '6.960')] +[2023-10-08 12:59:32,572][102897] Updated weights for policy 0, policy_version 30530 (0.0007) +[2023-10-08 12:59:32,940][102897] Updated weights for policy 0, policy_version 30540 (0.0008) +[2023-10-08 12:59:33,318][102897] Updated weights for policy 0, policy_version 30550 (0.0008) +[2023-10-08 12:59:33,681][102897] Updated weights for policy 0, policy_version 30560 (0.0008) +[2023-10-08 12:59:34,320][102898] Updated weights for policy 1, policy_version 30570 (0.0007) +[2023-10-08 12:59:34,684][102898] Updated weights for policy 1, policy_version 30580 (0.0007) +[2023-10-08 12:59:35,054][102898] Updated weights for policy 1, policy_version 30590 (0.0007) +[2023-10-08 12:59:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 62619648. Throughput: 0: 1792.1, 1: 1804.4. Samples: 15660588. Policy #0 lag: (min: 44.0, avg: 47.9, max: 48.0) +[2023-10-08 12:59:36,876][101941] Avg episode reward: [(0, '7.250'), (1, '7.680')] +[2023-10-08 12:59:37,420][102897] Updated weights for policy 0, policy_version 30570 (0.0008) +[2023-10-08 12:59:37,792][102897] Updated weights for policy 0, policy_version 30580 (0.0009) +[2023-10-08 12:59:38,173][102897] Updated weights for policy 0, policy_version 30590 (0.0008) +[2023-10-08 12:59:38,580][102898] Updated weights for policy 1, policy_version 30600 (0.0008) +[2023-10-08 12:59:38,956][102898] Updated weights for policy 1, policy_version 30610 (0.0007) +[2023-10-08 12:59:39,326][102898] Updated weights for policy 1, policy_version 30620 (0.0007) +[2023-10-08 12:59:41,868][102897] Updated weights for policy 0, policy_version 30600 (0.0008) +[2023-10-08 12:59:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 62685184. Throughput: 0: 1795.6, 1: 1791.7. Samples: 15682434. Policy #0 lag: (min: 44.0, avg: 47.9, max: 48.0) +[2023-10-08 12:59:41,876][101941] Avg episode reward: [(0, '6.850'), (1, '7.490')] +[2023-10-08 12:59:42,248][102897] Updated weights for policy 0, policy_version 30610 (0.0010) +[2023-10-08 12:59:42,634][102897] Updated weights for policy 0, policy_version 30620 (0.0010) +[2023-10-08 12:59:43,051][102898] Updated weights for policy 1, policy_version 30630 (0.0008) +[2023-10-08 12:59:43,411][102898] Updated weights for policy 1, policy_version 30640 (0.0007) +[2023-10-08 12:59:43,781][102898] Updated weights for policy 1, policy_version 30650 (0.0008) +[2023-10-08 12:59:46,356][102897] Updated weights for policy 0, policy_version 30630 (0.0009) +[2023-10-08 12:59:46,732][102897] Updated weights for policy 0, policy_version 30640 (0.0009) +[2023-10-08 12:59:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 62750720. Throughput: 0: 1803.7, 1: 1792.3. Samples: 15704302. Policy #0 lag: (min: 44.0, avg: 47.9, max: 48.0) +[2023-10-08 12:59:46,876][101941] Avg episode reward: [(0, '7.050'), (1, '6.940')] +[2023-10-08 12:59:47,110][102897] Updated weights for policy 0, policy_version 30650 (0.0007) +[2023-10-08 12:59:47,485][102898] Updated weights for policy 1, policy_version 30660 (0.0010) +[2023-10-08 12:59:47,863][102898] Updated weights for policy 1, policy_version 30670 (0.0009) +[2023-10-08 12:59:48,225][102898] Updated weights for policy 1, policy_version 30680 (0.0011) +[2023-10-08 12:59:50,934][102897] Updated weights for policy 0, policy_version 30660 (0.0008) +[2023-10-08 12:59:51,307][102897] Updated weights for policy 0, policy_version 30670 (0.0008) +[2023-10-08 12:59:51,678][102897] Updated weights for policy 0, policy_version 30680 (0.0007) +[2023-10-08 12:59:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 62816256. Throughput: 0: 1789.3, 1: 1791.6. Samples: 15714062. Policy #0 lag: (min: 44.0, avg: 47.9, max: 48.0) +[2023-10-08 12:59:51,876][101941] Avg episode reward: [(0, '6.550'), (1, '7.000')] +[2023-10-08 12:59:51,937][102898] Updated weights for policy 1, policy_version 30690 (0.0011) +[2023-10-08 12:59:52,302][102898] Updated weights for policy 1, policy_version 30700 (0.0010) +[2023-10-08 12:59:52,668][102898] Updated weights for policy 1, policy_version 30710 (0.0007) +[2023-10-08 12:59:53,037][102898] Updated weights for policy 1, policy_version 30720 (0.0010) +[2023-10-08 12:59:55,386][102897] Updated weights for policy 0, policy_version 30690 (0.0008) +[2023-10-08 12:59:55,759][102897] Updated weights for policy 0, policy_version 30700 (0.0009) +[2023-10-08 12:59:56,132][102897] Updated weights for policy 0, policy_version 30710 (0.0007) +[2023-10-08 12:59:56,508][102897] Updated weights for policy 0, policy_version 30720 (0.0007) +[2023-10-08 12:59:56,858][102898] Updated weights for policy 1, policy_version 30730 (0.0010) +[2023-10-08 12:59:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 62914560. Throughput: 0: 1803.5, 1: 1786.7. Samples: 15736150. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 12:59:56,876][101941] Avg episode reward: [(0, '6.890'), (1, '7.670')] +[2023-10-08 12:59:57,226][102898] Updated weights for policy 1, policy_version 30740 (0.0008) +[2023-10-08 12:59:57,599][102898] Updated weights for policy 1, policy_version 30750 (0.0008) +[2023-10-08 13:00:00,345][102897] Updated weights for policy 0, policy_version 30730 (0.0008) +[2023-10-08 13:00:00,712][102897] Updated weights for policy 0, policy_version 30740 (0.0008) +[2023-10-08 13:00:01,079][102897] Updated weights for policy 0, policy_version 30750 (0.0009) +[2023-10-08 13:00:01,458][102898] Updated weights for policy 1, policy_version 30760 (0.0007) +[2023-10-08 13:00:01,827][102898] Updated weights for policy 1, policy_version 30770 (0.0008) +[2023-10-08 13:00:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 62980096. Throughput: 0: 1786.4, 1: 1799.8. Samples: 15756692. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 13:00:01,876][101941] Avg episode reward: [(0, '6.870'), (1, '7.190')] +[2023-10-08 13:00:02,197][102898] Updated weights for policy 1, policy_version 30780 (0.0008) +[2023-10-08 13:00:04,931][102897] Updated weights for policy 0, policy_version 30760 (0.0007) +[2023-10-08 13:00:05,305][102897] Updated weights for policy 0, policy_version 30770 (0.0008) +[2023-10-08 13:00:05,665][102897] Updated weights for policy 0, policy_version 30780 (0.0009) +[2023-10-08 13:00:06,082][102898] Updated weights for policy 1, policy_version 30790 (0.0009) +[2023-10-08 13:00:06,440][102898] Updated weights for policy 1, policy_version 30800 (0.0011) +[2023-10-08 13:00:06,814][102898] Updated weights for policy 1, policy_version 30810 (0.0010) +[2023-10-08 13:00:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63045632. Throughput: 0: 1790.8, 1: 1787.1. Samples: 15768166. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 13:00:06,876][101941] Avg episode reward: [(0, '6.800'), (1, '7.030')] +[2023-10-08 13:00:09,330][102897] Updated weights for policy 0, policy_version 30790 (0.0007) +[2023-10-08 13:00:09,696][102897] Updated weights for policy 0, policy_version 30800 (0.0007) +[2023-10-08 13:00:10,077][102897] Updated weights for policy 0, policy_version 30810 (0.0008) +[2023-10-08 13:00:10,528][102898] Updated weights for policy 1, policy_version 30820 (0.0010) +[2023-10-08 13:00:10,902][102898] Updated weights for policy 1, policy_version 30830 (0.0012) +[2023-10-08 13:00:11,260][102898] Updated weights for policy 1, policy_version 30840 (0.0011) +[2023-10-08 13:00:11,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 63143936. Throughput: 0: 1780.3, 1: 1805.4. Samples: 15789334. Policy #0 lag: (min: 31.0, avg: 32.1, max: 53.0) +[2023-10-08 13:00:11,876][101941] Avg episode reward: [(0, '6.720'), (1, '7.300')] +[2023-10-08 13:00:13,904][102897] Updated weights for policy 0, policy_version 30820 (0.0008) +[2023-10-08 13:00:14,265][102897] Updated weights for policy 0, policy_version 30830 (0.0007) +[2023-10-08 13:00:14,642][102897] Updated weights for policy 0, policy_version 30840 (0.0008) +[2023-10-08 13:00:14,816][102898] Updated weights for policy 1, policy_version 30850 (0.0009) +[2023-10-08 13:00:15,191][102898] Updated weights for policy 1, policy_version 30860 (0.0009) +[2023-10-08 13:00:15,563][102898] Updated weights for policy 1, policy_version 30870 (0.0010) +[2023-10-08 13:00:15,923][102898] Updated weights for policy 1, policy_version 30880 (0.0011) +[2023-10-08 13:00:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63209472. Throughput: 0: 1768.9, 1: 1795.2. Samples: 15810276. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:00:16,876][101941] Avg episode reward: [(0, '6.900'), (1, '6.410')] +[2023-10-08 13:00:16,882][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000030880_31621120.pth... +[2023-10-08 13:00:16,882][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000030848_31588352.pth... +[2023-10-08 13:00:16,920][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000029216_29917184.pth +[2023-10-08 13:00:16,930][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000029184_29884416.pth +[2023-10-08 13:00:18,448][102897] Updated weights for policy 0, policy_version 30850 (0.0009) +[2023-10-08 13:00:18,820][102897] Updated weights for policy 0, policy_version 30860 (0.0008) +[2023-10-08 13:00:19,189][102897] Updated weights for policy 0, policy_version 30870 (0.0009) +[2023-10-08 13:00:19,554][102897] Updated weights for policy 0, policy_version 30880 (0.0008) +[2023-10-08 13:00:19,685][102898] Updated weights for policy 1, policy_version 30890 (0.0008) +[2023-10-08 13:00:20,059][102898] Updated weights for policy 1, policy_version 30900 (0.0009) +[2023-10-08 13:00:20,425][102898] Updated weights for policy 1, policy_version 30910 (0.0009) +[2023-10-08 13:00:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63275008. Throughput: 0: 1777.8, 1: 1800.1. Samples: 15821596. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:00:21,875][101941] Avg episode reward: [(0, '7.720'), (1, '6.910')] +[2023-10-08 13:00:21,876][102634] Saving new best policy, reward=7.720! +[2023-10-08 13:00:23,380][102897] Updated weights for policy 0, policy_version 30890 (0.0008) +[2023-10-08 13:00:23,743][102897] Updated weights for policy 0, policy_version 30900 (0.0010) +[2023-10-08 13:00:24,117][102897] Updated weights for policy 0, policy_version 30910 (0.0007) +[2023-10-08 13:00:24,258][102898] Updated weights for policy 1, policy_version 30920 (0.0011) +[2023-10-08 13:00:24,622][102898] Updated weights for policy 1, policy_version 30930 (0.0009) +[2023-10-08 13:00:25,001][102898] Updated weights for policy 1, policy_version 30940 (0.0009) +[2023-10-08 13:00:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63340544. Throughput: 0: 1766.7, 1: 1779.2. Samples: 15842000. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:00:26,876][101941] Avg episode reward: [(0, '6.680'), (1, '7.550')] +[2023-10-08 13:00:27,996][102897] Updated weights for policy 0, policy_version 30920 (0.0007) +[2023-10-08 13:00:28,363][102897] Updated weights for policy 0, policy_version 30930 (0.0009) +[2023-10-08 13:00:28,732][102897] Updated weights for policy 0, policy_version 30940 (0.0008) +[2023-10-08 13:00:28,878][102898] Updated weights for policy 1, policy_version 30950 (0.0008) +[2023-10-08 13:00:29,247][102898] Updated weights for policy 1, policy_version 30960 (0.0010) +[2023-10-08 13:00:29,624][102898] Updated weights for policy 1, policy_version 30970 (0.0008) +[2023-10-08 13:00:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63406080. Throughput: 0: 1776.9, 1: 1777.4. Samples: 15864246. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:00:31,876][101941] Avg episode reward: [(0, '5.580'), (1, '7.110')] +[2023-10-08 13:00:32,478][102897] Updated weights for policy 0, policy_version 30950 (0.0007) +[2023-10-08 13:00:32,860][102897] Updated weights for policy 0, policy_version 30960 (0.0007) +[2023-10-08 13:00:33,226][102897] Updated weights for policy 0, policy_version 30970 (0.0008) +[2023-10-08 13:00:33,514][102898] Updated weights for policy 1, policy_version 30980 (0.0009) +[2023-10-08 13:00:33,897][102898] Updated weights for policy 1, policy_version 30990 (0.0009) +[2023-10-08 13:00:34,264][102898] Updated weights for policy 1, policy_version 31000 (0.0007) +[2023-10-08 13:00:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 63471616. Throughput: 0: 1771.0, 1: 1782.7. Samples: 15873976. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:00:36,876][101941] Avg episode reward: [(0, '5.640'), (1, '6.530')] +[2023-10-08 13:00:36,950][102897] Updated weights for policy 0, policy_version 30980 (0.0008) +[2023-10-08 13:00:37,315][102897] Updated weights for policy 0, policy_version 30990 (0.0007) +[2023-10-08 13:00:37,687][102897] Updated weights for policy 0, policy_version 31000 (0.0007) +[2023-10-08 13:00:37,881][102898] Updated weights for policy 1, policy_version 31010 (0.0007) +[2023-10-08 13:00:38,252][102898] Updated weights for policy 1, policy_version 31020 (0.0008) +[2023-10-08 13:00:38,619][102898] Updated weights for policy 1, policy_version 31030 (0.0007) +[2023-10-08 13:00:38,991][102898] Updated weights for policy 1, policy_version 31040 (0.0008) +[2023-10-08 13:00:41,496][102897] Updated weights for policy 0, policy_version 31010 (0.0008) +[2023-10-08 13:00:41,859][102897] Updated weights for policy 0, policy_version 31020 (0.0007) +[2023-10-08 13:00:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 63537152. Throughput: 0: 1771.7, 1: 1786.0. Samples: 15896244. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:00:41,875][101941] Avg episode reward: [(0, '6.350'), (1, '6.480')] +[2023-10-08 13:00:42,242][102897] Updated weights for policy 0, policy_version 31030 (0.0007) +[2023-10-08 13:00:42,607][102897] Updated weights for policy 0, policy_version 31040 (0.0008) +[2023-10-08 13:00:42,710][102898] Updated weights for policy 1, policy_version 31050 (0.0007) +[2023-10-08 13:00:43,078][102898] Updated weights for policy 1, policy_version 31060 (0.0010) +[2023-10-08 13:00:43,452][102898] Updated weights for policy 1, policy_version 31070 (0.0008) +[2023-10-08 13:00:46,486][102897] Updated weights for policy 0, policy_version 31050 (0.0009) +[2023-10-08 13:00:46,853][102897] Updated weights for policy 0, policy_version 31060 (0.0007) +[2023-10-08 13:00:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 63602688. Throughput: 0: 1799.5, 1: 1793.5. Samples: 15918374. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:00:46,875][101941] Avg episode reward: [(0, '6.690'), (1, '6.900')] +[2023-10-08 13:00:47,221][102897] Updated weights for policy 0, policy_version 31070 (0.0009) +[2023-10-08 13:00:47,261][102898] Updated weights for policy 1, policy_version 31080 (0.0009) +[2023-10-08 13:00:47,623][102898] Updated weights for policy 1, policy_version 31090 (0.0009) +[2023-10-08 13:00:47,993][102898] Updated weights for policy 1, policy_version 31100 (0.0009) +[2023-10-08 13:00:51,051][102897] Updated weights for policy 0, policy_version 31080 (0.0009) +[2023-10-08 13:00:51,431][102897] Updated weights for policy 0, policy_version 31090 (0.0010) +[2023-10-08 13:00:51,792][102897] Updated weights for policy 0, policy_version 31100 (0.0009) +[2023-10-08 13:00:51,835][102898] Updated weights for policy 1, policy_version 31110 (0.0008) +[2023-10-08 13:00:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 63668224. Throughput: 0: 1774.1, 1: 1785.2. Samples: 15928334. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:00:51,875][101941] Avg episode reward: [(0, '6.200'), (1, '7.480')] +[2023-10-08 13:00:52,198][102898] Updated weights for policy 1, policy_version 31120 (0.0007) +[2023-10-08 13:00:52,564][102898] Updated weights for policy 1, policy_version 31130 (0.0009) +[2023-10-08 13:00:55,541][102897] Updated weights for policy 0, policy_version 31110 (0.0008) +[2023-10-08 13:00:55,908][102897] Updated weights for policy 0, policy_version 31120 (0.0008) +[2023-10-08 13:00:56,282][102897] Updated weights for policy 0, policy_version 31130 (0.0009) +[2023-10-08 13:00:56,336][102898] Updated weights for policy 1, policy_version 31140 (0.0009) +[2023-10-08 13:00:56,709][102898] Updated weights for policy 1, policy_version 31150 (0.0008) +[2023-10-08 13:00:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63766528. Throughput: 0: 1801.7, 1: 1785.2. Samples: 15950744. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:00:56,875][101941] Avg episode reward: [(0, '6.660'), (1, '7.030')] +[2023-10-08 13:00:57,079][102898] Updated weights for policy 1, policy_version 31160 (0.0007) +[2023-10-08 13:01:00,056][102897] Updated weights for policy 0, policy_version 31140 (0.0007) +[2023-10-08 13:01:00,414][102897] Updated weights for policy 0, policy_version 31150 (0.0008) +[2023-10-08 13:01:00,799][102897] Updated weights for policy 0, policy_version 31160 (0.0008) +[2023-10-08 13:01:00,899][102898] Updated weights for policy 1, policy_version 31170 (0.0008) +[2023-10-08 13:01:01,264][102898] Updated weights for policy 1, policy_version 31180 (0.0010) +[2023-10-08 13:01:01,636][102898] Updated weights for policy 1, policy_version 31190 (0.0010) +[2023-10-08 13:01:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63832064. Throughput: 0: 1773.3, 1: 1795.3. Samples: 15970858. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:01:01,875][101941] Avg episode reward: [(0, '6.750'), (1, '7.000')] +[2023-10-08 13:01:01,999][102898] Updated weights for policy 1, policy_version 31200 (0.0008) +[2023-10-08 13:01:04,687][102897] Updated weights for policy 0, policy_version 31170 (0.0009) +[2023-10-08 13:01:05,069][102897] Updated weights for policy 0, policy_version 31180 (0.0008) +[2023-10-08 13:01:05,428][102897] Updated weights for policy 0, policy_version 31190 (0.0008) +[2023-10-08 13:01:05,563][102898] Updated weights for policy 1, policy_version 31210 (0.0008) +[2023-10-08 13:01:05,800][102897] Updated weights for policy 0, policy_version 31200 (0.0009) +[2023-10-08 13:01:05,931][102898] Updated weights for policy 1, policy_version 31220 (0.0007) +[2023-10-08 13:01:06,299][102898] Updated weights for policy 1, policy_version 31230 (0.0010) +[2023-10-08 13:01:06,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 63930368. Throughput: 0: 1794.3, 1: 1783.5. Samples: 15982602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:01:06,876][101941] Avg episode reward: [(0, '6.820'), (1, '7.030')] +[2023-10-08 13:01:09,616][102897] Updated weights for policy 0, policy_version 31210 (0.0009) +[2023-10-08 13:01:09,986][102897] Updated weights for policy 0, policy_version 31220 (0.0009) +[2023-10-08 13:01:10,127][102898] Updated weights for policy 1, policy_version 31240 (0.0009) +[2023-10-08 13:01:10,356][102897] Updated weights for policy 0, policy_version 31230 (0.0009) +[2023-10-08 13:01:10,491][102898] Updated weights for policy 1, policy_version 31250 (0.0008) +[2023-10-08 13:01:10,855][102898] Updated weights for policy 1, policy_version 31260 (0.0010) +[2023-10-08 13:01:11,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 63995904. Throughput: 0: 1773.4, 1: 1804.3. Samples: 16002996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:01:11,876][101941] Avg episode reward: [(0, '6.810'), (1, '6.940')] +[2023-10-08 13:01:14,082][102897] Updated weights for policy 0, policy_version 31240 (0.0010) +[2023-10-08 13:01:14,456][102897] Updated weights for policy 0, policy_version 31250 (0.0010) +[2023-10-08 13:01:14,596][102898] Updated weights for policy 1, policy_version 31270 (0.0009) +[2023-10-08 13:01:14,825][102897] Updated weights for policy 0, policy_version 31260 (0.0009) +[2023-10-08 13:01:14,957][102898] Updated weights for policy 1, policy_version 31280 (0.0009) +[2023-10-08 13:01:15,318][102898] Updated weights for policy 1, policy_version 31290 (0.0009) +[2023-10-08 13:01:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 64061440. Throughput: 0: 1771.0, 1: 1789.5. Samples: 16024470. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:01:16,876][101941] Avg episode reward: [(0, '6.820'), (1, '7.170')] +[2023-10-08 13:01:18,466][102897] Updated weights for policy 0, policy_version 31270 (0.0008) +[2023-10-08 13:01:18,832][102897] Updated weights for policy 0, policy_version 31280 (0.0008) +[2023-10-08 13:01:19,198][102897] Updated weights for policy 0, policy_version 31290 (0.0008) +[2023-10-08 13:01:19,231][102898] Updated weights for policy 1, policy_version 31300 (0.0008) +[2023-10-08 13:01:19,626][102898] Updated weights for policy 1, policy_version 31310 (0.0009) +[2023-10-08 13:01:19,986][102898] Updated weights for policy 1, policy_version 31320 (0.0008) +[2023-10-08 13:01:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 64126976. Throughput: 0: 1778.2, 1: 1806.0. Samples: 16035264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:01:21,876][101941] Avg episode reward: [(0, '6.600'), (1, '6.870')] +[2023-10-08 13:01:22,992][102897] Updated weights for policy 0, policy_version 31300 (0.0007) +[2023-10-08 13:01:23,361][102897] Updated weights for policy 0, policy_version 31310 (0.0008) +[2023-10-08 13:01:23,733][102897] Updated weights for policy 0, policy_version 31320 (0.0011) +[2023-10-08 13:01:23,740][102898] Updated weights for policy 1, policy_version 31330 (0.0008) +[2023-10-08 13:01:24,111][102898] Updated weights for policy 1, policy_version 31340 (0.0009) +[2023-10-08 13:01:24,486][102898] Updated weights for policy 1, policy_version 31350 (0.0011) +[2023-10-08 13:01:24,865][102898] Updated weights for policy 1, policy_version 31360 (0.0008) +[2023-10-08 13:01:26,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 64192512. Throughput: 0: 1772.2, 1: 1785.2. Samples: 16056330. Policy #0 lag: (min: 4.0, avg: 28.6, max: 32.0) +[2023-10-08 13:01:26,877][101941] Avg episode reward: [(0, '6.480'), (1, '6.460')] +[2023-10-08 13:01:27,510][102897] Updated weights for policy 0, policy_version 31330 (0.0008) +[2023-10-08 13:01:27,881][102897] Updated weights for policy 0, policy_version 31340 (0.0008) +[2023-10-08 13:01:28,258][102897] Updated weights for policy 0, policy_version 31350 (0.0009) +[2023-10-08 13:01:28,621][102898] Updated weights for policy 1, policy_version 31370 (0.0008) +[2023-10-08 13:01:28,627][102897] Updated weights for policy 0, policy_version 31360 (0.0009) +[2023-10-08 13:01:28,983][102898] Updated weights for policy 1, policy_version 31380 (0.0009) +[2023-10-08 13:01:29,358][102898] Updated weights for policy 1, policy_version 31390 (0.0008) +[2023-10-08 13:01:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 64258048. Throughput: 0: 1776.6, 1: 1789.2. Samples: 16078834. Policy #0 lag: (min: 4.0, avg: 28.6, max: 32.0) +[2023-10-08 13:01:31,876][101941] Avg episode reward: [(0, '6.240'), (1, '7.310')] +[2023-10-08 13:01:32,386][102897] Updated weights for policy 0, policy_version 31370 (0.0009) +[2023-10-08 13:01:32,750][102897] Updated weights for policy 0, policy_version 31380 (0.0007) +[2023-10-08 13:01:33,102][102898] Updated weights for policy 1, policy_version 31400 (0.0007) +[2023-10-08 13:01:33,118][102897] Updated weights for policy 0, policy_version 31390 (0.0007) +[2023-10-08 13:01:33,476][102898] Updated weights for policy 1, policy_version 31410 (0.0009) +[2023-10-08 13:01:33,845][102898] Updated weights for policy 1, policy_version 31420 (0.0008) +[2023-10-08 13:01:36,806][102897] Updated weights for policy 0, policy_version 31400 (0.0009) +[2023-10-08 13:01:36,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 64323584. Throughput: 0: 1771.1, 1: 1788.1. Samples: 16088500. Policy #0 lag: (min: 4.0, avg: 28.6, max: 32.0) +[2023-10-08 13:01:36,875][101941] Avg episode reward: [(0, '6.590'), (1, '7.230')] +[2023-10-08 13:01:37,176][102897] Updated weights for policy 0, policy_version 31410 (0.0008) +[2023-10-08 13:01:37,502][102898] Updated weights for policy 1, policy_version 31430 (0.0008) +[2023-10-08 13:01:37,557][102897] Updated weights for policy 0, policy_version 31420 (0.0008) +[2023-10-08 13:01:37,859][102898] Updated weights for policy 1, policy_version 31440 (0.0007) +[2023-10-08 13:01:38,230][102898] Updated weights for policy 1, policy_version 31450 (0.0007) +[2023-10-08 13:01:41,337][102897] Updated weights for policy 0, policy_version 31430 (0.0010) +[2023-10-08 13:01:41,708][102897] Updated weights for policy 0, policy_version 31440 (0.0008) +[2023-10-08 13:01:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 64389120. Throughput: 0: 1774.8, 1: 1783.5. Samples: 16110868. Policy #0 lag: (min: 4.0, avg: 28.6, max: 32.0) +[2023-10-08 13:01:41,875][101941] Avg episode reward: [(0, '7.220'), (1, '6.930')] +[2023-10-08 13:01:42,023][102898] Updated weights for policy 1, policy_version 31460 (0.0007) +[2023-10-08 13:01:42,077][102897] Updated weights for policy 0, policy_version 31450 (0.0009) +[2023-10-08 13:01:42,387][102898] Updated weights for policy 1, policy_version 31470 (0.0007) +[2023-10-08 13:01:42,752][102898] Updated weights for policy 1, policy_version 31480 (0.0009) +[2023-10-08 13:01:45,909][102897] Updated weights for policy 0, policy_version 31460 (0.0007) +[2023-10-08 13:01:46,284][102897] Updated weights for policy 0, policy_version 31470 (0.0008) +[2023-10-08 13:01:46,593][102898] Updated weights for policy 1, policy_version 31490 (0.0008) +[2023-10-08 13:01:46,652][102897] Updated weights for policy 0, policy_version 31480 (0.0008) +[2023-10-08 13:01:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 64454656. Throughput: 0: 1791.2, 1: 1800.1. Samples: 16132466. Policy #0 lag: (min: 4.0, avg: 28.6, max: 32.0) +[2023-10-08 13:01:46,876][101941] Avg episode reward: [(0, '6.800'), (1, '7.030')] +[2023-10-08 13:01:46,968][102898] Updated weights for policy 1, policy_version 31500 (0.0008) +[2023-10-08 13:01:47,335][102898] Updated weights for policy 1, policy_version 31510 (0.0008) +[2023-10-08 13:01:47,702][102898] Updated weights for policy 1, policy_version 31520 (0.0007) +[2023-10-08 13:01:50,471][102897] Updated weights for policy 0, policy_version 31490 (0.0008) +[2023-10-08 13:01:50,845][102897] Updated weights for policy 0, policy_version 31500 (0.0007) +[2023-10-08 13:01:51,218][102897] Updated weights for policy 0, policy_version 31510 (0.0008) +[2023-10-08 13:01:51,403][102898] Updated weights for policy 1, policy_version 31530 (0.0007) +[2023-10-08 13:01:51,584][102897] Updated weights for policy 0, policy_version 31520 (0.0007) +[2023-10-08 13:01:51,773][102898] Updated weights for policy 1, policy_version 31540 (0.0008) +[2023-10-08 13:01:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 64552960. Throughput: 0: 1780.5, 1: 1781.9. Samples: 16142910. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 13:01:51,876][101941] Avg episode reward: [(0, '6.240'), (1, '7.260')] +[2023-10-08 13:01:52,145][102898] Updated weights for policy 1, policy_version 31550 (0.0008) +[2023-10-08 13:01:55,318][102897] Updated weights for policy 0, policy_version 31530 (0.0008) +[2023-10-08 13:01:55,683][102897] Updated weights for policy 0, policy_version 31540 (0.0010) +[2023-10-08 13:01:55,992][102898] Updated weights for policy 1, policy_version 31560 (0.0008) +[2023-10-08 13:01:56,066][102897] Updated weights for policy 0, policy_version 31550 (0.0010) +[2023-10-08 13:01:56,372][102898] Updated weights for policy 1, policy_version 31570 (0.0008) +[2023-10-08 13:01:56,751][102898] Updated weights for policy 1, policy_version 31580 (0.0010) +[2023-10-08 13:01:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 64618496. Throughput: 0: 1798.6, 1: 1793.9. Samples: 16164660. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 13:01:56,876][101941] Avg episode reward: [(0, '6.100'), (1, '6.770')] +[2023-10-08 13:01:59,834][102897] Updated weights for policy 0, policy_version 31560 (0.0008) +[2023-10-08 13:02:00,204][102897] Updated weights for policy 0, policy_version 31570 (0.0008) +[2023-10-08 13:02:00,537][102898] Updated weights for policy 1, policy_version 31590 (0.0007) +[2023-10-08 13:02:00,566][102897] Updated weights for policy 0, policy_version 31580 (0.0008) +[2023-10-08 13:02:00,898][102898] Updated weights for policy 1, policy_version 31600 (0.0010) +[2023-10-08 13:02:01,275][102898] Updated weights for policy 1, policy_version 31610 (0.0007) +[2023-10-08 13:02:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 64716800. Throughput: 0: 1780.5, 1: 1780.6. Samples: 16184718. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 13:02:01,876][101941] Avg episode reward: [(0, '6.310'), (1, '6.760')] +[2023-10-08 13:02:04,584][102897] Updated weights for policy 0, policy_version 31590 (0.0008) +[2023-10-08 13:02:04,966][102897] Updated weights for policy 0, policy_version 31600 (0.0009) +[2023-10-08 13:02:05,005][102898] Updated weights for policy 1, policy_version 31620 (0.0007) +[2023-10-08 13:02:05,335][102897] Updated weights for policy 0, policy_version 31610 (0.0008) +[2023-10-08 13:02:05,381][102898] Updated weights for policy 1, policy_version 31630 (0.0008) +[2023-10-08 13:02:05,752][102898] Updated weights for policy 1, policy_version 31640 (0.0009) +[2023-10-08 13:02:06,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 64782336. Throughput: 0: 1803.7, 1: 1792.5. Samples: 16197096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 13:02:06,875][101941] Avg episode reward: [(0, '6.740'), (1, '7.130')] +[2023-10-08 13:02:09,135][102897] Updated weights for policy 0, policy_version 31620 (0.0007) +[2023-10-08 13:02:09,492][102898] Updated weights for policy 1, policy_version 31650 (0.0010) +[2023-10-08 13:02:09,516][102897] Updated weights for policy 0, policy_version 31630 (0.0008) +[2023-10-08 13:02:09,854][102898] Updated weights for policy 1, policy_version 31660 (0.0009) +[2023-10-08 13:02:09,879][102897] Updated weights for policy 0, policy_version 31640 (0.0008) +[2023-10-08 13:02:10,218][102898] Updated weights for policy 1, policy_version 31670 (0.0008) +[2023-10-08 13:02:10,590][102898] Updated weights for policy 1, policy_version 31680 (0.0007) +[2023-10-08 13:02:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 64847872. Throughput: 0: 1778.5, 1: 1787.7. Samples: 16216804. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:11,875][101941] Avg episode reward: [(0, '6.210'), (1, '7.680')] +[2023-10-08 13:02:13,544][102897] Updated weights for policy 0, policy_version 31650 (0.0009) +[2023-10-08 13:02:13,910][102897] Updated weights for policy 0, policy_version 31660 (0.0008) +[2023-10-08 13:02:14,289][102897] Updated weights for policy 0, policy_version 31670 (0.0007) +[2023-10-08 13:02:14,446][102898] Updated weights for policy 1, policy_version 31690 (0.0008) +[2023-10-08 13:02:14,655][102897] Updated weights for policy 0, policy_version 31680 (0.0007) +[2023-10-08 13:02:14,810][102898] Updated weights for policy 1, policy_version 31700 (0.0007) +[2023-10-08 13:02:15,173][102898] Updated weights for policy 1, policy_version 31710 (0.0007) +[2023-10-08 13:02:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 64913408. Throughput: 0: 1780.0, 1: 1772.9. Samples: 16238718. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:16,876][101941] Avg episode reward: [(0, '5.610'), (1, '7.020')] +[2023-10-08 13:02:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000031712_32473088.pth... +[2023-10-08 13:02:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000031680_32440320.pth... +[2023-10-08 13:02:16,924][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000030016_30736384.pth +[2023-10-08 13:02:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000030048_30769152.pth +[2023-10-08 13:02:18,416][102897] Updated weights for policy 0, policy_version 31690 (0.0009) +[2023-10-08 13:02:18,787][102897] Updated weights for policy 0, policy_version 31700 (0.0008) +[2023-10-08 13:02:18,943][102898] Updated weights for policy 1, policy_version 31720 (0.0008) +[2023-10-08 13:02:19,163][102897] Updated weights for policy 0, policy_version 31710 (0.0007) +[2023-10-08 13:02:19,307][102898] Updated weights for policy 1, policy_version 31730 (0.0010) +[2023-10-08 13:02:19,677][102898] Updated weights for policy 1, policy_version 31740 (0.0009) +[2023-10-08 13:02:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 64978944. Throughput: 0: 1779.6, 1: 1786.6. Samples: 16248982. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:21,875][101941] Avg episode reward: [(0, '5.830'), (1, '6.450')] +[2023-10-08 13:02:22,949][102897] Updated weights for policy 0, policy_version 31720 (0.0009) +[2023-10-08 13:02:23,338][102897] Updated weights for policy 0, policy_version 31730 (0.0009) +[2023-10-08 13:02:23,476][102898] Updated weights for policy 1, policy_version 31750 (0.0009) +[2023-10-08 13:02:23,706][102897] Updated weights for policy 0, policy_version 31740 (0.0009) +[2023-10-08 13:02:23,833][102898] Updated weights for policy 1, policy_version 31760 (0.0009) +[2023-10-08 13:02:24,201][102898] Updated weights for policy 1, policy_version 31770 (0.0007) +[2023-10-08 13:02:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 65044480. Throughput: 0: 1773.5, 1: 1776.0. Samples: 16270596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:26,876][101941] Avg episode reward: [(0, '6.440'), (1, '7.290')] +[2023-10-08 13:02:27,559][102897] Updated weights for policy 0, policy_version 31750 (0.0008) +[2023-10-08 13:02:27,940][102897] Updated weights for policy 0, policy_version 31760 (0.0007) +[2023-10-08 13:02:27,952][102898] Updated weights for policy 1, policy_version 31780 (0.0009) +[2023-10-08 13:02:28,321][102897] Updated weights for policy 0, policy_version 31770 (0.0008) +[2023-10-08 13:02:28,327][102898] Updated weights for policy 1, policy_version 31790 (0.0010) +[2023-10-08 13:02:28,690][102898] Updated weights for policy 1, policy_version 31800 (0.0007) +[2023-10-08 13:02:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 65110016. Throughput: 0: 1786.4, 1: 1778.9. Samples: 16292904. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:31,876][101941] Avg episode reward: [(0, '7.100'), (1, '7.210')] +[2023-10-08 13:02:31,992][102897] Updated weights for policy 0, policy_version 31780 (0.0007) +[2023-10-08 13:02:32,378][102897] Updated weights for policy 0, policy_version 31790 (0.0007) +[2023-10-08 13:02:32,424][102898] Updated weights for policy 1, policy_version 31810 (0.0007) +[2023-10-08 13:02:32,751][102897] Updated weights for policy 0, policy_version 31800 (0.0007) +[2023-10-08 13:02:32,796][102898] Updated weights for policy 1, policy_version 31820 (0.0007) +[2023-10-08 13:02:33,155][102898] Updated weights for policy 1, policy_version 31830 (0.0007) +[2023-10-08 13:02:33,523][102898] Updated weights for policy 1, policy_version 31840 (0.0009) +[2023-10-08 13:02:36,469][102897] Updated weights for policy 0, policy_version 31810 (0.0007) +[2023-10-08 13:02:36,853][102897] Updated weights for policy 0, policy_version 31820 (0.0009) +[2023-10-08 13:02:36,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 65175552. Throughput: 0: 1770.7, 1: 1777.6. Samples: 16302582. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:36,875][101941] Avg episode reward: [(0, '7.280'), (1, '7.070')] +[2023-10-08 13:02:37,227][102897] Updated weights for policy 0, policy_version 31830 (0.0008) +[2023-10-08 13:02:37,288][102898] Updated weights for policy 1, policy_version 31850 (0.0008) +[2023-10-08 13:02:37,601][102897] Updated weights for policy 0, policy_version 31840 (0.0008) +[2023-10-08 13:02:37,658][102898] Updated weights for policy 1, policy_version 31860 (0.0009) +[2023-10-08 13:02:38,030][102898] Updated weights for policy 1, policy_version 31870 (0.0011) +[2023-10-08 13:02:41,406][102897] Updated weights for policy 0, policy_version 31850 (0.0007) +[2023-10-08 13:02:41,770][102897] Updated weights for policy 0, policy_version 31860 (0.0007) +[2023-10-08 13:02:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 65241088. Throughput: 0: 1781.8, 1: 1774.4. Samples: 16324686. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:41,875][101941] Avg episode reward: [(0, '6.600'), (1, '7.070')] +[2023-10-08 13:02:41,950][102898] Updated weights for policy 1, policy_version 31880 (0.0008) +[2023-10-08 13:02:42,143][102897] Updated weights for policy 0, policy_version 31870 (0.0011) +[2023-10-08 13:02:42,318][102898] Updated weights for policy 1, policy_version 31890 (0.0008) +[2023-10-08 13:02:42,684][102898] Updated weights for policy 1, policy_version 31900 (0.0009) +[2023-10-08 13:02:45,956][102897] Updated weights for policy 0, policy_version 31880 (0.0007) +[2023-10-08 13:02:46,324][102897] Updated weights for policy 0, policy_version 31890 (0.0009) +[2023-10-08 13:02:46,533][102898] Updated weights for policy 1, policy_version 31910 (0.0008) +[2023-10-08 13:02:46,698][102897] Updated weights for policy 0, policy_version 31900 (0.0007) +[2023-10-08 13:02:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 65339392. Throughput: 0: 1782.0, 1: 1800.0. Samples: 16345906. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:46,876][101941] Avg episode reward: [(0, '6.890'), (1, '7.520')] +[2023-10-08 13:02:46,898][102898] Updated weights for policy 1, policy_version 31920 (0.0007) +[2023-10-08 13:02:47,263][102898] Updated weights for policy 1, policy_version 31930 (0.0010) +[2023-10-08 13:02:50,667][102897] Updated weights for policy 0, policy_version 31910 (0.0007) +[2023-10-08 13:02:51,047][102897] Updated weights for policy 0, policy_version 31920 (0.0007) +[2023-10-08 13:02:51,312][102898] Updated weights for policy 1, policy_version 31940 (0.0009) +[2023-10-08 13:02:51,424][102897] Updated weights for policy 0, policy_version 31930 (0.0007) +[2023-10-08 13:02:51,700][102898] Updated weights for policy 1, policy_version 31950 (0.0009) +[2023-10-08 13:02:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 65404928. Throughput: 0: 1770.0, 1: 1769.0. Samples: 16356352. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:02:51,875][101941] Avg episode reward: [(0, '6.910'), (1, '7.030')] +[2023-10-08 13:02:52,078][102898] Updated weights for policy 1, policy_version 31960 (0.0009) +[2023-10-08 13:02:55,084][102897] Updated weights for policy 0, policy_version 31940 (0.0009) +[2023-10-08 13:02:55,461][102897] Updated weights for policy 0, policy_version 31950 (0.0010) +[2023-10-08 13:02:55,613][102898] Updated weights for policy 1, policy_version 31970 (0.0008) +[2023-10-08 13:02:55,822][102897] Updated weights for policy 0, policy_version 31960 (0.0008) +[2023-10-08 13:02:55,972][102898] Updated weights for policy 1, policy_version 31980 (0.0007) +[2023-10-08 13:02:56,348][102898] Updated weights for policy 1, policy_version 31990 (0.0010) +[2023-10-08 13:02:56,720][102898] Updated weights for policy 1, policy_version 32000 (0.0010) +[2023-10-08 13:02:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 65503232. Throughput: 0: 1792.3, 1: 1795.1. Samples: 16378242. Policy #0 lag: (min: 6.0, avg: 13.2, max: 38.0) +[2023-10-08 13:02:56,876][101941] Avg episode reward: [(0, '7.890'), (1, '6.520')] +[2023-10-08 13:02:56,877][102634] Saving new best policy, reward=7.890! +[2023-10-08 13:02:59,442][102897] Updated weights for policy 0, policy_version 31970 (0.0007) +[2023-10-08 13:02:59,813][102897] Updated weights for policy 0, policy_version 31980 (0.0007) +[2023-10-08 13:03:00,178][102897] Updated weights for policy 0, policy_version 31990 (0.0007) +[2023-10-08 13:03:00,547][102897] Updated weights for policy 0, policy_version 32000 (0.0007) +[2023-10-08 13:03:00,617][102898] Updated weights for policy 1, policy_version 32010 (0.0008) +[2023-10-08 13:03:00,988][102898] Updated weights for policy 1, policy_version 32020 (0.0008) +[2023-10-08 13:03:01,351][102898] Updated weights for policy 1, policy_version 32030 (0.0007) +[2023-10-08 13:03:01,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 65568768. Throughput: 0: 1769.6, 1: 1770.8. Samples: 16398032. Policy #0 lag: (min: 6.0, avg: 13.2, max: 38.0) +[2023-10-08 13:03:01,876][101941] Avg episode reward: [(0, '7.430'), (1, '6.850')] +[2023-10-08 13:03:04,319][102897] Updated weights for policy 0, policy_version 32010 (0.0007) +[2023-10-08 13:03:04,690][102897] Updated weights for policy 0, policy_version 32020 (0.0007) +[2023-10-08 13:03:05,057][102897] Updated weights for policy 0, policy_version 32030 (0.0009) +[2023-10-08 13:03:05,116][102898] Updated weights for policy 1, policy_version 32040 (0.0008) +[2023-10-08 13:03:05,489][102898] Updated weights for policy 1, policy_version 32050 (0.0008) +[2023-10-08 13:03:05,849][102898] Updated weights for policy 1, policy_version 32060 (0.0008) +[2023-10-08 13:03:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 65634304. Throughput: 0: 1793.3, 1: 1789.3. Samples: 16410200. Policy #0 lag: (min: 6.0, avg: 13.2, max: 38.0) +[2023-10-08 13:03:06,876][101941] Avg episode reward: [(0, '6.950'), (1, '5.840')] +[2023-10-08 13:03:08,771][102897] Updated weights for policy 0, policy_version 32040 (0.0008) +[2023-10-08 13:03:09,149][102897] Updated weights for policy 0, policy_version 32050 (0.0009) +[2023-10-08 13:03:09,499][102898] Updated weights for policy 1, policy_version 32070 (0.0008) +[2023-10-08 13:03:09,507][102897] Updated weights for policy 0, policy_version 32060 (0.0007) +[2023-10-08 13:03:09,875][102898] Updated weights for policy 1, policy_version 32080 (0.0007) +[2023-10-08 13:03:10,237][102898] Updated weights for policy 1, policy_version 32090 (0.0009) +[2023-10-08 13:03:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 65699840. Throughput: 0: 1774.8, 1: 1773.7. Samples: 16430276. Policy #0 lag: (min: 6.0, avg: 13.2, max: 38.0) +[2023-10-08 13:03:11,876][101941] Avg episode reward: [(0, '6.270'), (1, '5.110')] +[2023-10-08 13:03:13,351][102897] Updated weights for policy 0, policy_version 32070 (0.0009) +[2023-10-08 13:03:13,716][102897] Updated weights for policy 0, policy_version 32080 (0.0010) +[2023-10-08 13:03:13,992][102898] Updated weights for policy 1, policy_version 32100 (0.0009) +[2023-10-08 13:03:14,079][102897] Updated weights for policy 0, policy_version 32090 (0.0007) +[2023-10-08 13:03:14,356][102898] Updated weights for policy 1, policy_version 32110 (0.0008) +[2023-10-08 13:03:14,732][102898] Updated weights for policy 1, policy_version 32120 (0.0011) +[2023-10-08 13:03:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 65765376. Throughput: 0: 1778.8, 1: 1772.0. Samples: 16452690. Policy #0 lag: (min: 6.0, avg: 13.2, max: 38.0) +[2023-10-08 13:03:16,875][101941] Avg episode reward: [(0, '6.770'), (1, '5.760')] +[2023-10-08 13:03:18,026][102897] Updated weights for policy 0, policy_version 32100 (0.0009) +[2023-10-08 13:03:18,393][102897] Updated weights for policy 0, policy_version 32110 (0.0009) +[2023-10-08 13:03:18,455][102898] Updated weights for policy 1, policy_version 32130 (0.0008) +[2023-10-08 13:03:18,762][102897] Updated weights for policy 0, policy_version 32120 (0.0009) +[2023-10-08 13:03:18,824][102898] Updated weights for policy 1, policy_version 32140 (0.0007) +[2023-10-08 13:03:19,188][102898] Updated weights for policy 1, policy_version 32150 (0.0007) +[2023-10-08 13:03:19,569][102898] Updated weights for policy 1, policy_version 32160 (0.0007) +[2023-10-08 13:03:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 65830912. Throughput: 0: 1775.1, 1: 1779.3. Samples: 16462530. Policy #0 lag: (min: 14.0, avg: 14.2, max: 23.0) +[2023-10-08 13:03:21,876][101941] Avg episode reward: [(0, '6.830'), (1, '6.520')] +[2023-10-08 13:03:22,634][102897] Updated weights for policy 0, policy_version 32130 (0.0011) +[2023-10-08 13:03:23,002][102897] Updated weights for policy 0, policy_version 32140 (0.0008) +[2023-10-08 13:03:23,330][102898] Updated weights for policy 1, policy_version 32170 (0.0008) +[2023-10-08 13:03:23,377][102897] Updated weights for policy 0, policy_version 32150 (0.0009) +[2023-10-08 13:03:23,697][102898] Updated weights for policy 1, policy_version 32180 (0.0008) +[2023-10-08 13:03:23,751][102897] Updated weights for policy 0, policy_version 32160 (0.0009) +[2023-10-08 13:03:24,060][102898] Updated weights for policy 1, policy_version 32190 (0.0010) +[2023-10-08 13:03:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 65896448. Throughput: 0: 1774.6, 1: 1776.8. Samples: 16484500. Policy #0 lag: (min: 14.0, avg: 14.2, max: 23.0) +[2023-10-08 13:03:26,876][101941] Avg episode reward: [(0, '6.270'), (1, '6.580')] +[2023-10-08 13:03:27,459][102897] Updated weights for policy 0, policy_version 32170 (0.0007) +[2023-10-08 13:03:27,836][102897] Updated weights for policy 0, policy_version 32180 (0.0007) +[2023-10-08 13:03:27,849][102898] Updated weights for policy 1, policy_version 32200 (0.0009) +[2023-10-08 13:03:28,201][102897] Updated weights for policy 0, policy_version 32190 (0.0009) +[2023-10-08 13:03:28,211][102898] Updated weights for policy 1, policy_version 32210 (0.0007) +[2023-10-08 13:03:28,574][102898] Updated weights for policy 1, policy_version 32220 (0.0007) +[2023-10-08 13:03:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 65961984. Throughput: 0: 1794.4, 1: 1779.9. Samples: 16506752. Policy #0 lag: (min: 14.0, avg: 14.2, max: 23.0) +[2023-10-08 13:03:31,876][101941] Avg episode reward: [(0, '5.670'), (1, '6.480')] +[2023-10-08 13:03:32,012][102897] Updated weights for policy 0, policy_version 32200 (0.0008) +[2023-10-08 13:03:32,387][102897] Updated weights for policy 0, policy_version 32210 (0.0007) +[2023-10-08 13:03:32,423][102898] Updated weights for policy 1, policy_version 32230 (0.0008) +[2023-10-08 13:03:32,752][102897] Updated weights for policy 0, policy_version 32220 (0.0007) +[2023-10-08 13:03:32,778][102898] Updated weights for policy 1, policy_version 32240 (0.0007) +[2023-10-08 13:03:33,146][102898] Updated weights for policy 1, policy_version 32250 (0.0007) +[2023-10-08 13:03:36,531][102897] Updated weights for policy 0, policy_version 32230 (0.0009) +[2023-10-08 13:03:36,870][102898] Updated weights for policy 1, policy_version 32260 (0.0008) +[2023-10-08 13:03:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66027520. Throughput: 0: 1779.7, 1: 1780.6. Samples: 16516566. Policy #0 lag: (min: 14.0, avg: 14.2, max: 23.0) +[2023-10-08 13:03:36,875][101941] Avg episode reward: [(0, '5.510'), (1, '7.030')] +[2023-10-08 13:03:36,910][102897] Updated weights for policy 0, policy_version 32240 (0.0007) +[2023-10-08 13:03:37,262][102898] Updated weights for policy 1, policy_version 32270 (0.0008) +[2023-10-08 13:03:37,281][102897] Updated weights for policy 0, policy_version 32250 (0.0007) +[2023-10-08 13:03:37,640][102898] Updated weights for policy 1, policy_version 32280 (0.0007) +[2023-10-08 13:03:41,046][102897] Updated weights for policy 0, policy_version 32260 (0.0008) +[2023-10-08 13:03:41,411][102897] Updated weights for policy 0, policy_version 32270 (0.0008) +[2023-10-08 13:03:41,447][102898] Updated weights for policy 1, policy_version 32290 (0.0009) +[2023-10-08 13:03:41,775][102897] Updated weights for policy 0, policy_version 32280 (0.0009) +[2023-10-08 13:03:41,810][102898] Updated weights for policy 1, policy_version 32300 (0.0007) +[2023-10-08 13:03:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66093056. Throughput: 0: 1788.7, 1: 1778.4. Samples: 16538758. Policy #0 lag: (min: 14.0, avg: 14.2, max: 23.0) +[2023-10-08 13:03:41,875][101941] Avg episode reward: [(0, '5.760'), (1, '6.430')] +[2023-10-08 13:03:42,180][102898] Updated weights for policy 1, policy_version 32310 (0.0007) +[2023-10-08 13:03:42,545][102898] Updated weights for policy 1, policy_version 32320 (0.0007) +[2023-10-08 13:03:45,459][102897] Updated weights for policy 0, policy_version 32290 (0.0007) +[2023-10-08 13:03:45,826][102897] Updated weights for policy 0, policy_version 32300 (0.0010) +[2023-10-08 13:03:46,192][102897] Updated weights for policy 0, policy_version 32310 (0.0007) +[2023-10-08 13:03:46,283][102898] Updated weights for policy 1, policy_version 32330 (0.0007) +[2023-10-08 13:03:46,560][102897] Updated weights for policy 0, policy_version 32320 (0.0007) +[2023-10-08 13:03:46,657][102898] Updated weights for policy 1, policy_version 32340 (0.0007) +[2023-10-08 13:03:46,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 66191360. Throughput: 0: 1783.5, 1: 1803.9. Samples: 16559466. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 13:03:46,876][101941] Avg episode reward: [(0, '6.230'), (1, '6.000')] +[2023-10-08 13:03:47,033][102898] Updated weights for policy 1, policy_version 32350 (0.0008) +[2023-10-08 13:03:50,419][102897] Updated weights for policy 0, policy_version 32330 (0.0008) +[2023-10-08 13:03:50,805][102897] Updated weights for policy 0, policy_version 32340 (0.0007) +[2023-10-08 13:03:50,813][102898] Updated weights for policy 1, policy_version 32360 (0.0007) +[2023-10-08 13:03:51,171][102897] Updated weights for policy 0, policy_version 32350 (0.0007) +[2023-10-08 13:03:51,182][102898] Updated weights for policy 1, policy_version 32370 (0.0008) +[2023-10-08 13:03:51,545][102898] Updated weights for policy 1, policy_version 32380 (0.0007) +[2023-10-08 13:03:51,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 66289664. Throughput: 0: 1785.9, 1: 1782.8. Samples: 16570794. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 13:03:51,876][101941] Avg episode reward: [(0, '6.310'), (1, '6.290')] +[2023-10-08 13:03:55,029][102897] Updated weights for policy 0, policy_version 32360 (0.0008) +[2023-10-08 13:03:55,330][102898] Updated weights for policy 1, policy_version 32390 (0.0008) +[2023-10-08 13:03:55,393][102897] Updated weights for policy 0, policy_version 32370 (0.0007) +[2023-10-08 13:03:55,702][102898] Updated weights for policy 1, policy_version 32400 (0.0010) +[2023-10-08 13:03:55,767][102897] Updated weights for policy 0, policy_version 32380 (0.0008) +[2023-10-08 13:03:56,062][102898] Updated weights for policy 1, policy_version 32410 (0.0007) +[2023-10-08 13:03:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 66355200. Throughput: 0: 1786.6, 1: 1805.7. Samples: 16591928. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 13:03:56,876][101941] Avg episode reward: [(0, '6.510'), (1, '6.830')] +[2023-10-08 13:03:59,494][102897] Updated weights for policy 0, policy_version 32390 (0.0009) +[2023-10-08 13:03:59,762][102898] Updated weights for policy 1, policy_version 32420 (0.0007) +[2023-10-08 13:03:59,859][102897] Updated weights for policy 0, policy_version 32400 (0.0007) +[2023-10-08 13:04:00,126][102898] Updated weights for policy 1, policy_version 32430 (0.0007) +[2023-10-08 13:04:00,236][102897] Updated weights for policy 0, policy_version 32410 (0.0007) +[2023-10-08 13:04:00,482][102898] Updated weights for policy 1, policy_version 32440 (0.0009) +[2023-10-08 13:04:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 66420736. Throughput: 0: 1772.4, 1: 1783.8. Samples: 16612720. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 13:04:01,876][101941] Avg episode reward: [(0, '6.880'), (1, '6.570')] +[2023-10-08 13:04:04,022][102897] Updated weights for policy 0, policy_version 32420 (0.0007) +[2023-10-08 13:04:04,195][102898] Updated weights for policy 1, policy_version 32450 (0.0010) +[2023-10-08 13:04:04,383][102897] Updated weights for policy 0, policy_version 32430 (0.0009) +[2023-10-08 13:04:04,558][102898] Updated weights for policy 1, policy_version 32460 (0.0009) +[2023-10-08 13:04:04,752][102897] Updated weights for policy 0, policy_version 32440 (0.0007) +[2023-10-08 13:04:04,933][102898] Updated weights for policy 1, policy_version 32470 (0.0007) +[2023-10-08 13:04:05,297][102898] Updated weights for policy 1, policy_version 32480 (0.0008) +[2023-10-08 13:04:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 66486272. Throughput: 0: 1792.7, 1: 1802.8. Samples: 16624330. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 13:04:06,876][101941] Avg episode reward: [(0, '5.990'), (1, '6.210')] +[2023-10-08 13:04:08,509][102897] Updated weights for policy 0, policy_version 32450 (0.0008) +[2023-10-08 13:04:08,881][102897] Updated weights for policy 0, policy_version 32460 (0.0008) +[2023-10-08 13:04:08,971][102898] Updated weights for policy 1, policy_version 32490 (0.0008) +[2023-10-08 13:04:09,259][102897] Updated weights for policy 0, policy_version 32470 (0.0009) +[2023-10-08 13:04:09,329][102898] Updated weights for policy 1, policy_version 32500 (0.0007) +[2023-10-08 13:04:09,628][102897] Updated weights for policy 0, policy_version 32480 (0.0008) +[2023-10-08 13:04:09,696][102898] Updated weights for policy 1, policy_version 32510 (0.0007) +[2023-10-08 13:04:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66551808. Throughput: 0: 1776.1, 1: 1788.4. Samples: 16644904. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 13:04:11,876][101941] Avg episode reward: [(0, '5.590'), (1, '6.400')] +[2023-10-08 13:04:13,438][102898] Updated weights for policy 1, policy_version 32520 (0.0009) +[2023-10-08 13:04:13,494][102897] Updated weights for policy 0, policy_version 32490 (0.0009) +[2023-10-08 13:04:13,806][102898] Updated weights for policy 1, policy_version 32530 (0.0007) +[2023-10-08 13:04:13,861][102897] Updated weights for policy 0, policy_version 32500 (0.0009) +[2023-10-08 13:04:14,180][102898] Updated weights for policy 1, policy_version 32540 (0.0008) +[2023-10-08 13:04:14,239][102897] Updated weights for policy 0, policy_version 32510 (0.0007) +[2023-10-08 13:04:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66617344. Throughput: 0: 1772.2, 1: 1787.3. Samples: 16666928. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 13:04:16,875][101941] Avg episode reward: [(0, '5.970'), (1, '6.890')] +[2023-10-08 13:04:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000032544_33325056.pth... +[2023-10-08 13:04:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000032512_33292288.pth... +[2023-10-08 13:04:16,918][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000030880_31621120.pth +[2023-10-08 13:04:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000030848_31588352.pth +[2023-10-08 13:04:17,984][102898] Updated weights for policy 1, policy_version 32550 (0.0009) +[2023-10-08 13:04:18,037][102897] Updated weights for policy 0, policy_version 32520 (0.0008) +[2023-10-08 13:04:18,356][102898] Updated weights for policy 1, policy_version 32560 (0.0007) +[2023-10-08 13:04:18,409][102897] Updated weights for policy 0, policy_version 32530 (0.0008) +[2023-10-08 13:04:18,725][102898] Updated weights for policy 1, policy_version 32570 (0.0007) +[2023-10-08 13:04:18,775][102897] Updated weights for policy 0, policy_version 32540 (0.0009) +[2023-10-08 13:04:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66682880. Throughput: 0: 1774.2, 1: 1782.3. Samples: 16676606. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 13:04:21,876][101941] Avg episode reward: [(0, '6.200'), (1, '6.800')] +[2023-10-08 13:04:22,583][102897] Updated weights for policy 0, policy_version 32550 (0.0007) +[2023-10-08 13:04:22,684][102898] Updated weights for policy 1, policy_version 32580 (0.0007) +[2023-10-08 13:04:22,961][102897] Updated weights for policy 0, policy_version 32560 (0.0007) +[2023-10-08 13:04:23,060][102898] Updated weights for policy 1, policy_version 32590 (0.0008) +[2023-10-08 13:04:23,331][102897] Updated weights for policy 0, policy_version 32570 (0.0007) +[2023-10-08 13:04:23,428][102898] Updated weights for policy 1, policy_version 32600 (0.0009) +[2023-10-08 13:04:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66748416. Throughput: 0: 1770.8, 1: 1778.9. Samples: 16698496. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 13:04:26,876][101941] Avg episode reward: [(0, '6.510'), (1, '6.830')] +[2023-10-08 13:04:27,156][102897] Updated weights for policy 0, policy_version 32580 (0.0007) +[2023-10-08 13:04:27,213][102898] Updated weights for policy 1, policy_version 32610 (0.0007) +[2023-10-08 13:04:27,543][102897] Updated weights for policy 0, policy_version 32590 (0.0007) +[2023-10-08 13:04:27,618][102898] Updated weights for policy 1, policy_version 32620 (0.0008) +[2023-10-08 13:04:27,913][102897] Updated weights for policy 0, policy_version 32600 (0.0009) +[2023-10-08 13:04:27,978][102898] Updated weights for policy 1, policy_version 32630 (0.0008) +[2023-10-08 13:04:28,354][102898] Updated weights for policy 1, policy_version 32640 (0.0008) +[2023-10-08 13:04:31,636][102897] Updated weights for policy 0, policy_version 32610 (0.0009) +[2023-10-08 13:04:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66813952. Throughput: 0: 1793.3, 1: 1779.8. Samples: 16720254. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 13:04:31,875][101941] Avg episode reward: [(0, '7.080'), (1, '6.650')] +[2023-10-08 13:04:32,003][102897] Updated weights for policy 0, policy_version 32620 (0.0008) +[2023-10-08 13:04:32,230][102898] Updated weights for policy 1, policy_version 32650 (0.0007) +[2023-10-08 13:04:32,375][102897] Updated weights for policy 0, policy_version 32630 (0.0008) +[2023-10-08 13:04:32,588][102898] Updated weights for policy 1, policy_version 32660 (0.0008) +[2023-10-08 13:04:32,736][102897] Updated weights for policy 0, policy_version 32640 (0.0007) +[2023-10-08 13:04:32,961][102898] Updated weights for policy 1, policy_version 32670 (0.0007) +[2023-10-08 13:04:36,493][102897] Updated weights for policy 0, policy_version 32650 (0.0008) +[2023-10-08 13:04:36,847][102898] Updated weights for policy 1, policy_version 32680 (0.0007) +[2023-10-08 13:04:36,867][102897] Updated weights for policy 0, policy_version 32660 (0.0008) +[2023-10-08 13:04:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 66879488. Throughput: 0: 1766.3, 1: 1770.3. Samples: 16729942. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 13:04:36,876][101941] Avg episode reward: [(0, '7.170'), (1, '5.960')] +[2023-10-08 13:04:37,214][102898] Updated weights for policy 1, policy_version 32690 (0.0008) +[2023-10-08 13:04:37,238][102897] Updated weights for policy 0, policy_version 32670 (0.0007) +[2023-10-08 13:04:37,589][102898] Updated weights for policy 1, policy_version 32700 (0.0010) +[2023-10-08 13:04:41,031][102897] Updated weights for policy 0, policy_version 32680 (0.0009) +[2023-10-08 13:04:41,360][102898] Updated weights for policy 1, policy_version 32710 (0.0009) +[2023-10-08 13:04:41,407][102897] Updated weights for policy 0, policy_version 32690 (0.0007) +[2023-10-08 13:04:41,732][102898] Updated weights for policy 1, policy_version 32720 (0.0008) +[2023-10-08 13:04:41,773][102897] Updated weights for policy 0, policy_version 32700 (0.0008) +[2023-10-08 13:04:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 66945024. Throughput: 0: 1788.4, 1: 1771.8. Samples: 16752138. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 13:04:41,875][101941] Avg episode reward: [(0, '6.360'), (1, '5.770')] +[2023-10-08 13:04:42,098][102898] Updated weights for policy 1, policy_version 32730 (0.0008) +[2023-10-08 13:04:45,509][102897] Updated weights for policy 0, policy_version 32710 (0.0008) +[2023-10-08 13:04:45,880][102897] Updated weights for policy 0, policy_version 32720 (0.0009) +[2023-10-08 13:04:45,943][102898] Updated weights for policy 1, policy_version 32740 (0.0009) +[2023-10-08 13:04:46,263][102897] Updated weights for policy 0, policy_version 32730 (0.0009) +[2023-10-08 13:04:46,308][102898] Updated weights for policy 1, policy_version 32750 (0.0007) +[2023-10-08 13:04:46,677][102898] Updated weights for policy 1, policy_version 32760 (0.0008) +[2023-10-08 13:04:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 67043328. Throughput: 0: 1770.7, 1: 1773.4. Samples: 16772204. Policy #0 lag: (min: 31.0, avg: 33.7, max: 63.0) +[2023-10-08 13:04:46,876][101941] Avg episode reward: [(0, '6.100'), (1, '6.910')] +[2023-10-08 13:04:49,984][102897] Updated weights for policy 0, policy_version 32740 (0.0008) +[2023-10-08 13:04:50,359][102897] Updated weights for policy 0, policy_version 32750 (0.0009) +[2023-10-08 13:04:50,474][102898] Updated weights for policy 1, policy_version 32770 (0.0010) +[2023-10-08 13:04:50,736][102897] Updated weights for policy 0, policy_version 32760 (0.0007) +[2023-10-08 13:04:50,840][102898] Updated weights for policy 1, policy_version 32780 (0.0009) +[2023-10-08 13:04:51,211][102898] Updated weights for policy 1, policy_version 32790 (0.0007) +[2023-10-08 13:04:51,571][102898] Updated weights for policy 1, policy_version 32800 (0.0007) +[2023-10-08 13:04:51,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 67141632. Throughput: 0: 1782.6, 1: 1761.7. Samples: 16783822. Policy #0 lag: (min: 12.0, avg: 14.0, max: 43.0) +[2023-10-08 13:04:51,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.270')] +[2023-10-08 13:04:54,668][102897] Updated weights for policy 0, policy_version 32770 (0.0008) +[2023-10-08 13:04:55,048][102897] Updated weights for policy 0, policy_version 32780 (0.0007) +[2023-10-08 13:04:55,407][102897] Updated weights for policy 0, policy_version 32790 (0.0007) +[2023-10-08 13:04:55,442][102898] Updated weights for policy 1, policy_version 32810 (0.0007) +[2023-10-08 13:04:55,786][102897] Updated weights for policy 0, policy_version 32800 (0.0009) +[2023-10-08 13:04:55,810][102898] Updated weights for policy 1, policy_version 32820 (0.0009) +[2023-10-08 13:04:56,171][102898] Updated weights for policy 1, policy_version 32830 (0.0007) +[2023-10-08 13:04:56,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 67207168. Throughput: 0: 1772.2, 1: 1772.3. Samples: 16804406. Policy #0 lag: (min: 12.0, avg: 14.0, max: 43.0) +[2023-10-08 13:04:56,876][101941] Avg episode reward: [(0, '6.200'), (1, '7.590')] +[2023-10-08 13:04:59,497][102897] Updated weights for policy 0, policy_version 32810 (0.0007) +[2023-10-08 13:04:59,860][102897] Updated weights for policy 0, policy_version 32820 (0.0007) +[2023-10-08 13:05:00,044][102898] Updated weights for policy 1, policy_version 32840 (0.0007) +[2023-10-08 13:05:00,224][102897] Updated weights for policy 0, policy_version 32830 (0.0008) +[2023-10-08 13:05:00,412][102898] Updated weights for policy 1, policy_version 32850 (0.0007) +[2023-10-08 13:05:00,778][102898] Updated weights for policy 1, policy_version 32860 (0.0007) +[2023-10-08 13:05:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 67272704. Throughput: 0: 1766.8, 1: 1753.9. Samples: 16825362. Policy #0 lag: (min: 12.0, avg: 14.0, max: 43.0) +[2023-10-08 13:05:01,876][101941] Avg episode reward: [(0, '6.480'), (1, '7.240')] +[2023-10-08 13:05:03,868][102897] Updated weights for policy 0, policy_version 32840 (0.0008) +[2023-10-08 13:05:04,236][102897] Updated weights for policy 0, policy_version 32850 (0.0007) +[2023-10-08 13:05:04,473][102898] Updated weights for policy 1, policy_version 32870 (0.0008) +[2023-10-08 13:05:04,614][102897] Updated weights for policy 0, policy_version 32860 (0.0007) +[2023-10-08 13:05:04,843][102898] Updated weights for policy 1, policy_version 32880 (0.0009) +[2023-10-08 13:05:05,222][102898] Updated weights for policy 1, policy_version 32890 (0.0007) +[2023-10-08 13:05:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 67338240. Throughput: 0: 1780.9, 1: 1786.3. Samples: 16837130. Policy #0 lag: (min: 12.0, avg: 14.0, max: 43.0) +[2023-10-08 13:05:06,876][101941] Avg episode reward: [(0, '7.190'), (1, '7.350')] +[2023-10-08 13:05:08,384][102897] Updated weights for policy 0, policy_version 32870 (0.0008) +[2023-10-08 13:05:08,756][102897] Updated weights for policy 0, policy_version 32880 (0.0008) +[2023-10-08 13:05:09,062][102898] Updated weights for policy 1, policy_version 32900 (0.0008) +[2023-10-08 13:05:09,127][102897] Updated weights for policy 0, policy_version 32890 (0.0010) +[2023-10-08 13:05:09,432][102898] Updated weights for policy 1, policy_version 32910 (0.0008) +[2023-10-08 13:05:09,797][102898] Updated weights for policy 1, policy_version 32920 (0.0008) +[2023-10-08 13:05:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 67403776. Throughput: 0: 1775.9, 1: 1761.3. Samples: 16857672. Policy #0 lag: (min: 12.0, avg: 14.0, max: 43.0) +[2023-10-08 13:05:11,876][101941] Avg episode reward: [(0, '6.640'), (1, '7.870')] +[2023-10-08 13:05:13,086][102897] Updated weights for policy 0, policy_version 32900 (0.0008) +[2023-10-08 13:05:13,470][102897] Updated weights for policy 0, policy_version 32910 (0.0008) +[2023-10-08 13:05:13,648][102898] Updated weights for policy 1, policy_version 32930 (0.0007) +[2023-10-08 13:05:13,836][102897] Updated weights for policy 0, policy_version 32920 (0.0008) +[2023-10-08 13:05:14,041][102898] Updated weights for policy 1, policy_version 32940 (0.0008) +[2023-10-08 13:05:14,400][102898] Updated weights for policy 1, policy_version 32950 (0.0007) +[2023-10-08 13:05:14,768][102898] Updated weights for policy 1, policy_version 32960 (0.0008) +[2023-10-08 13:05:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 67469312. Throughput: 0: 1776.4, 1: 1767.2. Samples: 16879718. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 13:05:16,876][101941] Avg episode reward: [(0, '6.430'), (1, '7.440')] +[2023-10-08 13:05:17,483][102897] Updated weights for policy 0, policy_version 32930 (0.0008) +[2023-10-08 13:05:17,859][102897] Updated weights for policy 0, policy_version 32940 (0.0008) +[2023-10-08 13:05:18,227][102897] Updated weights for policy 0, policy_version 32950 (0.0008) +[2023-10-08 13:05:18,475][102898] Updated weights for policy 1, policy_version 32970 (0.0008) +[2023-10-08 13:05:18,598][102897] Updated weights for policy 0, policy_version 32960 (0.0008) +[2023-10-08 13:05:18,851][102898] Updated weights for policy 1, policy_version 32980 (0.0008) +[2023-10-08 13:05:19,215][102898] Updated weights for policy 1, policy_version 32990 (0.0007) +[2023-10-08 13:05:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 67534848. Throughput: 0: 1777.9, 1: 1767.4. Samples: 16889480. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 13:05:21,875][101941] Avg episode reward: [(0, '6.210'), (1, '7.120')] +[2023-10-08 13:05:22,562][102897] Updated weights for policy 0, policy_version 32970 (0.0011) +[2023-10-08 13:05:22,933][102897] Updated weights for policy 0, policy_version 32980 (0.0009) +[2023-10-08 13:05:23,170][102898] Updated weights for policy 1, policy_version 33000 (0.0007) +[2023-10-08 13:05:23,306][102897] Updated weights for policy 0, policy_version 32990 (0.0009) +[2023-10-08 13:05:23,541][102898] Updated weights for policy 1, policy_version 33010 (0.0007) +[2023-10-08 13:05:23,903][102898] Updated weights for policy 1, policy_version 33020 (0.0008) +[2023-10-08 13:05:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 67600384. Throughput: 0: 1772.9, 1: 1768.7. Samples: 16911508. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 13:05:26,876][101941] Avg episode reward: [(0, '5.880'), (1, '7.350')] +[2023-10-08 13:05:27,075][102897] Updated weights for policy 0, policy_version 33000 (0.0007) +[2023-10-08 13:05:27,449][102897] Updated weights for policy 0, policy_version 33010 (0.0010) +[2023-10-08 13:05:27,578][102898] Updated weights for policy 1, policy_version 33030 (0.0007) +[2023-10-08 13:05:27,824][102897] Updated weights for policy 0, policy_version 33020 (0.0008) +[2023-10-08 13:05:27,939][102898] Updated weights for policy 1, policy_version 33040 (0.0009) +[2023-10-08 13:05:28,306][102898] Updated weights for policy 1, policy_version 33050 (0.0010) +[2023-10-08 13:05:31,626][102897] Updated weights for policy 0, policy_version 33030 (0.0007) +[2023-10-08 13:05:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 67665920. Throughput: 0: 1800.8, 1: 1787.6. Samples: 16933678. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 13:05:31,876][101941] Avg episode reward: [(0, '5.820'), (1, '7.280')] +[2023-10-08 13:05:32,001][102897] Updated weights for policy 0, policy_version 33040 (0.0008) +[2023-10-08 13:05:32,029][102898] Updated weights for policy 1, policy_version 33060 (0.0010) +[2023-10-08 13:05:32,378][102897] Updated weights for policy 0, policy_version 33050 (0.0007) +[2023-10-08 13:05:32,389][102898] Updated weights for policy 1, policy_version 33070 (0.0010) +[2023-10-08 13:05:32,754][102898] Updated weights for policy 1, policy_version 33080 (0.0010) +[2023-10-08 13:05:36,148][102897] Updated weights for policy 0, policy_version 33060 (0.0007) +[2023-10-08 13:05:36,516][102897] Updated weights for policy 0, policy_version 33070 (0.0007) +[2023-10-08 13:05:36,591][102898] Updated weights for policy 1, policy_version 33090 (0.0010) +[2023-10-08 13:05:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 67731456. Throughput: 0: 1770.9, 1: 1774.4. Samples: 16943364. Policy #0 lag: (min: 31.0, avg: 31.2, max: 41.0) +[2023-10-08 13:05:36,876][101941] Avg episode reward: [(0, '6.420'), (1, '7.230')] +[2023-10-08 13:05:36,885][102897] Updated weights for policy 0, policy_version 33080 (0.0009) +[2023-10-08 13:05:36,961][102898] Updated weights for policy 1, policy_version 33100 (0.0007) +[2023-10-08 13:05:37,338][102898] Updated weights for policy 1, policy_version 33110 (0.0008) +[2023-10-08 13:05:37,698][102898] Updated weights for policy 1, policy_version 33120 (0.0010) +[2023-10-08 13:05:40,668][102897] Updated weights for policy 0, policy_version 33090 (0.0007) +[2023-10-08 13:05:41,041][102897] Updated weights for policy 0, policy_version 33100 (0.0008) +[2023-10-08 13:05:41,412][102897] Updated weights for policy 0, policy_version 33110 (0.0008) +[2023-10-08 13:05:41,576][102898] Updated weights for policy 1, policy_version 33130 (0.0010) +[2023-10-08 13:05:41,783][102897] Updated weights for policy 0, policy_version 33120 (0.0007) +[2023-10-08 13:05:41,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 67829760. Throughput: 0: 1797.3, 1: 1780.6. Samples: 16965412. Policy #0 lag: (min: 16.0, avg: 32.6, max: 48.0) +[2023-10-08 13:05:41,876][101941] Avg episode reward: [(0, '6.970'), (1, '7.430')] +[2023-10-08 13:05:41,948][102898] Updated weights for policy 1, policy_version 33140 (0.0009) +[2023-10-08 13:05:42,310][102898] Updated weights for policy 1, policy_version 33150 (0.0010) +[2023-10-08 13:05:45,636][102897] Updated weights for policy 0, policy_version 33130 (0.0009) +[2023-10-08 13:05:45,996][102897] Updated weights for policy 0, policy_version 33140 (0.0009) +[2023-10-08 13:05:46,157][102898] Updated weights for policy 1, policy_version 33160 (0.0009) +[2023-10-08 13:05:46,363][102897] Updated weights for policy 0, policy_version 33150 (0.0008) +[2023-10-08 13:05:46,516][102898] Updated weights for policy 1, policy_version 33170 (0.0007) +[2023-10-08 13:05:46,875][102898] Updated weights for policy 1, policy_version 33180 (0.0008) +[2023-10-08 13:05:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 67895296. Throughput: 0: 1775.4, 1: 1784.3. Samples: 16985548. Policy #0 lag: (min: 16.0, avg: 32.6, max: 48.0) +[2023-10-08 13:05:46,876][101941] Avg episode reward: [(0, '6.440'), (1, '7.250')] +[2023-10-08 13:05:50,056][102897] Updated weights for policy 0, policy_version 33160 (0.0009) +[2023-10-08 13:05:50,435][102897] Updated weights for policy 0, policy_version 33170 (0.0008) +[2023-10-08 13:05:50,801][102897] Updated weights for policy 0, policy_version 33180 (0.0008) +[2023-10-08 13:05:50,816][102898] Updated weights for policy 1, policy_version 33190 (0.0009) +[2023-10-08 13:05:51,172][102898] Updated weights for policy 1, policy_version 33200 (0.0008) +[2023-10-08 13:05:51,546][102898] Updated weights for policy 1, policy_version 33210 (0.0008) +[2023-10-08 13:05:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 67993600. Throughput: 0: 1789.4, 1: 1768.0. Samples: 16997212. Policy #0 lag: (min: 16.0, avg: 32.6, max: 48.0) +[2023-10-08 13:05:51,876][101941] Avg episode reward: [(0, '6.220'), (1, '7.070')] +[2023-10-08 13:05:54,590][102897] Updated weights for policy 0, policy_version 33190 (0.0008) +[2023-10-08 13:05:54,960][102897] Updated weights for policy 0, policy_version 33200 (0.0007) +[2023-10-08 13:05:55,323][102898] Updated weights for policy 1, policy_version 33220 (0.0008) +[2023-10-08 13:05:55,332][102897] Updated weights for policy 0, policy_version 33210 (0.0008) +[2023-10-08 13:05:55,695][102898] Updated weights for policy 1, policy_version 33230 (0.0008) +[2023-10-08 13:05:56,057][102898] Updated weights for policy 1, policy_version 33240 (0.0007) +[2023-10-08 13:05:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 68059136. Throughput: 0: 1772.8, 1: 1789.5. Samples: 17017974. Policy #0 lag: (min: 16.0, avg: 32.6, max: 48.0) +[2023-10-08 13:05:56,876][101941] Avg episode reward: [(0, '6.480'), (1, '7.130')] +[2023-10-08 13:05:59,171][102897] Updated weights for policy 0, policy_version 33220 (0.0009) +[2023-10-08 13:05:59,568][102897] Updated weights for policy 0, policy_version 33230 (0.0008) +[2023-10-08 13:05:59,942][102897] Updated weights for policy 0, policy_version 33240 (0.0008) +[2023-10-08 13:05:59,957][102898] Updated weights for policy 1, policy_version 33250 (0.0009) +[2023-10-08 13:06:00,356][102898] Updated weights for policy 1, policy_version 33260 (0.0009) +[2023-10-08 13:06:00,727][102898] Updated weights for policy 1, policy_version 33270 (0.0008) +[2023-10-08 13:06:01,091][102898] Updated weights for policy 1, policy_version 33280 (0.0008) +[2023-10-08 13:06:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 68124672. Throughput: 0: 1767.2, 1: 1762.0. Samples: 17038532. Policy #0 lag: (min: 20.0, avg: 20.1, max: 27.0) +[2023-10-08 13:06:01,876][101941] Avg episode reward: [(0, '6.600'), (1, '6.740')] +[2023-10-08 13:06:03,728][102897] Updated weights for policy 0, policy_version 33250 (0.0008) +[2023-10-08 13:06:04,096][102897] Updated weights for policy 0, policy_version 33260 (0.0008) +[2023-10-08 13:06:04,468][102897] Updated weights for policy 0, policy_version 33270 (0.0007) +[2023-10-08 13:06:04,844][102897] Updated weights for policy 0, policy_version 33280 (0.0007) +[2023-10-08 13:06:04,877][102898] Updated weights for policy 1, policy_version 33290 (0.0007) +[2023-10-08 13:06:05,246][102898] Updated weights for policy 1, policy_version 33300 (0.0009) +[2023-10-08 13:06:05,603][102898] Updated weights for policy 1, policy_version 33310 (0.0008) +[2023-10-08 13:06:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68190208. Throughput: 0: 1776.3, 1: 1791.3. Samples: 17050022. Policy #0 lag: (min: 20.0, avg: 20.1, max: 27.0) +[2023-10-08 13:06:06,876][101941] Avg episode reward: [(0, '7.090'), (1, '6.960')] +[2023-10-08 13:06:08,662][102897] Updated weights for policy 0, policy_version 33290 (0.0008) +[2023-10-08 13:06:09,033][102897] Updated weights for policy 0, policy_version 33300 (0.0008) +[2023-10-08 13:06:09,273][102898] Updated weights for policy 1, policy_version 33320 (0.0007) +[2023-10-08 13:06:09,404][102897] Updated weights for policy 0, policy_version 33310 (0.0007) +[2023-10-08 13:06:09,640][102898] Updated weights for policy 1, policy_version 33330 (0.0007) +[2023-10-08 13:06:10,006][102898] Updated weights for policy 1, policy_version 33340 (0.0007) +[2023-10-08 13:06:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68255744. Throughput: 0: 1766.9, 1: 1765.6. Samples: 17070468. Policy #0 lag: (min: 20.0, avg: 20.1, max: 27.0) +[2023-10-08 13:06:11,875][101941] Avg episode reward: [(0, '6.890'), (1, '7.690')] +[2023-10-08 13:06:13,352][102897] Updated weights for policy 0, policy_version 33320 (0.0007) +[2023-10-08 13:06:13,717][102897] Updated weights for policy 0, policy_version 33330 (0.0009) +[2023-10-08 13:06:13,837][102898] Updated weights for policy 1, policy_version 33350 (0.0008) +[2023-10-08 13:06:14,073][102897] Updated weights for policy 0, policy_version 33340 (0.0007) +[2023-10-08 13:06:14,202][102898] Updated weights for policy 1, policy_version 33360 (0.0007) +[2023-10-08 13:06:14,562][102898] Updated weights for policy 1, policy_version 33370 (0.0010) +[2023-10-08 13:06:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68321280. Throughput: 0: 1770.4, 1: 1764.4. Samples: 17092744. Policy #0 lag: (min: 20.0, avg: 20.1, max: 27.0) +[2023-10-08 13:06:16,876][101941] Avg episode reward: [(0, '6.110'), (1, '7.370')] +[2023-10-08 13:06:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000033344_34144256.pth... +[2023-10-08 13:06:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000033376_34177024.pth... +[2023-10-08 13:06:16,915][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000031712_32473088.pth +[2023-10-08 13:06:16,916][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000031680_32440320.pth +[2023-10-08 13:06:16,919][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000033376_34177024.pth +[2023-10-08 13:06:16,920][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000033344_34144256.pth +[2023-10-08 13:06:17,533][102897] Updated weights for policy 0, policy_version 33350 (0.0009) +[2023-10-08 13:06:17,900][102897] Updated weights for policy 0, policy_version 33360 (0.0009) +[2023-10-08 13:06:18,268][102897] Updated weights for policy 0, policy_version 33370 (0.0008) +[2023-10-08 13:06:18,309][102898] Updated weights for policy 1, policy_version 33380 (0.0009) +[2023-10-08 13:06:18,675][102898] Updated weights for policy 1, policy_version 33390 (0.0007) +[2023-10-08 13:06:19,040][102898] Updated weights for policy 1, policy_version 33400 (0.0007) +[2023-10-08 13:06:21,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 68386816. Throughput: 0: 1773.0, 1: 1766.3. Samples: 17102630. Policy #0 lag: (min: 20.0, avg: 20.1, max: 27.0) +[2023-10-08 13:06:21,876][101941] Avg episode reward: [(0, '6.570'), (1, '7.040')] +[2023-10-08 13:06:22,192][102897] Updated weights for policy 0, policy_version 33380 (0.0007) +[2023-10-08 13:06:22,560][102897] Updated weights for policy 0, policy_version 33390 (0.0009) +[2023-10-08 13:06:22,848][102898] Updated weights for policy 1, policy_version 33410 (0.0007) +[2023-10-08 13:06:22,939][102897] Updated weights for policy 0, policy_version 33400 (0.0008) +[2023-10-08 13:06:23,209][102898] Updated weights for policy 1, policy_version 33420 (0.0007) +[2023-10-08 13:06:23,584][102898] Updated weights for policy 1, policy_version 33430 (0.0009) +[2023-10-08 13:06:23,945][102898] Updated weights for policy 1, policy_version 33440 (0.0009) +[2023-10-08 13:06:26,662][102897] Updated weights for policy 0, policy_version 33410 (0.0008) +[2023-10-08 13:06:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68452352. Throughput: 0: 1771.8, 1: 1769.8. Samples: 17124786. Policy #0 lag: (min: 31.0, avg: 34.9, max: 63.0) +[2023-10-08 13:06:26,876][101941] Avg episode reward: [(0, '6.470'), (1, '7.020')] +[2023-10-08 13:06:27,031][102897] Updated weights for policy 0, policy_version 33420 (0.0011) +[2023-10-08 13:06:27,402][102897] Updated weights for policy 0, policy_version 33430 (0.0010) +[2023-10-08 13:06:27,773][102897] Updated weights for policy 0, policy_version 33440 (0.0007) +[2023-10-08 13:06:27,824][102898] Updated weights for policy 1, policy_version 33450 (0.0009) +[2023-10-08 13:06:28,199][102898] Updated weights for policy 1, policy_version 33460 (0.0008) +[2023-10-08 13:06:28,558][102898] Updated weights for policy 1, policy_version 33470 (0.0008) +[2023-10-08 13:06:31,669][102897] Updated weights for policy 0, policy_version 33450 (0.0007) +[2023-10-08 13:06:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68517888. Throughput: 0: 1799.2, 1: 1784.3. Samples: 17146804. Policy #0 lag: (min: 31.0, avg: 34.9, max: 63.0) +[2023-10-08 13:06:31,876][101941] Avg episode reward: [(0, '6.590'), (1, '7.510')] +[2023-10-08 13:06:32,042][102897] Updated weights for policy 0, policy_version 33460 (0.0007) +[2023-10-08 13:06:32,305][102898] Updated weights for policy 1, policy_version 33480 (0.0007) +[2023-10-08 13:06:32,417][102897] Updated weights for policy 0, policy_version 33470 (0.0008) +[2023-10-08 13:06:32,677][102898] Updated weights for policy 1, policy_version 33490 (0.0008) +[2023-10-08 13:06:33,047][102898] Updated weights for policy 1, policy_version 33500 (0.0010) +[2023-10-08 13:06:36,210][102897] Updated weights for policy 0, policy_version 33480 (0.0009) +[2023-10-08 13:06:36,586][102897] Updated weights for policy 0, policy_version 33490 (0.0011) +[2023-10-08 13:06:36,857][102898] Updated weights for policy 1, policy_version 33510 (0.0009) +[2023-10-08 13:06:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68583424. Throughput: 0: 1768.4, 1: 1770.6. Samples: 17156470. Policy #0 lag: (min: 31.0, avg: 34.9, max: 63.0) +[2023-10-08 13:06:36,875][101941] Avg episode reward: [(0, '6.150'), (1, '7.550')] +[2023-10-08 13:06:36,951][102897] Updated weights for policy 0, policy_version 33500 (0.0007) +[2023-10-08 13:06:37,229][102898] Updated weights for policy 1, policy_version 33520 (0.0008) +[2023-10-08 13:06:37,597][102898] Updated weights for policy 1, policy_version 33530 (0.0009) +[2023-10-08 13:06:40,796][102897] Updated weights for policy 0, policy_version 33510 (0.0008) +[2023-10-08 13:06:41,160][102897] Updated weights for policy 0, policy_version 33520 (0.0008) +[2023-10-08 13:06:41,385][102898] Updated weights for policy 1, policy_version 33540 (0.0007) +[2023-10-08 13:06:41,530][102897] Updated weights for policy 0, policy_version 33530 (0.0007) +[2023-10-08 13:06:41,745][102898] Updated weights for policy 1, policy_version 33550 (0.0008) +[2023-10-08 13:06:41,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 68681728. Throughput: 0: 1789.6, 1: 1780.9. Samples: 17178648. Policy #0 lag: (min: 31.0, avg: 34.9, max: 63.0) +[2023-10-08 13:06:41,876][101941] Avg episode reward: [(0, '6.080'), (1, '7.270')] +[2023-10-08 13:06:42,114][102898] Updated weights for policy 1, policy_version 33560 (0.0008) +[2023-10-08 13:06:45,404][102897] Updated weights for policy 0, policy_version 33540 (0.0008) +[2023-10-08 13:06:45,789][102897] Updated weights for policy 0, policy_version 33550 (0.0010) +[2023-10-08 13:06:45,801][102898] Updated weights for policy 1, policy_version 33570 (0.0008) +[2023-10-08 13:06:46,157][102897] Updated weights for policy 0, policy_version 33560 (0.0007) +[2023-10-08 13:06:46,189][102898] Updated weights for policy 1, policy_version 33580 (0.0007) +[2023-10-08 13:06:46,559][102898] Updated weights for policy 1, policy_version 33590 (0.0008) +[2023-10-08 13:06:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68747264. Throughput: 0: 1763.2, 1: 1791.4. Samples: 17198488. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:06:46,876][101941] Avg episode reward: [(0, '6.030'), (1, '7.260')] +[2023-10-08 13:06:46,924][102898] Updated weights for policy 1, policy_version 33600 (0.0007) +[2023-10-08 13:06:49,839][102897] Updated weights for policy 0, policy_version 33570 (0.0009) +[2023-10-08 13:06:50,207][102897] Updated weights for policy 0, policy_version 33580 (0.0007) +[2023-10-08 13:06:50,576][102897] Updated weights for policy 0, policy_version 33590 (0.0008) +[2023-10-08 13:06:50,613][102898] Updated weights for policy 1, policy_version 33610 (0.0009) +[2023-10-08 13:06:50,952][102897] Updated weights for policy 0, policy_version 33600 (0.0008) +[2023-10-08 13:06:50,979][102898] Updated weights for policy 1, policy_version 33620 (0.0008) +[2023-10-08 13:06:51,346][102898] Updated weights for policy 1, policy_version 33630 (0.0009) +[2023-10-08 13:06:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 68845568. Throughput: 0: 1785.1, 1: 1779.6. Samples: 17210436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:06:51,876][101941] Avg episode reward: [(0, '6.260'), (1, '8.000')] +[2023-10-08 13:06:54,700][102897] Updated weights for policy 0, policy_version 33610 (0.0010) +[2023-10-08 13:06:55,069][102898] Updated weights for policy 1, policy_version 33640 (0.0007) +[2023-10-08 13:06:55,069][102897] Updated weights for policy 0, policy_version 33620 (0.0010) +[2023-10-08 13:06:55,435][102898] Updated weights for policy 1, policy_version 33650 (0.0009) +[2023-10-08 13:06:55,440][102897] Updated weights for policy 0, policy_version 33630 (0.0007) +[2023-10-08 13:06:55,803][102898] Updated weights for policy 1, policy_version 33660 (0.0009) +[2023-10-08 13:06:56,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 68911104. Throughput: 0: 1766.7, 1: 1791.0. Samples: 17230566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:06:56,876][101941] Avg episode reward: [(0, '6.790'), (1, '7.380')] +[2023-10-08 13:06:59,324][102897] Updated weights for policy 0, policy_version 33640 (0.0009) +[2023-10-08 13:06:59,695][102897] Updated weights for policy 0, policy_version 33650 (0.0008) +[2023-10-08 13:06:59,702][102898] Updated weights for policy 1, policy_version 33670 (0.0009) +[2023-10-08 13:07:00,063][102897] Updated weights for policy 0, policy_version 33660 (0.0007) +[2023-10-08 13:07:00,073][102898] Updated weights for policy 1, policy_version 33680 (0.0008) +[2023-10-08 13:07:00,446][102898] Updated weights for policy 1, policy_version 33690 (0.0008) +[2023-10-08 13:07:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 68976640. Throughput: 0: 1759.2, 1: 1774.3. Samples: 17251752. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:07:01,876][101941] Avg episode reward: [(0, '6.580'), (1, '6.900')] +[2023-10-08 13:07:04,040][102897] Updated weights for policy 0, policy_version 33670 (0.0009) +[2023-10-08 13:07:04,227][102898] Updated weights for policy 1, policy_version 33700 (0.0009) +[2023-10-08 13:07:04,417][102897] Updated weights for policy 0, policy_version 33680 (0.0009) +[2023-10-08 13:07:04,575][102898] Updated weights for policy 1, policy_version 33710 (0.0007) +[2023-10-08 13:07:04,786][102897] Updated weights for policy 0, policy_version 33690 (0.0009) +[2023-10-08 13:07:04,941][102898] Updated weights for policy 1, policy_version 33720 (0.0007) +[2023-10-08 13:07:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69042176. Throughput: 0: 1773.1, 1: 1799.7. Samples: 17263408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:07:06,875][101941] Avg episode reward: [(0, '6.700'), (1, '7.300')] +[2023-10-08 13:07:08,680][102898] Updated weights for policy 1, policy_version 33730 (0.0009) +[2023-10-08 13:07:08,799][102897] Updated weights for policy 0, policy_version 33700 (0.0009) +[2023-10-08 13:07:09,045][102898] Updated weights for policy 1, policy_version 33740 (0.0007) +[2023-10-08 13:07:09,170][102897] Updated weights for policy 0, policy_version 33710 (0.0009) +[2023-10-08 13:07:09,413][102898] Updated weights for policy 1, policy_version 33750 (0.0007) +[2023-10-08 13:07:09,534][102897] Updated weights for policy 0, policy_version 33720 (0.0007) +[2023-10-08 13:07:09,778][102898] Updated weights for policy 1, policy_version 33760 (0.0007) +[2023-10-08 13:07:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 69107712. Throughput: 0: 1755.7, 1: 1783.3. Samples: 17284044. Policy #0 lag: (min: 5.0, avg: 5.0, max: 9.0) +[2023-10-08 13:07:11,876][101941] Avg episode reward: [(0, '6.670'), (1, '7.920')] +[2023-10-08 13:07:13,312][102897] Updated weights for policy 0, policy_version 33730 (0.0009) +[2023-10-08 13:07:13,519][102898] Updated weights for policy 1, policy_version 33770 (0.0007) +[2023-10-08 13:07:13,671][102897] Updated weights for policy 0, policy_version 33740 (0.0007) +[2023-10-08 13:07:13,880][102898] Updated weights for policy 1, policy_version 33780 (0.0007) +[2023-10-08 13:07:14,047][102897] Updated weights for policy 0, policy_version 33750 (0.0007) +[2023-10-08 13:07:14,254][102898] Updated weights for policy 1, policy_version 33790 (0.0007) +[2023-10-08 13:07:14,416][102897] Updated weights for policy 0, policy_version 33760 (0.0008) +[2023-10-08 13:07:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 69173248. Throughput: 0: 1757.7, 1: 1782.4. Samples: 17306108. Policy #0 lag: (min: 5.0, avg: 5.0, max: 9.0) +[2023-10-08 13:07:16,876][101941] Avg episode reward: [(0, '6.140'), (1, '7.830')] +[2023-10-08 13:07:18,070][102898] Updated weights for policy 1, policy_version 33800 (0.0009) +[2023-10-08 13:07:18,247][102897] Updated weights for policy 0, policy_version 33770 (0.0007) +[2023-10-08 13:07:18,431][102898] Updated weights for policy 1, policy_version 33810 (0.0008) +[2023-10-08 13:07:18,615][102897] Updated weights for policy 0, policy_version 33780 (0.0009) +[2023-10-08 13:07:18,804][102898] Updated weights for policy 1, policy_version 33820 (0.0009) +[2023-10-08 13:07:18,980][102897] Updated weights for policy 0, policy_version 33790 (0.0008) +[2023-10-08 13:07:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69238784. Throughput: 0: 1755.7, 1: 1782.7. Samples: 17315700. Policy #0 lag: (min: 5.0, avg: 5.0, max: 9.0) +[2023-10-08 13:07:21,876][101941] Avg episode reward: [(0, '6.640'), (1, '7.470')] +[2023-10-08 13:07:22,701][102898] Updated weights for policy 1, policy_version 33830 (0.0008) +[2023-10-08 13:07:22,819][102897] Updated weights for policy 0, policy_version 33800 (0.0007) +[2023-10-08 13:07:23,071][102898] Updated weights for policy 1, policy_version 33840 (0.0007) +[2023-10-08 13:07:23,192][102897] Updated weights for policy 0, policy_version 33810 (0.0008) +[2023-10-08 13:07:23,429][102898] Updated weights for policy 1, policy_version 33850 (0.0008) +[2023-10-08 13:07:23,568][102897] Updated weights for policy 0, policy_version 33820 (0.0009) +[2023-10-08 13:07:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 69304320. Throughput: 0: 1759.9, 1: 1777.2. Samples: 17337818. Policy #0 lag: (min: 5.0, avg: 5.0, max: 9.0) +[2023-10-08 13:07:26,876][101941] Avg episode reward: [(0, '6.790'), (1, '7.220')] +[2023-10-08 13:07:27,244][102898] Updated weights for policy 1, policy_version 33860 (0.0009) +[2023-10-08 13:07:27,244][102897] Updated weights for policy 0, policy_version 33830 (0.0009) +[2023-10-08 13:07:27,599][102898] Updated weights for policy 1, policy_version 33870 (0.0007) +[2023-10-08 13:07:27,610][102897] Updated weights for policy 0, policy_version 33840 (0.0007) +[2023-10-08 13:07:27,962][102898] Updated weights for policy 1, policy_version 33880 (0.0007) +[2023-10-08 13:07:27,982][102897] Updated weights for policy 0, policy_version 33850 (0.0007) +[2023-10-08 13:07:31,837][102897] Updated weights for policy 0, policy_version 33860 (0.0009) +[2023-10-08 13:07:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69369856. Throughput: 0: 1792.3, 1: 1793.6. Samples: 17359852. Policy #0 lag: (min: 5.0, avg: 5.0, max: 9.0) +[2023-10-08 13:07:31,876][101941] Avg episode reward: [(0, '6.560'), (1, '6.720')] +[2023-10-08 13:07:31,923][102898] Updated weights for policy 1, policy_version 33890 (0.0009) +[2023-10-08 13:07:32,219][102897] Updated weights for policy 0, policy_version 33870 (0.0009) +[2023-10-08 13:07:32,307][102898] Updated weights for policy 1, policy_version 33900 (0.0008) +[2023-10-08 13:07:32,597][102897] Updated weights for policy 0, policy_version 33880 (0.0008) +[2023-10-08 13:07:32,679][102898] Updated weights for policy 1, policy_version 33910 (0.0007) +[2023-10-08 13:07:33,049][102898] Updated weights for policy 1, policy_version 33920 (0.0010) +[2023-10-08 13:07:36,285][102897] Updated weights for policy 0, policy_version 33890 (0.0007) +[2023-10-08 13:07:36,647][102898] Updated weights for policy 1, policy_version 33930 (0.0007) +[2023-10-08 13:07:36,652][102897] Updated weights for policy 0, policy_version 33900 (0.0007) +[2023-10-08 13:07:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69435392. Throughput: 0: 1757.5, 1: 1770.9. Samples: 17369214. Policy #0 lag: (min: 4.0, avg: 11.0, max: 36.0) +[2023-10-08 13:07:36,875][101941] Avg episode reward: [(0, '6.510'), (1, '7.020')] +[2023-10-08 13:07:37,010][102898] Updated weights for policy 1, policy_version 33940 (0.0007) +[2023-10-08 13:07:37,023][102897] Updated weights for policy 0, policy_version 33910 (0.0007) +[2023-10-08 13:07:37,382][102898] Updated weights for policy 1, policy_version 33950 (0.0008) +[2023-10-08 13:07:37,393][102897] Updated weights for policy 0, policy_version 33920 (0.0008) +[2023-10-08 13:07:41,154][102897] Updated weights for policy 0, policy_version 33930 (0.0010) +[2023-10-08 13:07:41,191][102898] Updated weights for policy 1, policy_version 33960 (0.0008) +[2023-10-08 13:07:41,533][102897] Updated weights for policy 0, policy_version 33940 (0.0008) +[2023-10-08 13:07:41,555][102898] Updated weights for policy 1, policy_version 33970 (0.0009) +[2023-10-08 13:07:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 14106.9). Total num frames: 69500928. Throughput: 0: 1791.9, 1: 1791.0. Samples: 17391796. Policy #0 lag: (min: 4.0, avg: 11.0, max: 36.0) +[2023-10-08 13:07:41,876][101941] Avg episode reward: [(0, '6.750'), (1, '7.130')] +[2023-10-08 13:07:41,907][102897] Updated weights for policy 0, policy_version 33950 (0.0009) +[2023-10-08 13:07:41,913][102898] Updated weights for policy 1, policy_version 33980 (0.0009) +[2023-10-08 13:07:45,685][102897] Updated weights for policy 0, policy_version 33960 (0.0010) +[2023-10-08 13:07:45,804][102898] Updated weights for policy 1, policy_version 33990 (0.0009) +[2023-10-08 13:07:46,054][102897] Updated weights for policy 0, policy_version 33970 (0.0008) +[2023-10-08 13:07:46,170][102898] Updated weights for policy 1, policy_version 34000 (0.0007) +[2023-10-08 13:07:46,434][102897] Updated weights for policy 0, policy_version 33980 (0.0007) +[2023-10-08 13:07:46,548][102898] Updated weights for policy 1, policy_version 34010 (0.0007) +[2023-10-08 13:07:46,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 69632000. Throughput: 0: 1772.2, 1: 1784.5. Samples: 17411804. Policy #0 lag: (min: 4.0, avg: 11.0, max: 36.0) +[2023-10-08 13:07:46,875][101941] Avg episode reward: [(0, '6.910'), (1, '6.810')] +[2023-10-08 13:07:50,273][102897] Updated weights for policy 0, policy_version 33990 (0.0007) +[2023-10-08 13:07:50,429][102898] Updated weights for policy 1, policy_version 34020 (0.0009) +[2023-10-08 13:07:50,642][102897] Updated weights for policy 0, policy_version 34000 (0.0007) +[2023-10-08 13:07:50,793][102898] Updated weights for policy 1, policy_version 34030 (0.0008) +[2023-10-08 13:07:51,004][102897] Updated weights for policy 0, policy_version 34010 (0.0007) +[2023-10-08 13:07:51,162][102898] Updated weights for policy 1, policy_version 34040 (0.0009) +[2023-10-08 13:07:51,875][101941] Fps is (10 sec: 19660.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69697536. Throughput: 0: 1782.3, 1: 1777.7. Samples: 17423610. Policy #0 lag: (min: 4.0, avg: 11.0, max: 36.0) +[2023-10-08 13:07:51,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.190')] +[2023-10-08 13:07:54,792][102897] Updated weights for policy 0, policy_version 34020 (0.0008) +[2023-10-08 13:07:54,942][102898] Updated weights for policy 1, policy_version 34050 (0.0011) +[2023-10-08 13:07:55,166][102897] Updated weights for policy 0, policy_version 34030 (0.0008) +[2023-10-08 13:07:55,312][102898] Updated weights for policy 1, policy_version 34060 (0.0007) +[2023-10-08 13:07:55,530][102897] Updated weights for policy 0, policy_version 34040 (0.0008) +[2023-10-08 13:07:55,681][102898] Updated weights for policy 1, policy_version 34070 (0.0008) +[2023-10-08 13:07:56,048][102898] Updated weights for policy 1, policy_version 34080 (0.0009) +[2023-10-08 13:07:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69763072. Throughput: 0: 1780.8, 1: 1780.1. Samples: 17444282. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:07:56,876][101941] Avg episode reward: [(0, '6.290'), (1, '7.230')] +[2023-10-08 13:07:59,249][102897] Updated weights for policy 0, policy_version 34050 (0.0009) +[2023-10-08 13:07:59,621][102897] Updated weights for policy 0, policy_version 34060 (0.0007) +[2023-10-08 13:07:59,847][102898] Updated weights for policy 1, policy_version 34090 (0.0007) +[2023-10-08 13:07:59,998][102897] Updated weights for policy 0, policy_version 34070 (0.0007) +[2023-10-08 13:08:00,219][102898] Updated weights for policy 1, policy_version 34100 (0.0007) +[2023-10-08 13:08:00,361][102897] Updated weights for policy 0, policy_version 34080 (0.0007) +[2023-10-08 13:08:00,583][102898] Updated weights for policy 1, policy_version 34110 (0.0009) +[2023-10-08 13:08:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69828608. Throughput: 0: 1771.5, 1: 1771.0. Samples: 17465520. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:01,876][101941] Avg episode reward: [(0, '6.540'), (1, '6.870')] +[2023-10-08 13:08:04,060][102897] Updated weights for policy 0, policy_version 34090 (0.0008) +[2023-10-08 13:08:04,375][102898] Updated weights for policy 1, policy_version 34120 (0.0009) +[2023-10-08 13:08:04,428][102897] Updated weights for policy 0, policy_version 34100 (0.0008) +[2023-10-08 13:08:04,751][102898] Updated weights for policy 1, policy_version 34130 (0.0008) +[2023-10-08 13:08:04,812][102897] Updated weights for policy 0, policy_version 34110 (0.0007) +[2023-10-08 13:08:05,110][102898] Updated weights for policy 1, policy_version 34140 (0.0007) +[2023-10-08 13:08:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69894144. Throughput: 0: 1785.6, 1: 1794.8. Samples: 17476814. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:06,875][101941] Avg episode reward: [(0, '6.860'), (1, '6.790')] +[2023-10-08 13:08:08,633][102897] Updated weights for policy 0, policy_version 34120 (0.0007) +[2023-10-08 13:08:08,829][102898] Updated weights for policy 1, policy_version 34150 (0.0009) +[2023-10-08 13:08:09,001][102897] Updated weights for policy 0, policy_version 34130 (0.0009) +[2023-10-08 13:08:09,199][102898] Updated weights for policy 1, policy_version 34160 (0.0008) +[2023-10-08 13:08:09,369][102897] Updated weights for policy 0, policy_version 34140 (0.0007) +[2023-10-08 13:08:09,562][102898] Updated weights for policy 1, policy_version 34170 (0.0008) +[2023-10-08 13:08:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 69959680. Throughput: 0: 1766.7, 1: 1774.8. Samples: 17497184. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:11,875][101941] Avg episode reward: [(0, '6.230'), (1, '6.870')] +[2023-10-08 13:08:13,151][102897] Updated weights for policy 0, policy_version 34150 (0.0009) +[2023-10-08 13:08:13,412][102898] Updated weights for policy 1, policy_version 34180 (0.0007) +[2023-10-08 13:08:13,516][102897] Updated weights for policy 0, policy_version 34160 (0.0009) +[2023-10-08 13:08:13,780][102898] Updated weights for policy 1, policy_version 34190 (0.0007) +[2023-10-08 13:08:13,885][102897] Updated weights for policy 0, policy_version 34170 (0.0008) +[2023-10-08 13:08:14,146][102898] Updated weights for policy 1, policy_version 34200 (0.0008) +[2023-10-08 13:08:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70025216. Throughput: 0: 1771.7, 1: 1773.9. Samples: 17519402. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:16,876][101941] Avg episode reward: [(0, '6.820'), (1, '6.830')] +[2023-10-08 13:08:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000034176_34996224.pth... +[2023-10-08 13:08:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000034208_35028992.pth... +[2023-10-08 13:08:16,914][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000032544_33325056.pth +[2023-10-08 13:08:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000032512_33292288.pth +[2023-10-08 13:08:17,837][102897] Updated weights for policy 0, policy_version 34180 (0.0008) +[2023-10-08 13:08:17,934][102898] Updated weights for policy 1, policy_version 34210 (0.0010) +[2023-10-08 13:08:18,231][102897] Updated weights for policy 0, policy_version 34190 (0.0008) +[2023-10-08 13:08:18,330][102898] Updated weights for policy 1, policy_version 34220 (0.0009) +[2023-10-08 13:08:18,597][102897] Updated weights for policy 0, policy_version 34200 (0.0008) +[2023-10-08 13:08:18,689][102898] Updated weights for policy 1, policy_version 34230 (0.0008) +[2023-10-08 13:08:19,053][102898] Updated weights for policy 1, policy_version 34240 (0.0009) +[2023-10-08 13:08:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 70090752. Throughput: 0: 1773.3, 1: 1774.6. Samples: 17528870. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:08:21,876][101941] Avg episode reward: [(0, '7.100'), (1, '7.460')] +[2023-10-08 13:08:22,328][102897] Updated weights for policy 0, policy_version 34210 (0.0008) +[2023-10-08 13:08:22,703][102897] Updated weights for policy 0, policy_version 34220 (0.0008) +[2023-10-08 13:08:23,023][102898] Updated weights for policy 1, policy_version 34250 (0.0008) +[2023-10-08 13:08:23,069][102897] Updated weights for policy 0, policy_version 34230 (0.0008) +[2023-10-08 13:08:23,381][102898] Updated weights for policy 1, policy_version 34260 (0.0007) +[2023-10-08 13:08:23,435][102897] Updated weights for policy 0, policy_version 34240 (0.0008) +[2023-10-08 13:08:23,747][102898] Updated weights for policy 1, policy_version 34270 (0.0010) +[2023-10-08 13:08:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70156288. Throughput: 0: 1770.2, 1: 1763.0. Samples: 17550788. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:08:26,876][101941] Avg episode reward: [(0, '6.920'), (1, '7.440')] +[2023-10-08 13:08:27,136][102897] Updated weights for policy 0, policy_version 34250 (0.0007) +[2023-10-08 13:08:27,512][102897] Updated weights for policy 0, policy_version 34260 (0.0007) +[2023-10-08 13:08:27,587][102898] Updated weights for policy 1, policy_version 34280 (0.0008) +[2023-10-08 13:08:27,880][102897] Updated weights for policy 0, policy_version 34270 (0.0007) +[2023-10-08 13:08:27,949][102898] Updated weights for policy 1, policy_version 34290 (0.0007) +[2023-10-08 13:08:28,316][102898] Updated weights for policy 1, policy_version 34300 (0.0010) +[2023-10-08 13:08:31,746][102897] Updated weights for policy 0, policy_version 34280 (0.0007) +[2023-10-08 13:08:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70221824. Throughput: 0: 1796.4, 1: 1793.5. Samples: 17573352. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:08:31,876][101941] Avg episode reward: [(0, '6.640'), (1, '7.720')] +[2023-10-08 13:08:32,039][102898] Updated weights for policy 1, policy_version 34310 (0.0007) +[2023-10-08 13:08:32,117][102897] Updated weights for policy 0, policy_version 34290 (0.0007) +[2023-10-08 13:08:32,400][102898] Updated weights for policy 1, policy_version 34320 (0.0007) +[2023-10-08 13:08:32,483][102897] Updated weights for policy 0, policy_version 34300 (0.0007) +[2023-10-08 13:08:32,768][102898] Updated weights for policy 1, policy_version 34330 (0.0007) +[2023-10-08 13:08:36,306][102897] Updated weights for policy 0, policy_version 34310 (0.0008) +[2023-10-08 13:08:36,524][102898] Updated weights for policy 1, policy_version 34340 (0.0008) +[2023-10-08 13:08:36,672][102897] Updated weights for policy 0, policy_version 34320 (0.0008) +[2023-10-08 13:08:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70287360. Throughput: 0: 1771.7, 1: 1773.5. Samples: 17583140. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:08:36,875][101941] Avg episode reward: [(0, '6.510'), (1, '8.080')] +[2023-10-08 13:08:36,894][102898] Updated weights for policy 1, policy_version 34350 (0.0007) +[2023-10-08 13:08:37,048][102897] Updated weights for policy 0, policy_version 34330 (0.0010) +[2023-10-08 13:08:37,269][102898] Updated weights for policy 1, policy_version 34360 (0.0007) +[2023-10-08 13:08:40,864][102897] Updated weights for policy 0, policy_version 34340 (0.0011) +[2023-10-08 13:08:41,045][102898] Updated weights for policy 1, policy_version 34370 (0.0007) +[2023-10-08 13:08:41,233][102897] Updated weights for policy 0, policy_version 34350 (0.0007) +[2023-10-08 13:08:41,411][102898] Updated weights for policy 1, policy_version 34380 (0.0007) +[2023-10-08 13:08:41,597][102897] Updated weights for policy 0, policy_version 34360 (0.0008) +[2023-10-08 13:08:41,774][102898] Updated weights for policy 1, policy_version 34390 (0.0007) +[2023-10-08 13:08:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 70352896. Throughput: 0: 1790.1, 1: 1790.0. Samples: 17605384. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:08:41,875][101941] Avg episode reward: [(0, '6.370'), (1, '7.120')] +[2023-10-08 13:08:42,144][102898] Updated weights for policy 1, policy_version 34400 (0.0007) +[2023-10-08 13:08:45,271][102897] Updated weights for policy 0, policy_version 34370 (0.0007) +[2023-10-08 13:08:45,635][102897] Updated weights for policy 0, policy_version 34380 (0.0009) +[2023-10-08 13:08:45,899][102898] Updated weights for policy 1, policy_version 34410 (0.0007) +[2023-10-08 13:08:46,011][102897] Updated weights for policy 0, policy_version 34390 (0.0009) +[2023-10-08 13:08:46,265][102898] Updated weights for policy 1, policy_version 34420 (0.0010) +[2023-10-08 13:08:46,374][102897] Updated weights for policy 0, policy_version 34400 (0.0007) +[2023-10-08 13:08:46,635][102898] Updated weights for policy 1, policy_version 34430 (0.0009) +[2023-10-08 13:08:46,875][101941] Fps is (10 sec: 19660.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 70483968. Throughput: 0: 1770.5, 1: 1780.0. Samples: 17625292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:46,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.110')] +[2023-10-08 13:08:50,207][102897] Updated weights for policy 0, policy_version 34410 (0.0009) +[2023-10-08 13:08:50,501][102898] Updated weights for policy 1, policy_version 34440 (0.0008) +[2023-10-08 13:08:50,579][102897] Updated weights for policy 0, policy_version 34420 (0.0007) +[2023-10-08 13:08:50,869][102898] Updated weights for policy 1, policy_version 34450 (0.0008) +[2023-10-08 13:08:50,949][102897] Updated weights for policy 0, policy_version 34430 (0.0008) +[2023-10-08 13:08:51,229][102898] Updated weights for policy 1, policy_version 34460 (0.0009) +[2023-10-08 13:08:51,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70549504. Throughput: 0: 1789.5, 1: 1777.2. Samples: 17637318. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:51,876][101941] Avg episode reward: [(0, '5.980'), (1, '7.140')] +[2023-10-08 13:08:54,808][102897] Updated weights for policy 0, policy_version 34440 (0.0008) +[2023-10-08 13:08:54,911][102898] Updated weights for policy 1, policy_version 34470 (0.0008) +[2023-10-08 13:08:55,180][102897] Updated weights for policy 0, policy_version 34450 (0.0008) +[2023-10-08 13:08:55,274][102898] Updated weights for policy 1, policy_version 34480 (0.0009) +[2023-10-08 13:08:55,546][102897] Updated weights for policy 0, policy_version 34460 (0.0009) +[2023-10-08 13:08:55,643][102898] Updated weights for policy 1, policy_version 34490 (0.0007) +[2023-10-08 13:08:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70615040. Throughput: 0: 1783.9, 1: 1786.8. Samples: 17657866. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:08:56,876][101941] Avg episode reward: [(0, '6.840'), (1, '6.700')] +[2023-10-08 13:08:59,378][102897] Updated weights for policy 0, policy_version 34470 (0.0008) +[2023-10-08 13:08:59,398][102898] Updated weights for policy 1, policy_version 34500 (0.0008) +[2023-10-08 13:08:59,753][102897] Updated weights for policy 0, policy_version 34480 (0.0007) +[2023-10-08 13:08:59,760][102898] Updated weights for policy 1, policy_version 34510 (0.0007) +[2023-10-08 13:09:00,115][102897] Updated weights for policy 0, policy_version 34490 (0.0007) +[2023-10-08 13:09:00,124][102898] Updated weights for policy 1, policy_version 34520 (0.0009) +[2023-10-08 13:09:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70680576. Throughput: 0: 1768.5, 1: 1772.9. Samples: 17678766. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:01,875][101941] Avg episode reward: [(0, '6.950'), (1, '6.640')] +[2023-10-08 13:09:04,010][102898] Updated weights for policy 1, policy_version 34530 (0.0009) +[2023-10-08 13:09:04,058][102897] Updated weights for policy 0, policy_version 34500 (0.0008) +[2023-10-08 13:09:04,395][102898] Updated weights for policy 1, policy_version 34540 (0.0009) +[2023-10-08 13:09:04,458][102897] Updated weights for policy 0, policy_version 34510 (0.0007) +[2023-10-08 13:09:04,757][102898] Updated weights for policy 1, policy_version 34550 (0.0008) +[2023-10-08 13:09:04,823][102897] Updated weights for policy 0, policy_version 34520 (0.0007) +[2023-10-08 13:09:05,128][102898] Updated weights for policy 1, policy_version 34560 (0.0007) +[2023-10-08 13:09:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 70746112. Throughput: 0: 1786.3, 1: 1792.3. Samples: 17689906. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:06,876][101941] Avg episode reward: [(0, '6.470'), (1, '7.530')] +[2023-10-08 13:09:08,602][102897] Updated weights for policy 0, policy_version 34530 (0.0007) +[2023-10-08 13:09:08,864][102898] Updated weights for policy 1, policy_version 34570 (0.0007) +[2023-10-08 13:09:08,970][102897] Updated weights for policy 0, policy_version 34540 (0.0009) +[2023-10-08 13:09:09,230][102898] Updated weights for policy 1, policy_version 34580 (0.0010) +[2023-10-08 13:09:09,343][102897] Updated weights for policy 0, policy_version 34550 (0.0007) +[2023-10-08 13:09:09,600][102898] Updated weights for policy 1, policy_version 34590 (0.0008) +[2023-10-08 13:09:09,713][102897] Updated weights for policy 0, policy_version 34560 (0.0008) +[2023-10-08 13:09:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 70811648. Throughput: 0: 1767.1, 1: 1779.5. Samples: 17710384. Policy #0 lag: (min: 17.0, avg: 27.9, max: 49.0) +[2023-10-08 13:09:11,876][101941] Avg episode reward: [(0, '6.550'), (1, '6.840')] +[2023-10-08 13:09:13,460][102897] Updated weights for policy 0, policy_version 34570 (0.0007) +[2023-10-08 13:09:13,468][102898] Updated weights for policy 1, policy_version 34600 (0.0007) +[2023-10-08 13:09:13,817][102897] Updated weights for policy 0, policy_version 34580 (0.0008) +[2023-10-08 13:09:13,821][102898] Updated weights for policy 1, policy_version 34610 (0.0009) +[2023-10-08 13:09:14,186][102897] Updated weights for policy 0, policy_version 34590 (0.0008) +[2023-10-08 13:09:14,189][102898] Updated weights for policy 1, policy_version 34620 (0.0008) +[2023-10-08 13:09:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70877184. Throughput: 0: 1766.0, 1: 1769.2. Samples: 17732434. Policy #0 lag: (min: 17.0, avg: 27.9, max: 49.0) +[2023-10-08 13:09:16,875][101941] Avg episode reward: [(0, '7.010'), (1, '7.330')] +[2023-10-08 13:09:17,986][102898] Updated weights for policy 1, policy_version 34630 (0.0007) +[2023-10-08 13:09:18,025][102897] Updated weights for policy 0, policy_version 34600 (0.0008) +[2023-10-08 13:09:18,350][102898] Updated weights for policy 1, policy_version 34640 (0.0007) +[2023-10-08 13:09:18,399][102897] Updated weights for policy 0, policy_version 34610 (0.0008) +[2023-10-08 13:09:18,708][102898] Updated weights for policy 1, policy_version 34650 (0.0007) +[2023-10-08 13:09:18,765][102897] Updated weights for policy 0, policy_version 34620 (0.0007) +[2023-10-08 13:09:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 70942720. Throughput: 0: 1763.0, 1: 1773.2. Samples: 17742270. Policy #0 lag: (min: 17.0, avg: 27.9, max: 49.0) +[2023-10-08 13:09:21,875][101941] Avg episode reward: [(0, '6.800'), (1, '8.450')] +[2023-10-08 13:09:21,876][102760] Saving new best policy, reward=8.450! +[2023-10-08 13:09:22,439][102898] Updated weights for policy 1, policy_version 34660 (0.0008) +[2023-10-08 13:09:22,642][102897] Updated weights for policy 0, policy_version 34630 (0.0007) +[2023-10-08 13:09:22,816][102898] Updated weights for policy 1, policy_version 34670 (0.0008) +[2023-10-08 13:09:23,010][102897] Updated weights for policy 0, policy_version 34640 (0.0007) +[2023-10-08 13:09:23,178][102898] Updated weights for policy 1, policy_version 34680 (0.0008) +[2023-10-08 13:09:23,381][102897] Updated weights for policy 0, policy_version 34650 (0.0007) +[2023-10-08 13:09:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71008256. Throughput: 0: 1763.0, 1: 1774.7. Samples: 17764580. Policy #0 lag: (min: 17.0, avg: 27.9, max: 49.0) +[2023-10-08 13:09:26,876][101941] Avg episode reward: [(0, '6.200'), (1, '8.510')] +[2023-10-08 13:09:27,022][102898] Updated weights for policy 1, policy_version 34690 (0.0007) +[2023-10-08 13:09:27,154][102897] Updated weights for policy 0, policy_version 34660 (0.0007) +[2023-10-08 13:09:27,391][102898] Updated weights for policy 1, policy_version 34700 (0.0007) +[2023-10-08 13:09:27,521][102897] Updated weights for policy 0, policy_version 34670 (0.0007) +[2023-10-08 13:09:27,760][102898] Updated weights for policy 1, policy_version 34710 (0.0007) +[2023-10-08 13:09:27,887][102897] Updated weights for policy 0, policy_version 34680 (0.0008) +[2023-10-08 13:09:28,124][102760] Saving new best policy, reward=8.510! +[2023-10-08 13:09:28,124][102898] Updated weights for policy 1, policy_version 34720 (0.0008) +[2023-10-08 13:09:31,678][102897] Updated weights for policy 0, policy_version 34690 (0.0008) +[2023-10-08 13:09:31,854][102898] Updated weights for policy 1, policy_version 34730 (0.0009) +[2023-10-08 13:09:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71073792. Throughput: 0: 1787.6, 1: 1796.7. Samples: 17786584. Policy #0 lag: (min: 17.0, avg: 27.9, max: 49.0) +[2023-10-08 13:09:31,876][101941] Avg episode reward: [(0, '6.270'), (1, '7.100')] +[2023-10-08 13:09:32,045][102897] Updated weights for policy 0, policy_version 34700 (0.0008) +[2023-10-08 13:09:32,218][102898] Updated weights for policy 1, policy_version 34740 (0.0009) +[2023-10-08 13:09:32,417][102897] Updated weights for policy 0, policy_version 34710 (0.0007) +[2023-10-08 13:09:32,588][102898] Updated weights for policy 1, policy_version 34750 (0.0008) +[2023-10-08 13:09:32,785][102897] Updated weights for policy 0, policy_version 34720 (0.0007) +[2023-10-08 13:09:36,417][102898] Updated weights for policy 1, policy_version 34760 (0.0007) +[2023-10-08 13:09:36,556][102897] Updated weights for policy 0, policy_version 34730 (0.0007) +[2023-10-08 13:09:36,778][102898] Updated weights for policy 1, policy_version 34770 (0.0007) +[2023-10-08 13:09:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71139328. Throughput: 0: 1756.8, 1: 1775.0. Samples: 17796250. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:36,875][101941] Avg episode reward: [(0, '6.160'), (1, '7.470')] +[2023-10-08 13:09:36,930][102897] Updated weights for policy 0, policy_version 34740 (0.0007) +[2023-10-08 13:09:37,150][102898] Updated weights for policy 1, policy_version 34780 (0.0007) +[2023-10-08 13:09:37,291][102897] Updated weights for policy 0, policy_version 34750 (0.0009) +[2023-10-08 13:09:40,872][102898] Updated weights for policy 1, policy_version 34790 (0.0008) +[2023-10-08 13:09:41,003][102897] Updated weights for policy 0, policy_version 34760 (0.0008) +[2023-10-08 13:09:41,236][102898] Updated weights for policy 1, policy_version 34800 (0.0008) +[2023-10-08 13:09:41,373][102897] Updated weights for policy 0, policy_version 34770 (0.0008) +[2023-10-08 13:09:41,609][102898] Updated weights for policy 1, policy_version 34810 (0.0008) +[2023-10-08 13:09:41,745][102897] Updated weights for policy 0, policy_version 34780 (0.0008) +[2023-10-08 13:09:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 71237632. Throughput: 0: 1784.8, 1: 1789.1. Samples: 17818690. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:41,876][101941] Avg episode reward: [(0, '6.570'), (1, '7.970')] +[2023-10-08 13:09:45,404][102898] Updated weights for policy 1, policy_version 34820 (0.0010) +[2023-10-08 13:09:45,618][102897] Updated weights for policy 0, policy_version 34790 (0.0008) +[2023-10-08 13:09:45,770][102898] Updated weights for policy 1, policy_version 34830 (0.0007) +[2023-10-08 13:09:45,999][102897] Updated weights for policy 0, policy_version 34800 (0.0008) +[2023-10-08 13:09:46,137][102898] Updated weights for policy 1, policy_version 34840 (0.0007) +[2023-10-08 13:09:46,362][102897] Updated weights for policy 0, policy_version 34810 (0.0007) +[2023-10-08 13:09:46,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71335936. Throughput: 0: 1768.6, 1: 1772.3. Samples: 17838110. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:46,876][101941] Avg episode reward: [(0, '6.140'), (1, '7.360')] +[2023-10-08 13:09:49,808][102898] Updated weights for policy 1, policy_version 34850 (0.0007) +[2023-10-08 13:09:50,211][102898] Updated weights for policy 1, policy_version 34860 (0.0008) +[2023-10-08 13:09:50,313][102897] Updated weights for policy 0, policy_version 34820 (0.0007) +[2023-10-08 13:09:50,578][102898] Updated weights for policy 1, policy_version 34870 (0.0008) +[2023-10-08 13:09:50,703][102897] Updated weights for policy 0, policy_version 34830 (0.0007) +[2023-10-08 13:09:50,942][102898] Updated weights for policy 1, policy_version 34880 (0.0009) +[2023-10-08 13:09:51,078][102897] Updated weights for policy 0, policy_version 34840 (0.0008) +[2023-10-08 13:09:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 71401472. Throughput: 0: 1774.3, 1: 1789.6. Samples: 17850280. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:51,876][101941] Avg episode reward: [(0, '6.770'), (1, '7.520')] +[2023-10-08 13:09:54,653][102898] Updated weights for policy 1, policy_version 34890 (0.0009) +[2023-10-08 13:09:54,831][102897] Updated weights for policy 0, policy_version 34850 (0.0010) +[2023-10-08 13:09:55,017][102898] Updated weights for policy 1, policy_version 34900 (0.0008) +[2023-10-08 13:09:55,210][102897] Updated weights for policy 0, policy_version 34860 (0.0008) +[2023-10-08 13:09:55,383][102898] Updated weights for policy 1, policy_version 34910 (0.0007) +[2023-10-08 13:09:55,577][102897] Updated weights for policy 0, policy_version 34870 (0.0008) +[2023-10-08 13:09:55,944][102897] Updated weights for policy 0, policy_version 34880 (0.0009) +[2023-10-08 13:09:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 71467008. Throughput: 0: 1777.5, 1: 1776.2. Samples: 17870300. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:09:56,876][101941] Avg episode reward: [(0, '6.540'), (1, '7.210')] +[2023-10-08 13:09:59,254][102898] Updated weights for policy 1, policy_version 34920 (0.0009) +[2023-10-08 13:09:59,614][102898] Updated weights for policy 1, policy_version 34930 (0.0007) +[2023-10-08 13:09:59,877][102897] Updated weights for policy 0, policy_version 34890 (0.0007) +[2023-10-08 13:09:59,981][102898] Updated weights for policy 1, policy_version 34940 (0.0007) +[2023-10-08 13:10:00,244][102897] Updated weights for policy 0, policy_version 34900 (0.0009) +[2023-10-08 13:10:00,612][102897] Updated weights for policy 0, policy_version 34910 (0.0009) +[2023-10-08 13:10:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71532544. Throughput: 0: 1759.5, 1: 1775.6. Samples: 17891512. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:10:01,876][101941] Avg episode reward: [(0, '6.450'), (1, '7.910')] +[2023-10-08 13:10:03,965][102898] Updated weights for policy 1, policy_version 34950 (0.0009) +[2023-10-08 13:10:04,090][102897] Updated weights for policy 0, policy_version 34920 (0.0009) +[2023-10-08 13:10:04,330][102898] Updated weights for policy 1, policy_version 34960 (0.0008) +[2023-10-08 13:10:04,458][102897] Updated weights for policy 0, policy_version 34930 (0.0009) +[2023-10-08 13:10:04,695][102898] Updated weights for policy 1, policy_version 34970 (0.0009) +[2023-10-08 13:10:04,826][102897] Updated weights for policy 0, policy_version 34940 (0.0007) +[2023-10-08 13:10:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71598080. Throughput: 0: 1784.7, 1: 1779.5. Samples: 17902660. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:10:06,876][101941] Avg episode reward: [(0, '6.290'), (1, '8.240')] +[2023-10-08 13:10:08,590][102898] Updated weights for policy 1, policy_version 34980 (0.0008) +[2023-10-08 13:10:08,788][102897] Updated weights for policy 0, policy_version 34950 (0.0008) +[2023-10-08 13:10:08,957][102898] Updated weights for policy 1, policy_version 34990 (0.0007) +[2023-10-08 13:10:09,165][102897] Updated weights for policy 0, policy_version 34960 (0.0009) +[2023-10-08 13:10:09,314][102898] Updated weights for policy 1, policy_version 35000 (0.0007) +[2023-10-08 13:10:09,534][102897] Updated weights for policy 0, policy_version 34970 (0.0009) +[2023-10-08 13:10:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 71663616. Throughput: 0: 1766.9, 1: 1766.8. Samples: 17923594. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:10:11,876][101941] Avg episode reward: [(0, '5.840'), (1, '8.170')] +[2023-10-08 13:10:13,084][102898] Updated weights for policy 1, policy_version 35010 (0.0007) +[2023-10-08 13:10:13,205][102897] Updated weights for policy 0, policy_version 34980 (0.0007) +[2023-10-08 13:10:13,448][102898] Updated weights for policy 1, policy_version 35020 (0.0009) +[2023-10-08 13:10:13,580][102897] Updated weights for policy 0, policy_version 34990 (0.0009) +[2023-10-08 13:10:13,808][102898] Updated weights for policy 1, policy_version 35030 (0.0007) +[2023-10-08 13:10:13,940][102897] Updated weights for policy 0, policy_version 35000 (0.0009) +[2023-10-08 13:10:14,186][102898] Updated weights for policy 1, policy_version 35040 (0.0008) +[2023-10-08 13:10:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71729152. Throughput: 0: 1775.9, 1: 1765.2. Samples: 17945936. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:10:16,876][101941] Avg episode reward: [(0, '6.520'), (1, '8.570')] +[2023-10-08 13:10:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000035008_35848192.pth... +[2023-10-08 13:10:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000035040_35880960.pth... +[2023-10-08 13:10:16,916][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000033344_34144256.pth +[2023-10-08 13:10:16,924][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000033376_34177024.pth +[2023-10-08 13:10:16,928][102760] Saving new best policy, reward=8.570! +[2023-10-08 13:10:17,764][102897] Updated weights for policy 0, policy_version 35010 (0.0008) +[2023-10-08 13:10:18,007][102898] Updated weights for policy 1, policy_version 35050 (0.0008) +[2023-10-08 13:10:18,142][102897] Updated weights for policy 0, policy_version 35020 (0.0007) +[2023-10-08 13:10:18,373][102898] Updated weights for policy 1, policy_version 35060 (0.0008) +[2023-10-08 13:10:18,508][102897] Updated weights for policy 0, policy_version 35030 (0.0009) +[2023-10-08 13:10:18,736][102898] Updated weights for policy 1, policy_version 35070 (0.0008) +[2023-10-08 13:10:18,881][102897] Updated weights for policy 0, policy_version 35040 (0.0009) +[2023-10-08 13:10:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 71794688. Throughput: 0: 1773.5, 1: 1764.8. Samples: 17955476. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:10:21,876][101941] Avg episode reward: [(0, '7.050'), (1, '8.060')] +[2023-10-08 13:10:22,611][102897] Updated weights for policy 0, policy_version 35050 (0.0007) +[2023-10-08 13:10:22,746][102898] Updated weights for policy 1, policy_version 35080 (0.0008) +[2023-10-08 13:10:22,975][102897] Updated weights for policy 0, policy_version 35060 (0.0007) +[2023-10-08 13:10:23,110][102898] Updated weights for policy 1, policy_version 35090 (0.0007) +[2023-10-08 13:10:23,339][102897] Updated weights for policy 0, policy_version 35070 (0.0009) +[2023-10-08 13:10:23,476][102898] Updated weights for policy 1, policy_version 35100 (0.0008) +[2023-10-08 13:10:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 71860224. Throughput: 0: 1768.1, 1: 1766.1. Samples: 17977728. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:10:26,876][101941] Avg episode reward: [(0, '7.330'), (1, '6.960')] +[2023-10-08 13:10:27,137][102898] Updated weights for policy 1, policy_version 35110 (0.0007) +[2023-10-08 13:10:27,185][102897] Updated weights for policy 0, policy_version 35080 (0.0007) +[2023-10-08 13:10:27,503][102898] Updated weights for policy 1, policy_version 35120 (0.0007) +[2023-10-08 13:10:27,554][102897] Updated weights for policy 0, policy_version 35090 (0.0008) +[2023-10-08 13:10:27,863][102898] Updated weights for policy 1, policy_version 35130 (0.0009) +[2023-10-08 13:10:27,919][102897] Updated weights for policy 0, policy_version 35100 (0.0008) +[2023-10-08 13:10:31,556][102898] Updated weights for policy 1, policy_version 35140 (0.0009) +[2023-10-08 13:10:31,759][102897] Updated weights for policy 0, policy_version 35110 (0.0007) +[2023-10-08 13:10:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 71925760. Throughput: 0: 1795.2, 1: 1796.7. Samples: 17999742. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:10:31,876][101941] Avg episode reward: [(0, '6.920'), (1, '7.590')] +[2023-10-08 13:10:31,922][102898] Updated weights for policy 1, policy_version 35150 (0.0007) +[2023-10-08 13:10:32,119][102897] Updated weights for policy 0, policy_version 35120 (0.0007) +[2023-10-08 13:10:32,283][102898] Updated weights for policy 1, policy_version 35160 (0.0009) +[2023-10-08 13:10:32,495][102897] Updated weights for policy 0, policy_version 35130 (0.0007) +[2023-10-08 13:10:36,148][102898] Updated weights for policy 1, policy_version 35170 (0.0009) +[2023-10-08 13:10:36,337][102897] Updated weights for policy 0, policy_version 35140 (0.0007) +[2023-10-08 13:10:36,568][102898] Updated weights for policy 1, policy_version 35180 (0.0008) +[2023-10-08 13:10:36,724][102897] Updated weights for policy 0, policy_version 35150 (0.0008) +[2023-10-08 13:10:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 71991296. Throughput: 0: 1771.9, 1: 1763.0. Samples: 18009350. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:10:36,875][101941] Avg episode reward: [(0, '6.090'), (1, '7.640')] +[2023-10-08 13:10:36,932][102898] Updated weights for policy 1, policy_version 35190 (0.0007) +[2023-10-08 13:10:37,089][102897] Updated weights for policy 0, policy_version 35160 (0.0007) +[2023-10-08 13:10:37,297][102898] Updated weights for policy 1, policy_version 35200 (0.0008) +[2023-10-08 13:10:40,685][102897] Updated weights for policy 0, policy_version 35170 (0.0007) +[2023-10-08 13:10:41,054][102897] Updated weights for policy 0, policy_version 35180 (0.0010) +[2023-10-08 13:10:41,198][102898] Updated weights for policy 1, policy_version 35210 (0.0008) +[2023-10-08 13:10:41,434][102897] Updated weights for policy 0, policy_version 35190 (0.0009) +[2023-10-08 13:10:41,559][102898] Updated weights for policy 1, policy_version 35220 (0.0009) +[2023-10-08 13:10:41,792][102897] Updated weights for policy 0, policy_version 35200 (0.0008) +[2023-10-08 13:10:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72089600. Throughput: 0: 1789.1, 1: 1793.0. Samples: 18031496. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:10:41,875][101941] Avg episode reward: [(0, '6.400'), (1, '7.020')] +[2023-10-08 13:10:41,935][102898] Updated weights for policy 1, policy_version 35230 (0.0010) +[2023-10-08 13:10:45,537][102897] Updated weights for policy 0, policy_version 35210 (0.0007) +[2023-10-08 13:10:45,731][102898] Updated weights for policy 1, policy_version 35240 (0.0009) +[2023-10-08 13:10:45,902][102897] Updated weights for policy 0, policy_version 35220 (0.0007) +[2023-10-08 13:10:46,098][102898] Updated weights for policy 1, policy_version 35250 (0.0008) +[2023-10-08 13:10:46,275][102897] Updated weights for policy 0, policy_version 35230 (0.0008) +[2023-10-08 13:10:46,460][102898] Updated weights for policy 1, policy_version 35260 (0.0010) +[2023-10-08 13:10:46,875][101941] Fps is (10 sec: 19660.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72187904. Throughput: 0: 1775.7, 1: 1770.7. Samples: 18051102. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:10:46,876][101941] Avg episode reward: [(0, '6.880'), (1, '7.290')] +[2023-10-08 13:10:50,084][102897] Updated weights for policy 0, policy_version 35240 (0.0008) +[2023-10-08 13:10:50,130][102898] Updated weights for policy 1, policy_version 35270 (0.0008) +[2023-10-08 13:10:50,466][102897] Updated weights for policy 0, policy_version 35250 (0.0008) +[2023-10-08 13:10:50,504][102898] Updated weights for policy 1, policy_version 35280 (0.0007) +[2023-10-08 13:10:50,824][102897] Updated weights for policy 0, policy_version 35260 (0.0009) +[2023-10-08 13:10:50,861][102898] Updated weights for policy 1, policy_version 35290 (0.0009) +[2023-10-08 13:10:51,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 72253440. Throughput: 0: 1778.8, 1: 1791.6. Samples: 18063326. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:10:51,876][101941] Avg episode reward: [(0, '7.650'), (1, '7.200')] +[2023-10-08 13:10:54,515][102897] Updated weights for policy 0, policy_version 35270 (0.0008) +[2023-10-08 13:10:54,717][102898] Updated weights for policy 1, policy_version 35300 (0.0008) +[2023-10-08 13:10:54,885][102897] Updated weights for policy 0, policy_version 35280 (0.0007) +[2023-10-08 13:10:55,081][102898] Updated weights for policy 1, policy_version 35310 (0.0008) +[2023-10-08 13:10:55,262][102897] Updated weights for policy 0, policy_version 35290 (0.0008) +[2023-10-08 13:10:55,451][102898] Updated weights for policy 1, policy_version 35320 (0.0007) +[2023-10-08 13:10:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72318976. Throughput: 0: 1777.7, 1: 1774.7. Samples: 18083452. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:10:56,876][101941] Avg episode reward: [(0, '7.210'), (1, '7.180')] +[2023-10-08 13:10:59,001][102897] Updated weights for policy 0, policy_version 35300 (0.0009) +[2023-10-08 13:10:59,282][102898] Updated weights for policy 1, policy_version 35330 (0.0007) +[2023-10-08 13:10:59,379][102897] Updated weights for policy 0, policy_version 35310 (0.0008) +[2023-10-08 13:10:59,656][102898] Updated weights for policy 1, policy_version 35340 (0.0007) +[2023-10-08 13:10:59,751][102897] Updated weights for policy 0, policy_version 35320 (0.0007) +[2023-10-08 13:11:00,011][102898] Updated weights for policy 1, policy_version 35350 (0.0008) +[2023-10-08 13:11:00,374][102898] Updated weights for policy 1, policy_version 35360 (0.0010) +[2023-10-08 13:11:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 72384512. Throughput: 0: 1768.5, 1: 1764.8. Samples: 18104938. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:11:01,876][101941] Avg episode reward: [(0, '6.100'), (1, '7.310')] +[2023-10-08 13:11:03,672][102897] Updated weights for policy 0, policy_version 35330 (0.0008) +[2023-10-08 13:11:04,040][102897] Updated weights for policy 0, policy_version 35340 (0.0008) +[2023-10-08 13:11:04,069][102898] Updated weights for policy 1, policy_version 35370 (0.0007) +[2023-10-08 13:11:04,401][102897] Updated weights for policy 0, policy_version 35350 (0.0009) +[2023-10-08 13:11:04,426][102898] Updated weights for policy 1, policy_version 35380 (0.0007) +[2023-10-08 13:11:04,768][102897] Updated weights for policy 0, policy_version 35360 (0.0007) +[2023-10-08 13:11:04,793][102898] Updated weights for policy 1, policy_version 35390 (0.0008) +[2023-10-08 13:11:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72450048. Throughput: 0: 1781.1, 1: 1784.0. Samples: 18115904. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:11:06,876][101941] Avg episode reward: [(0, '6.540'), (1, '7.530')] +[2023-10-08 13:11:08,473][102898] Updated weights for policy 1, policy_version 35400 (0.0007) +[2023-10-08 13:11:08,669][102897] Updated weights for policy 0, policy_version 35370 (0.0009) +[2023-10-08 13:11:08,836][102898] Updated weights for policy 1, policy_version 35410 (0.0008) +[2023-10-08 13:11:09,042][102897] Updated weights for policy 0, policy_version 35380 (0.0009) +[2023-10-08 13:11:09,209][102898] Updated weights for policy 1, policy_version 35420 (0.0009) +[2023-10-08 13:11:09,411][102897] Updated weights for policy 0, policy_version 35390 (0.0008) +[2023-10-08 13:11:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72515584. Throughput: 0: 1769.8, 1: 1775.1. Samples: 18137248. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:11:11,876][101941] Avg episode reward: [(0, '7.010'), (1, '8.220')] +[2023-10-08 13:11:12,962][102898] Updated weights for policy 1, policy_version 35430 (0.0008) +[2023-10-08 13:11:13,173][102897] Updated weights for policy 0, policy_version 35400 (0.0009) +[2023-10-08 13:11:13,332][102898] Updated weights for policy 1, policy_version 35440 (0.0007) +[2023-10-08 13:11:13,535][102897] Updated weights for policy 0, policy_version 35410 (0.0008) +[2023-10-08 13:11:13,704][102898] Updated weights for policy 1, policy_version 35450 (0.0007) +[2023-10-08 13:11:13,900][102897] Updated weights for policy 0, policy_version 35420 (0.0009) +[2023-10-08 13:11:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 72581120. Throughput: 0: 1772.7, 1: 1776.9. Samples: 18159474. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:11:16,876][101941] Avg episode reward: [(0, '6.400'), (1, '8.180')] +[2023-10-08 13:11:17,488][102898] Updated weights for policy 1, policy_version 35460 (0.0008) +[2023-10-08 13:11:17,652][102897] Updated weights for policy 0, policy_version 35430 (0.0009) +[2023-10-08 13:11:17,857][102898] Updated weights for policy 1, policy_version 35470 (0.0008) +[2023-10-08 13:11:18,022][102897] Updated weights for policy 0, policy_version 35440 (0.0008) +[2023-10-08 13:11:18,215][102898] Updated weights for policy 1, policy_version 35480 (0.0009) +[2023-10-08 13:11:18,391][102897] Updated weights for policy 0, policy_version 35450 (0.0008) +[2023-10-08 13:11:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 72646656. Throughput: 0: 1775.2, 1: 1775.2. Samples: 18169122. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:11:21,876][101941] Avg episode reward: [(0, '5.720'), (1, '7.800')] +[2023-10-08 13:11:21,929][102898] Updated weights for policy 1, policy_version 35490 (0.0009) +[2023-10-08 13:11:22,306][102898] Updated weights for policy 1, policy_version 35500 (0.0007) +[2023-10-08 13:11:22,318][102897] Updated weights for policy 0, policy_version 35460 (0.0007) +[2023-10-08 13:11:22,668][102898] Updated weights for policy 1, policy_version 35510 (0.0009) +[2023-10-08 13:11:22,698][102897] Updated weights for policy 0, policy_version 35470 (0.0008) +[2023-10-08 13:11:23,023][102898] Updated weights for policy 1, policy_version 35520 (0.0009) +[2023-10-08 13:11:23,075][102897] Updated weights for policy 0, policy_version 35480 (0.0008) +[2023-10-08 13:11:26,714][102897] Updated weights for policy 0, policy_version 35490 (0.0010) +[2023-10-08 13:11:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72712192. Throughput: 0: 1771.9, 1: 1776.7. Samples: 18191182. Policy #0 lag: (min: 13.0, avg: 23.8, max: 45.0) +[2023-10-08 13:11:26,876][101941] Avg episode reward: [(0, '6.280'), (1, '7.540')] +[2023-10-08 13:11:27,045][102898] Updated weights for policy 1, policy_version 35530 (0.0008) +[2023-10-08 13:11:27,083][102897] Updated weights for policy 0, policy_version 35500 (0.0008) +[2023-10-08 13:11:27,416][102898] Updated weights for policy 1, policy_version 35540 (0.0007) +[2023-10-08 13:11:27,461][102897] Updated weights for policy 0, policy_version 35510 (0.0009) +[2023-10-08 13:11:27,789][102898] Updated weights for policy 1, policy_version 35550 (0.0009) +[2023-10-08 13:11:27,827][102897] Updated weights for policy 0, policy_version 35520 (0.0009) +[2023-10-08 13:11:31,708][102898] Updated weights for policy 1, policy_version 35560 (0.0008) +[2023-10-08 13:11:31,821][102897] Updated weights for policy 0, policy_version 35530 (0.0007) +[2023-10-08 13:11:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 72777728. Throughput: 0: 1798.0, 1: 1800.5. Samples: 18213032. Policy #0 lag: (min: 13.0, avg: 23.8, max: 45.0) +[2023-10-08 13:11:31,875][101941] Avg episode reward: [(0, '6.670'), (1, '7.790')] +[2023-10-08 13:11:32,064][102898] Updated weights for policy 1, policy_version 35570 (0.0008) +[2023-10-08 13:11:32,185][102897] Updated weights for policy 0, policy_version 35540 (0.0007) +[2023-10-08 13:11:32,430][102898] Updated weights for policy 1, policy_version 35580 (0.0007) +[2023-10-08 13:11:32,559][102897] Updated weights for policy 0, policy_version 35550 (0.0008) +[2023-10-08 13:11:36,313][102898] Updated weights for policy 1, policy_version 35590 (0.0008) +[2023-10-08 13:11:36,450][102897] Updated weights for policy 0, policy_version 35560 (0.0007) +[2023-10-08 13:11:36,687][102898] Updated weights for policy 1, policy_version 35600 (0.0009) +[2023-10-08 13:11:36,811][102897] Updated weights for policy 0, policy_version 35570 (0.0008) +[2023-10-08 13:11:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 72843264. Throughput: 0: 1771.0, 1: 1773.4. Samples: 18222824. Policy #0 lag: (min: 13.0, avg: 23.8, max: 45.0) +[2023-10-08 13:11:36,876][101941] Avg episode reward: [(0, '6.020'), (1, '7.660')] +[2023-10-08 13:11:37,057][102898] Updated weights for policy 1, policy_version 35610 (0.0007) +[2023-10-08 13:11:37,185][102897] Updated weights for policy 0, policy_version 35580 (0.0007) +[2023-10-08 13:11:40,774][102897] Updated weights for policy 0, policy_version 35590 (0.0007) +[2023-10-08 13:11:40,854][102898] Updated weights for policy 1, policy_version 35620 (0.0007) +[2023-10-08 13:11:41,160][102897] Updated weights for policy 0, policy_version 35600 (0.0008) +[2023-10-08 13:11:41,223][102898] Updated weights for policy 1, policy_version 35630 (0.0008) +[2023-10-08 13:11:41,534][102897] Updated weights for policy 0, policy_version 35610 (0.0008) +[2023-10-08 13:11:41,582][102898] Updated weights for policy 1, policy_version 35640 (0.0007) +[2023-10-08 13:11:41,878][101941] Fps is (10 sec: 19654.2, 60 sec: 14744.8, 300 sec: 14328.9). Total num frames: 72974336. Throughput: 0: 1793.9, 1: 1800.4. Samples: 18245204. Policy #0 lag: (min: 13.0, avg: 23.8, max: 45.0) +[2023-10-08 13:11:41,880][101941] Avg episode reward: [(0, '5.970'), (1, '7.450')] +[2023-10-08 13:11:45,152][102897] Updated weights for policy 0, policy_version 35620 (0.0007) +[2023-10-08 13:11:45,224][102898] Updated weights for policy 1, policy_version 35650 (0.0009) +[2023-10-08 13:11:45,521][102897] Updated weights for policy 0, policy_version 35630 (0.0008) +[2023-10-08 13:11:45,593][102898] Updated weights for policy 1, policy_version 35660 (0.0008) +[2023-10-08 13:11:45,891][102897] Updated weights for policy 0, policy_version 35640 (0.0008) +[2023-10-08 13:11:45,947][102898] Updated weights for policy 1, policy_version 35670 (0.0007) +[2023-10-08 13:11:46,316][102898] Updated weights for policy 1, policy_version 35680 (0.0007) +[2023-10-08 13:11:46,875][101941] Fps is (10 sec: 19661.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73039872. Throughput: 0: 1771.6, 1: 1780.9. Samples: 18264798. Policy #0 lag: (min: 13.0, avg: 23.8, max: 45.0) +[2023-10-08 13:11:46,875][101941] Avg episode reward: [(0, '6.060'), (1, '7.450')] +[2023-10-08 13:11:49,616][102897] Updated weights for policy 0, policy_version 35650 (0.0008) +[2023-10-08 13:11:49,993][102897] Updated weights for policy 0, policy_version 35660 (0.0008) +[2023-10-08 13:11:50,131][102898] Updated weights for policy 1, policy_version 35690 (0.0007) +[2023-10-08 13:11:50,369][102897] Updated weights for policy 0, policy_version 35670 (0.0008) +[2023-10-08 13:11:50,494][102898] Updated weights for policy 1, policy_version 35700 (0.0008) +[2023-10-08 13:11:50,748][102897] Updated weights for policy 0, policy_version 35680 (0.0009) +[2023-10-08 13:11:50,860][102898] Updated weights for policy 1, policy_version 35710 (0.0009) +[2023-10-08 13:11:51,875][101941] Fps is (10 sec: 13111.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73105408. Throughput: 0: 1795.0, 1: 1795.2. Samples: 18277460. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:11:51,876][101941] Avg episode reward: [(0, '6.750'), (1, '7.480')] +[2023-10-08 13:11:54,350][102897] Updated weights for policy 0, policy_version 35690 (0.0010) +[2023-10-08 13:11:54,718][102897] Updated weights for policy 0, policy_version 35700 (0.0009) +[2023-10-08 13:11:54,801][102898] Updated weights for policy 1, policy_version 35720 (0.0008) +[2023-10-08 13:11:55,096][102897] Updated weights for policy 0, policy_version 35710 (0.0008) +[2023-10-08 13:11:55,170][102898] Updated weights for policy 1, policy_version 35730 (0.0008) +[2023-10-08 13:11:55,528][102898] Updated weights for policy 1, policy_version 35740 (0.0007) +[2023-10-08 13:11:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73170944. Throughput: 0: 1779.3, 1: 1772.6. Samples: 18297082. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:11:56,876][101941] Avg episode reward: [(0, '6.900'), (1, '7.490')] +[2023-10-08 13:11:58,940][102897] Updated weights for policy 0, policy_version 35720 (0.0007) +[2023-10-08 13:11:59,211][102898] Updated weights for policy 1, policy_version 35750 (0.0009) +[2023-10-08 13:11:59,312][102897] Updated weights for policy 0, policy_version 35730 (0.0007) +[2023-10-08 13:11:59,576][102898] Updated weights for policy 1, policy_version 35760 (0.0008) +[2023-10-08 13:11:59,675][102897] Updated weights for policy 0, policy_version 35740 (0.0008) +[2023-10-08 13:11:59,944][102898] Updated weights for policy 1, policy_version 35770 (0.0007) +[2023-10-08 13:12:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73236480. Throughput: 0: 1784.2, 1: 1764.4. Samples: 18319160. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:12:01,876][101941] Avg episode reward: [(0, '6.700'), (1, '8.230')] +[2023-10-08 13:12:03,484][102897] Updated weights for policy 0, policy_version 35750 (0.0008) +[2023-10-08 13:12:03,744][102898] Updated weights for policy 1, policy_version 35780 (0.0008) +[2023-10-08 13:12:03,855][102897] Updated weights for policy 0, policy_version 35760 (0.0007) +[2023-10-08 13:12:04,109][102898] Updated weights for policy 1, policy_version 35790 (0.0008) +[2023-10-08 13:12:04,235][102897] Updated weights for policy 0, policy_version 35770 (0.0007) +[2023-10-08 13:12:04,477][102898] Updated weights for policy 1, policy_version 35800 (0.0007) +[2023-10-08 13:12:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73302016. Throughput: 0: 1788.5, 1: 1779.0. Samples: 18329662. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:12:06,876][101941] Avg episode reward: [(0, '7.100'), (1, '7.800')] +[2023-10-08 13:12:08,044][102897] Updated weights for policy 0, policy_version 35780 (0.0008) +[2023-10-08 13:12:08,308][102898] Updated weights for policy 1, policy_version 35810 (0.0007) +[2023-10-08 13:12:08,416][102897] Updated weights for policy 0, policy_version 35790 (0.0009) +[2023-10-08 13:12:08,708][102898] Updated weights for policy 1, policy_version 35820 (0.0007) +[2023-10-08 13:12:08,792][102897] Updated weights for policy 0, policy_version 35800 (0.0008) +[2023-10-08 13:12:09,075][102898] Updated weights for policy 1, policy_version 35830 (0.0007) +[2023-10-08 13:12:09,443][102898] Updated weights for policy 1, policy_version 35840 (0.0007) +[2023-10-08 13:12:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73367552. Throughput: 0: 1786.1, 1: 1768.8. Samples: 18351152. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:12:11,875][101941] Avg episode reward: [(0, '6.610'), (1, '6.950')] +[2023-10-08 13:12:12,523][102897] Updated weights for policy 0, policy_version 35810 (0.0007) +[2023-10-08 13:12:12,886][102897] Updated weights for policy 0, policy_version 35820 (0.0008) +[2023-10-08 13:12:13,240][102898] Updated weights for policy 1, policy_version 35850 (0.0007) +[2023-10-08 13:12:13,251][102897] Updated weights for policy 0, policy_version 35830 (0.0007) +[2023-10-08 13:12:13,602][102898] Updated weights for policy 1, policy_version 35860 (0.0008) +[2023-10-08 13:12:13,623][102897] Updated weights for policy 0, policy_version 35840 (0.0007) +[2023-10-08 13:12:13,967][102898] Updated weights for policy 1, policy_version 35870 (0.0010) +[2023-10-08 13:12:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73433088. Throughput: 0: 1795.0, 1: 1771.6. Samples: 18373526. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:12:16,875][101941] Avg episode reward: [(0, '6.410'), (1, '7.800')] +[2023-10-08 13:12:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000035872_36732928.pth... +[2023-10-08 13:12:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000035840_36700160.pth... +[2023-10-08 13:12:16,920][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000034208_35028992.pth +[2023-10-08 13:12:16,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000034176_34996224.pth +[2023-10-08 13:12:17,455][102897] Updated weights for policy 0, policy_version 35850 (0.0010) +[2023-10-08 13:12:17,760][102898] Updated weights for policy 1, policy_version 35880 (0.0008) +[2023-10-08 13:12:17,826][102897] Updated weights for policy 0, policy_version 35860 (0.0007) +[2023-10-08 13:12:18,120][102898] Updated weights for policy 1, policy_version 35890 (0.0008) +[2023-10-08 13:12:18,199][102897] Updated weights for policy 0, policy_version 35870 (0.0008) +[2023-10-08 13:12:18,486][102898] Updated weights for policy 1, policy_version 35900 (0.0008) +[2023-10-08 13:12:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73498624. Throughput: 0: 1792.8, 1: 1769.4. Samples: 18383126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:12:21,876][101941] Avg episode reward: [(0, '6.510'), (1, '8.120')] +[2023-10-08 13:12:21,923][102897] Updated weights for policy 0, policy_version 35880 (0.0008) +[2023-10-08 13:12:22,264][102898] Updated weights for policy 1, policy_version 35910 (0.0008) +[2023-10-08 13:12:22,287][102897] Updated weights for policy 0, policy_version 35890 (0.0007) +[2023-10-08 13:12:22,631][102898] Updated weights for policy 1, policy_version 35920 (0.0008) +[2023-10-08 13:12:22,664][102897] Updated weights for policy 0, policy_version 35900 (0.0009) +[2023-10-08 13:12:22,986][102898] Updated weights for policy 1, policy_version 35930 (0.0007) +[2023-10-08 13:12:26,604][102897] Updated weights for policy 0, policy_version 35910 (0.0009) +[2023-10-08 13:12:26,754][102898] Updated weights for policy 1, policy_version 35940 (0.0008) +[2023-10-08 13:12:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73564160. Throughput: 0: 1787.6, 1: 1767.6. Samples: 18405174. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:12:26,876][101941] Avg episode reward: [(0, '6.050'), (1, '7.910')] +[2023-10-08 13:12:26,980][102897] Updated weights for policy 0, policy_version 35920 (0.0009) +[2023-10-08 13:12:27,120][102898] Updated weights for policy 1, policy_version 35950 (0.0008) +[2023-10-08 13:12:27,350][102897] Updated weights for policy 0, policy_version 35930 (0.0008) +[2023-10-08 13:12:27,478][102898] Updated weights for policy 1, policy_version 35960 (0.0007) +[2023-10-08 13:12:31,274][102897] Updated weights for policy 0, policy_version 35940 (0.0008) +[2023-10-08 13:12:31,315][102898] Updated weights for policy 1, policy_version 35970 (0.0007) +[2023-10-08 13:12:31,646][102897] Updated weights for policy 0, policy_version 35950 (0.0008) +[2023-10-08 13:12:31,690][102898] Updated weights for policy 1, policy_version 35980 (0.0008) +[2023-10-08 13:12:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73629696. Throughput: 0: 1804.0, 1: 1792.3. Samples: 18426628. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:12:31,876][101941] Avg episode reward: [(0, '5.720'), (1, '8.200')] +[2023-10-08 13:12:32,015][102897] Updated weights for policy 0, policy_version 35960 (0.0007) +[2023-10-08 13:12:32,044][102898] Updated weights for policy 1, policy_version 35990 (0.0007) +[2023-10-08 13:12:32,418][102898] Updated weights for policy 1, policy_version 36000 (0.0008) +[2023-10-08 13:12:35,545][102897] Updated weights for policy 0, policy_version 35970 (0.0008) +[2023-10-08 13:12:35,920][102897] Updated weights for policy 0, policy_version 35980 (0.0007) +[2023-10-08 13:12:36,122][102898] Updated weights for policy 1, policy_version 36010 (0.0007) +[2023-10-08 13:12:36,290][102897] Updated weights for policy 0, policy_version 35990 (0.0007) +[2023-10-08 13:12:36,487][102898] Updated weights for policy 1, policy_version 36020 (0.0007) +[2023-10-08 13:12:36,666][102897] Updated weights for policy 0, policy_version 36000 (0.0007) +[2023-10-08 13:12:36,861][102898] Updated weights for policy 1, policy_version 36030 (0.0009) +[2023-10-08 13:12:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 73728000. Throughput: 0: 1780.1, 1: 1764.1. Samples: 18436952. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:12:36,875][101941] Avg episode reward: [(0, '6.370'), (1, '7.870')] +[2023-10-08 13:12:40,319][102897] Updated weights for policy 0, policy_version 36010 (0.0009) +[2023-10-08 13:12:40,692][102897] Updated weights for policy 0, policy_version 36020 (0.0007) +[2023-10-08 13:12:40,887][102898] Updated weights for policy 1, policy_version 36040 (0.0009) +[2023-10-08 13:12:41,065][102897] Updated weights for policy 0, policy_version 36030 (0.0008) +[2023-10-08 13:12:41,251][102898] Updated weights for policy 1, policy_version 36050 (0.0009) +[2023-10-08 13:12:41,623][102898] Updated weights for policy 1, policy_version 36060 (0.0009) +[2023-10-08 13:12:41,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14200.3, 300 sec: 14218.0). Total num frames: 73826304. Throughput: 0: 1800.8, 1: 1791.0. Samples: 18458712. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:12:41,875][101941] Avg episode reward: [(0, '6.560'), (1, '7.300')] +[2023-10-08 13:12:44,820][102897] Updated weights for policy 0, policy_version 36040 (0.0009) +[2023-10-08 13:12:45,199][102897] Updated weights for policy 0, policy_version 36050 (0.0007) +[2023-10-08 13:12:45,289][102898] Updated weights for policy 1, policy_version 36070 (0.0007) +[2023-10-08 13:12:45,566][102897] Updated weights for policy 0, policy_version 36060 (0.0011) +[2023-10-08 13:12:45,664][102898] Updated weights for policy 1, policy_version 36080 (0.0009) +[2023-10-08 13:12:46,018][102898] Updated weights for policy 1, policy_version 36090 (0.0007) +[2023-10-08 13:12:46,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 73891840. Throughput: 0: 1775.9, 1: 1768.9. Samples: 18478674. Policy #0 lag: (min: 23.0, avg: 27.3, max: 55.0) +[2023-10-08 13:12:46,876][101941] Avg episode reward: [(0, '6.910'), (1, '7.570')] +[2023-10-08 13:12:49,403][102897] Updated weights for policy 0, policy_version 36070 (0.0007) +[2023-10-08 13:12:49,782][102897] Updated weights for policy 0, policy_version 36080 (0.0008) +[2023-10-08 13:12:49,879][102898] Updated weights for policy 1, policy_version 36100 (0.0008) +[2023-10-08 13:12:50,151][102897] Updated weights for policy 0, policy_version 36090 (0.0008) +[2023-10-08 13:12:50,238][102898] Updated weights for policy 1, policy_version 36110 (0.0008) +[2023-10-08 13:12:50,606][102898] Updated weights for policy 1, policy_version 36120 (0.0009) +[2023-10-08 13:12:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 73957376. Throughput: 0: 1795.3, 1: 1787.8. Samples: 18490900. Policy #0 lag: (min: 23.0, avg: 27.3, max: 55.0) +[2023-10-08 13:12:51,876][101941] Avg episode reward: [(0, '5.820'), (1, '8.000')] +[2023-10-08 13:12:53,894][102897] Updated weights for policy 0, policy_version 36100 (0.0008) +[2023-10-08 13:12:54,262][102897] Updated weights for policy 0, policy_version 36110 (0.0009) +[2023-10-08 13:12:54,369][102898] Updated weights for policy 1, policy_version 36130 (0.0008) +[2023-10-08 13:12:54,638][102897] Updated weights for policy 0, policy_version 36120 (0.0007) +[2023-10-08 13:12:54,766][102898] Updated weights for policy 1, policy_version 36140 (0.0007) +[2023-10-08 13:12:55,135][102898] Updated weights for policy 1, policy_version 36150 (0.0009) +[2023-10-08 13:12:55,499][102898] Updated weights for policy 1, policy_version 36160 (0.0008) +[2023-10-08 13:12:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74022912. Throughput: 0: 1777.9, 1: 1768.5. Samples: 18510740. Policy #0 lag: (min: 23.0, avg: 27.3, max: 55.0) +[2023-10-08 13:12:56,876][101941] Avg episode reward: [(0, '6.060'), (1, '7.580')] +[2023-10-08 13:12:58,554][102897] Updated weights for policy 0, policy_version 36130 (0.0008) +[2023-10-08 13:12:58,958][102897] Updated weights for policy 0, policy_version 36140 (0.0009) +[2023-10-08 13:12:59,248][102898] Updated weights for policy 1, policy_version 36170 (0.0007) +[2023-10-08 13:12:59,331][102897] Updated weights for policy 0, policy_version 36150 (0.0008) +[2023-10-08 13:12:59,622][102898] Updated weights for policy 1, policy_version 36180 (0.0008) +[2023-10-08 13:12:59,692][102897] Updated weights for policy 0, policy_version 36160 (0.0010) +[2023-10-08 13:12:59,990][102898] Updated weights for policy 1, policy_version 36190 (0.0010) +[2023-10-08 13:13:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74088448. Throughput: 0: 1768.2, 1: 1764.4. Samples: 18532492. Policy #0 lag: (min: 23.0, avg: 27.3, max: 55.0) +[2023-10-08 13:13:01,875][101941] Avg episode reward: [(0, '6.920'), (1, '7.810')] +[2023-10-08 13:13:03,562][102897] Updated weights for policy 0, policy_version 36170 (0.0007) +[2023-10-08 13:13:03,855][102898] Updated weights for policy 1, policy_version 36200 (0.0010) +[2023-10-08 13:13:03,934][102897] Updated weights for policy 0, policy_version 36180 (0.0008) +[2023-10-08 13:13:04,229][102898] Updated weights for policy 1, policy_version 36210 (0.0009) +[2023-10-08 13:13:04,316][102897] Updated weights for policy 0, policy_version 36190 (0.0008) +[2023-10-08 13:13:04,600][102898] Updated weights for policy 1, policy_version 36220 (0.0008) +[2023-10-08 13:13:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74153984. Throughput: 0: 1771.0, 1: 1777.6. Samples: 18542814. Policy #0 lag: (min: 23.0, avg: 27.3, max: 55.0) +[2023-10-08 13:13:06,876][101941] Avg episode reward: [(0, '6.560'), (1, '8.200')] +[2023-10-08 13:13:08,110][102897] Updated weights for policy 0, policy_version 36200 (0.0008) +[2023-10-08 13:13:08,288][102898] Updated weights for policy 1, policy_version 36230 (0.0008) +[2023-10-08 13:13:08,484][102897] Updated weights for policy 0, policy_version 36210 (0.0007) +[2023-10-08 13:13:08,655][102898] Updated weights for policy 1, policy_version 36240 (0.0007) +[2023-10-08 13:13:08,847][102897] Updated weights for policy 0, policy_version 36220 (0.0007) +[2023-10-08 13:13:09,022][102898] Updated weights for policy 1, policy_version 36250 (0.0009) +[2023-10-08 13:13:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 74219520. Throughput: 0: 1777.7, 1: 1771.5. Samples: 18564886. Policy #0 lag: (min: 23.0, avg: 27.3, max: 55.0) +[2023-10-08 13:13:11,876][101941] Avg episode reward: [(0, '6.990'), (1, '7.900')] +[2023-10-08 13:13:12,545][102897] Updated weights for policy 0, policy_version 36230 (0.0009) +[2023-10-08 13:13:12,794][102898] Updated weights for policy 1, policy_version 36260 (0.0007) +[2023-10-08 13:13:12,913][102897] Updated weights for policy 0, policy_version 36240 (0.0008) +[2023-10-08 13:13:13,164][102898] Updated weights for policy 1, policy_version 36270 (0.0007) +[2023-10-08 13:13:13,282][102897] Updated weights for policy 0, policy_version 36250 (0.0009) +[2023-10-08 13:13:13,541][102898] Updated weights for policy 1, policy_version 36280 (0.0008) +[2023-10-08 13:13:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74285056. Throughput: 0: 1796.0, 1: 1774.6. Samples: 18587308. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:13:16,875][101941] Avg episode reward: [(0, '7.140'), (1, '7.850')] +[2023-10-08 13:13:16,939][102897] Updated weights for policy 0, policy_version 36260 (0.0009) +[2023-10-08 13:13:17,298][102897] Updated weights for policy 0, policy_version 36270 (0.0009) +[2023-10-08 13:13:17,316][102898] Updated weights for policy 1, policy_version 36290 (0.0010) +[2023-10-08 13:13:17,664][102897] Updated weights for policy 0, policy_version 36280 (0.0007) +[2023-10-08 13:13:17,672][102898] Updated weights for policy 1, policy_version 36300 (0.0007) +[2023-10-08 13:13:18,049][102898] Updated weights for policy 1, policy_version 36310 (0.0010) +[2023-10-08 13:13:18,409][102898] Updated weights for policy 1, policy_version 36320 (0.0009) +[2023-10-08 13:13:21,346][102897] Updated weights for policy 0, policy_version 36290 (0.0008) +[2023-10-08 13:13:21,716][102897] Updated weights for policy 0, policy_version 36300 (0.0009) +[2023-10-08 13:13:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74350592. Throughput: 0: 1783.5, 1: 1769.7. Samples: 18596844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:13:21,875][101941] Avg episode reward: [(0, '6.590'), (1, '7.800')] +[2023-10-08 13:13:22,091][102897] Updated weights for policy 0, policy_version 36310 (0.0009) +[2023-10-08 13:13:22,246][102898] Updated weights for policy 1, policy_version 36330 (0.0007) +[2023-10-08 13:13:22,459][102897] Updated weights for policy 0, policy_version 36320 (0.0009) +[2023-10-08 13:13:22,614][102898] Updated weights for policy 1, policy_version 36340 (0.0009) +[2023-10-08 13:13:22,987][102898] Updated weights for policy 1, policy_version 36350 (0.0010) +[2023-10-08 13:13:26,191][102897] Updated weights for policy 0, policy_version 36330 (0.0010) +[2023-10-08 13:13:26,559][102897] Updated weights for policy 0, policy_version 36340 (0.0010) +[2023-10-08 13:13:26,718][102898] Updated weights for policy 1, policy_version 36360 (0.0008) +[2023-10-08 13:13:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74416128. Throughput: 0: 1799.3, 1: 1773.8. Samples: 18619504. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:13:26,875][101941] Avg episode reward: [(0, '6.320'), (1, '7.280')] +[2023-10-08 13:13:26,941][102897] Updated weights for policy 0, policy_version 36350 (0.0008) +[2023-10-08 13:13:27,093][102898] Updated weights for policy 1, policy_version 36370 (0.0009) +[2023-10-08 13:13:27,464][102898] Updated weights for policy 1, policy_version 36380 (0.0009) +[2023-10-08 13:13:30,724][102897] Updated weights for policy 0, policy_version 36360 (0.0007) +[2023-10-08 13:13:31,088][102897] Updated weights for policy 0, policy_version 36370 (0.0008) +[2023-10-08 13:13:31,349][102898] Updated weights for policy 1, policy_version 36390 (0.0008) +[2023-10-08 13:13:31,460][102897] Updated weights for policy 0, policy_version 36380 (0.0008) +[2023-10-08 13:13:31,716][102898] Updated weights for policy 1, policy_version 36400 (0.0009) +[2023-10-08 13:13:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 74514432. Throughput: 0: 1792.1, 1: 1794.8. Samples: 18640084. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:13:31,876][101941] Avg episode reward: [(0, '6.090'), (1, '6.830')] +[2023-10-08 13:13:32,081][102898] Updated weights for policy 1, policy_version 36410 (0.0009) +[2023-10-08 13:13:35,137][102897] Updated weights for policy 0, policy_version 36390 (0.0007) +[2023-10-08 13:13:35,510][102897] Updated weights for policy 0, policy_version 36400 (0.0010) +[2023-10-08 13:13:35,841][102898] Updated weights for policy 1, policy_version 36420 (0.0009) +[2023-10-08 13:13:35,879][102897] Updated weights for policy 0, policy_version 36410 (0.0009) +[2023-10-08 13:13:36,202][102898] Updated weights for policy 1, policy_version 36430 (0.0008) +[2023-10-08 13:13:36,572][102898] Updated weights for policy 1, policy_version 36440 (0.0007) +[2023-10-08 13:13:36,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 74612736. Throughput: 0: 1793.1, 1: 1769.3. Samples: 18651208. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:13:36,875][101941] Avg episode reward: [(0, '5.970'), (1, '7.600')] +[2023-10-08 13:13:39,631][102897] Updated weights for policy 0, policy_version 36420 (0.0007) +[2023-10-08 13:13:40,002][102897] Updated weights for policy 0, policy_version 36430 (0.0007) +[2023-10-08 13:13:40,374][102898] Updated weights for policy 1, policy_version 36450 (0.0009) +[2023-10-08 13:13:40,377][102897] Updated weights for policy 0, policy_version 36440 (0.0008) +[2023-10-08 13:13:40,776][102898] Updated weights for policy 1, policy_version 36460 (0.0008) +[2023-10-08 13:13:41,140][102898] Updated weights for policy 1, policy_version 36470 (0.0009) +[2023-10-08 13:13:41,502][102898] Updated weights for policy 1, policy_version 36480 (0.0011) +[2023-10-08 13:13:41,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 74678272. Throughput: 0: 1797.2, 1: 1797.3. Samples: 18672492. Policy #0 lag: (min: 11.0, avg: 12.8, max: 40.0) +[2023-10-08 13:13:41,876][101941] Avg episode reward: [(0, '6.690'), (1, '8.270')] +[2023-10-08 13:13:44,155][102897] Updated weights for policy 0, policy_version 36450 (0.0007) +[2023-10-08 13:13:44,556][102897] Updated weights for policy 0, policy_version 36460 (0.0008) +[2023-10-08 13:13:44,917][102897] Updated weights for policy 0, policy_version 36470 (0.0007) +[2023-10-08 13:13:45,258][102898] Updated weights for policy 1, policy_version 36490 (0.0007) +[2023-10-08 13:13:45,288][102897] Updated weights for policy 0, policy_version 36480 (0.0008) +[2023-10-08 13:13:45,621][102898] Updated weights for policy 1, policy_version 36500 (0.0009) +[2023-10-08 13:13:45,989][102898] Updated weights for policy 1, policy_version 36510 (0.0007) +[2023-10-08 13:13:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74743808. Throughput: 0: 1800.8, 1: 1773.3. Samples: 18693326. Policy #0 lag: (min: 11.0, avg: 12.8, max: 40.0) +[2023-10-08 13:13:46,875][101941] Avg episode reward: [(0, '5.920'), (1, '8.300')] +[2023-10-08 13:13:49,020][102897] Updated weights for policy 0, policy_version 36490 (0.0007) +[2023-10-08 13:13:49,392][102897] Updated weights for policy 0, policy_version 36500 (0.0009) +[2023-10-08 13:13:49,684][102898] Updated weights for policy 1, policy_version 36520 (0.0008) +[2023-10-08 13:13:49,753][102897] Updated weights for policy 0, policy_version 36510 (0.0007) +[2023-10-08 13:13:50,060][102898] Updated weights for policy 1, policy_version 36530 (0.0008) +[2023-10-08 13:13:50,426][102898] Updated weights for policy 1, policy_version 36540 (0.0008) +[2023-10-08 13:13:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 74809344. Throughput: 0: 1810.4, 1: 1792.8. Samples: 18704958. Policy #0 lag: (min: 11.0, avg: 12.8, max: 40.0) +[2023-10-08 13:13:51,876][101941] Avg episode reward: [(0, '5.800'), (1, '8.060')] +[2023-10-08 13:13:53,565][102897] Updated weights for policy 0, policy_version 36520 (0.0009) +[2023-10-08 13:13:53,935][102897] Updated weights for policy 0, policy_version 36530 (0.0009) +[2023-10-08 13:13:54,207][102898] Updated weights for policy 1, policy_version 36550 (0.0008) +[2023-10-08 13:13:54,323][102897] Updated weights for policy 0, policy_version 36540 (0.0008) +[2023-10-08 13:13:54,579][102898] Updated weights for policy 1, policy_version 36560 (0.0007) +[2023-10-08 13:13:54,947][102898] Updated weights for policy 1, policy_version 36570 (0.0008) +[2023-10-08 13:13:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 74874880. Throughput: 0: 1795.3, 1: 1769.1. Samples: 18725282. Policy #0 lag: (min: 11.0, avg: 12.8, max: 40.0) +[2023-10-08 13:13:56,876][101941] Avg episode reward: [(0, '6.400'), (1, '7.980')] +[2023-10-08 13:13:58,205][102897] Updated weights for policy 0, policy_version 36550 (0.0007) +[2023-10-08 13:13:58,575][102897] Updated weights for policy 0, policy_version 36560 (0.0008) +[2023-10-08 13:13:58,608][102898] Updated weights for policy 1, policy_version 36580 (0.0009) +[2023-10-08 13:13:58,946][102897] Updated weights for policy 0, policy_version 36570 (0.0008) +[2023-10-08 13:13:58,971][102898] Updated weights for policy 1, policy_version 36590 (0.0007) +[2023-10-08 13:13:59,333][102898] Updated weights for policy 1, policy_version 36600 (0.0007) +[2023-10-08 13:14:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 74940416. Throughput: 0: 1790.5, 1: 1780.1. Samples: 18747986. Policy #0 lag: (min: 11.0, avg: 12.8, max: 40.0) +[2023-10-08 13:14:01,876][101941] Avg episode reward: [(0, '6.650'), (1, '7.800')] +[2023-10-08 13:14:02,724][102897] Updated weights for policy 0, policy_version 36580 (0.0007) +[2023-10-08 13:14:03,086][102898] Updated weights for policy 1, policy_version 36610 (0.0007) +[2023-10-08 13:14:03,095][102897] Updated weights for policy 0, policy_version 36590 (0.0008) +[2023-10-08 13:14:03,448][102898] Updated weights for policy 1, policy_version 36620 (0.0007) +[2023-10-08 13:14:03,469][102897] Updated weights for policy 0, policy_version 36600 (0.0007) +[2023-10-08 13:14:03,810][102898] Updated weights for policy 1, policy_version 36630 (0.0009) +[2023-10-08 13:14:04,180][102898] Updated weights for policy 1, policy_version 36640 (0.0011) +[2023-10-08 13:14:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 75005952. Throughput: 0: 1789.0, 1: 1783.3. Samples: 18757598. Policy #0 lag: (min: 11.0, avg: 12.8, max: 40.0) +[2023-10-08 13:14:06,876][101941] Avg episode reward: [(0, '6.560'), (1, '6.960')] +[2023-10-08 13:14:07,107][102897] Updated weights for policy 0, policy_version 36610 (0.0010) +[2023-10-08 13:14:07,486][102897] Updated weights for policy 0, policy_version 36620 (0.0010) +[2023-10-08 13:14:07,850][102897] Updated weights for policy 0, policy_version 36630 (0.0007) +[2023-10-08 13:14:08,027][102898] Updated weights for policy 1, policy_version 36650 (0.0008) +[2023-10-08 13:14:08,219][102897] Updated weights for policy 0, policy_version 36640 (0.0007) +[2023-10-08 13:14:08,385][102898] Updated weights for policy 1, policy_version 36660 (0.0009) +[2023-10-08 13:14:08,748][102898] Updated weights for policy 1, policy_version 36670 (0.0010) +[2023-10-08 13:14:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75071488. Throughput: 0: 1786.2, 1: 1776.5. Samples: 18779826. Policy #0 lag: (min: 2.0, avg: 6.3, max: 34.0) +[2023-10-08 13:14:11,875][101941] Avg episode reward: [(0, '6.230'), (1, '7.050')] +[2023-10-08 13:14:11,966][102897] Updated weights for policy 0, policy_version 36650 (0.0008) +[2023-10-08 13:14:12,345][102897] Updated weights for policy 0, policy_version 36660 (0.0008) +[2023-10-08 13:14:12,672][102898] Updated weights for policy 1, policy_version 36680 (0.0009) +[2023-10-08 13:14:12,719][102897] Updated weights for policy 0, policy_version 36670 (0.0007) +[2023-10-08 13:14:13,041][102898] Updated weights for policy 1, policy_version 36690 (0.0008) +[2023-10-08 13:14:13,405][102898] Updated weights for policy 1, policy_version 36700 (0.0008) +[2023-10-08 13:14:16,503][102897] Updated weights for policy 0, policy_version 36680 (0.0008) +[2023-10-08 13:14:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 75137024. Throughput: 0: 1805.1, 1: 1783.7. Samples: 18801578. Policy #0 lag: (min: 2.0, avg: 6.3, max: 34.0) +[2023-10-08 13:14:16,876][102897] Updated weights for policy 0, policy_version 36690 (0.0007) +[2023-10-08 13:14:16,876][101941] Avg episode reward: [(0, '5.840'), (1, '7.470')] +[2023-10-08 13:14:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000036704_37584896.pth... +[2023-10-08 13:14:16,922][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000035040_35880960.pth +[2023-10-08 13:14:17,238][102897] Updated weights for policy 0, policy_version 36700 (0.0007) +[2023-10-08 13:14:17,333][102898] Updated weights for policy 1, policy_version 36710 (0.0008) +[2023-10-08 13:14:17,385][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000036704_37584896.pth... +[2023-10-08 13:14:17,420][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000035008_35848192.pth +[2023-10-08 13:14:17,694][102898] Updated weights for policy 1, policy_version 36720 (0.0007) +[2023-10-08 13:14:18,072][102898] Updated weights for policy 1, policy_version 36730 (0.0010) +[2023-10-08 13:14:20,942][102897] Updated weights for policy 0, policy_version 36710 (0.0007) +[2023-10-08 13:14:21,314][102897] Updated weights for policy 0, policy_version 36720 (0.0009) +[2023-10-08 13:14:21,690][102897] Updated weights for policy 0, policy_version 36730 (0.0008) +[2023-10-08 13:14:21,849][102898] Updated weights for policy 1, policy_version 36740 (0.0009) +[2023-10-08 13:14:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75202560. Throughput: 0: 1783.5, 1: 1777.6. Samples: 18811456. Policy #0 lag: (min: 2.0, avg: 6.3, max: 34.0) +[2023-10-08 13:14:21,875][101941] Avg episode reward: [(0, '5.870'), (1, '7.500')] +[2023-10-08 13:14:22,222][102898] Updated weights for policy 1, policy_version 36750 (0.0009) +[2023-10-08 13:14:22,592][102898] Updated weights for policy 1, policy_version 36760 (0.0010) +[2023-10-08 13:14:25,405][102897] Updated weights for policy 0, policy_version 36740 (0.0010) +[2023-10-08 13:14:25,782][102897] Updated weights for policy 0, policy_version 36750 (0.0008) +[2023-10-08 13:14:26,155][102897] Updated weights for policy 0, policy_version 36760 (0.0008) +[2023-10-08 13:14:26,443][102898] Updated weights for policy 1, policy_version 36770 (0.0008) +[2023-10-08 13:14:26,840][102898] Updated weights for policy 1, policy_version 36780 (0.0009) +[2023-10-08 13:14:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 75300864. Throughput: 0: 1806.2, 1: 1779.6. Samples: 18833854. Policy #0 lag: (min: 2.0, avg: 6.3, max: 34.0) +[2023-10-08 13:14:26,876][101941] Avg episode reward: [(0, '5.920'), (1, '7.790')] +[2023-10-08 13:14:27,210][102898] Updated weights for policy 1, policy_version 36790 (0.0008) +[2023-10-08 13:14:27,569][102898] Updated weights for policy 1, policy_version 36800 (0.0007) +[2023-10-08 13:14:29,881][102897] Updated weights for policy 0, policy_version 36770 (0.0008) +[2023-10-08 13:14:30,260][102897] Updated weights for policy 0, policy_version 36780 (0.0010) +[2023-10-08 13:14:30,620][102897] Updated weights for policy 0, policy_version 36790 (0.0009) +[2023-10-08 13:14:30,997][102897] Updated weights for policy 0, policy_version 36800 (0.0009) +[2023-10-08 13:14:31,345][102898] Updated weights for policy 1, policy_version 36810 (0.0007) +[2023-10-08 13:14:31,710][102898] Updated weights for policy 1, policy_version 36820 (0.0008) +[2023-10-08 13:14:31,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 75366400. Throughput: 0: 1784.6, 1: 1795.5. Samples: 18854434. Policy #0 lag: (min: 2.0, avg: 6.3, max: 34.0) +[2023-10-08 13:14:31,876][101941] Avg episode reward: [(0, '6.020'), (1, '8.120')] +[2023-10-08 13:14:32,084][102898] Updated weights for policy 1, policy_version 36830 (0.0009) +[2023-10-08 13:14:34,755][102897] Updated weights for policy 0, policy_version 36810 (0.0007) +[2023-10-08 13:14:35,125][102897] Updated weights for policy 0, policy_version 36820 (0.0007) +[2023-10-08 13:14:35,493][102897] Updated weights for policy 0, policy_version 36830 (0.0009) +[2023-10-08 13:14:35,872][102898] Updated weights for policy 1, policy_version 36840 (0.0009) +[2023-10-08 13:14:36,235][102898] Updated weights for policy 1, policy_version 36850 (0.0007) +[2023-10-08 13:14:36,601][102898] Updated weights for policy 1, policy_version 36860 (0.0009) +[2023-10-08 13:14:36,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 75464704. Throughput: 0: 1808.1, 1: 1774.1. Samples: 18866156. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 13:14:36,875][101941] Avg episode reward: [(0, '6.750'), (1, '7.570')] +[2023-10-08 13:14:39,301][102897] Updated weights for policy 0, policy_version 36840 (0.0009) +[2023-10-08 13:14:39,675][102897] Updated weights for policy 0, policy_version 36850 (0.0008) +[2023-10-08 13:14:40,054][102897] Updated weights for policy 0, policy_version 36860 (0.0008) +[2023-10-08 13:14:40,398][102898] Updated weights for policy 1, policy_version 36870 (0.0010) +[2023-10-08 13:14:40,763][102898] Updated weights for policy 1, policy_version 36880 (0.0007) +[2023-10-08 13:14:41,135][102898] Updated weights for policy 1, policy_version 36890 (0.0007) +[2023-10-08 13:14:41,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75530240. Throughput: 0: 1785.8, 1: 1798.2. Samples: 18886564. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 13:14:41,875][101941] Avg episode reward: [(0, '6.720'), (1, '7.610')] +[2023-10-08 13:14:43,771][102897] Updated weights for policy 0, policy_version 36870 (0.0008) +[2023-10-08 13:14:44,137][102897] Updated weights for policy 0, policy_version 36880 (0.0007) +[2023-10-08 13:14:44,519][102897] Updated weights for policy 0, policy_version 36890 (0.0008) +[2023-10-08 13:14:44,882][102898] Updated weights for policy 1, policy_version 36900 (0.0007) +[2023-10-08 13:14:45,245][102898] Updated weights for policy 1, policy_version 36910 (0.0007) +[2023-10-08 13:14:45,616][102898] Updated weights for policy 1, policy_version 36920 (0.0009) +[2023-10-08 13:14:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 75595776. Throughput: 0: 1783.5, 1: 1764.1. Samples: 18907628. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 13:14:46,876][101941] Avg episode reward: [(0, '5.830'), (1, '7.360')] +[2023-10-08 13:14:48,357][102897] Updated weights for policy 0, policy_version 36900 (0.0008) +[2023-10-08 13:14:48,726][102897] Updated weights for policy 0, policy_version 36910 (0.0008) +[2023-10-08 13:14:49,112][102897] Updated weights for policy 0, policy_version 36920 (0.0008) +[2023-10-08 13:14:49,270][102898] Updated weights for policy 1, policy_version 36930 (0.0007) +[2023-10-08 13:14:49,639][102898] Updated weights for policy 1, policy_version 36940 (0.0007) +[2023-10-08 13:14:50,007][102898] Updated weights for policy 1, policy_version 36950 (0.0009) +[2023-10-08 13:14:50,369][102898] Updated weights for policy 1, policy_version 36960 (0.0007) +[2023-10-08 13:14:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75661312. Throughput: 0: 1786.8, 1: 1792.1. Samples: 18918648. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 13:14:51,876][101941] Avg episode reward: [(0, '5.850'), (1, '7.290')] +[2023-10-08 13:14:52,839][102897] Updated weights for policy 0, policy_version 36930 (0.0008) +[2023-10-08 13:14:53,205][102897] Updated weights for policy 0, policy_version 36940 (0.0009) +[2023-10-08 13:14:53,585][102897] Updated weights for policy 0, policy_version 36950 (0.0008) +[2023-10-08 13:14:53,944][102897] Updated weights for policy 0, policy_version 36960 (0.0008) +[2023-10-08 13:14:54,083][102898] Updated weights for policy 1, policy_version 36970 (0.0008) +[2023-10-08 13:14:54,451][102898] Updated weights for policy 1, policy_version 36980 (0.0009) +[2023-10-08 13:14:54,814][102898] Updated weights for policy 1, policy_version 36990 (0.0007) +[2023-10-08 13:14:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75726848. Throughput: 0: 1782.3, 1: 1772.4. Samples: 18939784. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 13:14:56,876][101941] Avg episode reward: [(0, '6.620'), (1, '7.430')] +[2023-10-08 13:14:57,647][102897] Updated weights for policy 0, policy_version 36970 (0.0007) +[2023-10-08 13:14:58,021][102897] Updated weights for policy 0, policy_version 36980 (0.0007) +[2023-10-08 13:14:58,394][102897] Updated weights for policy 0, policy_version 36990 (0.0008) +[2023-10-08 13:14:58,564][102898] Updated weights for policy 1, policy_version 37000 (0.0008) +[2023-10-08 13:14:58,934][102898] Updated weights for policy 1, policy_version 37010 (0.0007) +[2023-10-08 13:14:59,294][102898] Updated weights for policy 1, policy_version 37020 (0.0007) +[2023-10-08 13:15:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75792384. Throughput: 0: 1790.9, 1: 1781.1. Samples: 18962316. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 13:15:01,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.040')] +[2023-10-08 13:15:02,339][102897] Updated weights for policy 0, policy_version 37000 (0.0007) +[2023-10-08 13:15:02,708][102897] Updated weights for policy 0, policy_version 37010 (0.0007) +[2023-10-08 13:15:03,087][102897] Updated weights for policy 0, policy_version 37020 (0.0007) +[2023-10-08 13:15:03,157][102898] Updated weights for policy 1, policy_version 37030 (0.0008) +[2023-10-08 13:15:03,523][102898] Updated weights for policy 1, policy_version 37040 (0.0008) +[2023-10-08 13:15:03,894][102898] Updated weights for policy 1, policy_version 37050 (0.0008) +[2023-10-08 13:15:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75857920. Throughput: 0: 1786.9, 1: 1780.0. Samples: 18971970. Policy #0 lag: (min: 2.0, avg: 2.2, max: 12.0) +[2023-10-08 13:15:06,875][101941] Avg episode reward: [(0, '6.430'), (1, '7.320')] +[2023-10-08 13:15:06,920][102897] Updated weights for policy 0, policy_version 37030 (0.0008) +[2023-10-08 13:15:07,290][102897] Updated weights for policy 0, policy_version 37040 (0.0007) +[2023-10-08 13:15:07,663][102897] Updated weights for policy 0, policy_version 37050 (0.0007) +[2023-10-08 13:15:07,671][102898] Updated weights for policy 1, policy_version 37060 (0.0008) +[2023-10-08 13:15:08,035][102898] Updated weights for policy 1, policy_version 37070 (0.0009) +[2023-10-08 13:15:08,405][102898] Updated weights for policy 1, policy_version 37080 (0.0011) +[2023-10-08 13:15:11,444][102897] Updated weights for policy 0, policy_version 37060 (0.0007) +[2023-10-08 13:15:11,816][102897] Updated weights for policy 0, policy_version 37070 (0.0007) +[2023-10-08 13:15:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 75923456. Throughput: 0: 1784.6, 1: 1783.0. Samples: 18994394. Policy #0 lag: (min: 2.0, avg: 2.2, max: 12.0) +[2023-10-08 13:15:11,876][101941] Avg episode reward: [(0, '6.300'), (1, '7.570')] +[2023-10-08 13:15:12,172][102898] Updated weights for policy 1, policy_version 37090 (0.0011) +[2023-10-08 13:15:12,178][102897] Updated weights for policy 0, policy_version 37080 (0.0007) +[2023-10-08 13:15:12,544][102898] Updated weights for policy 1, policy_version 37100 (0.0010) +[2023-10-08 13:15:12,916][102898] Updated weights for policy 1, policy_version 37110 (0.0011) +[2023-10-08 13:15:13,282][102898] Updated weights for policy 1, policy_version 37120 (0.0007) +[2023-10-08 13:15:15,891][102897] Updated weights for policy 0, policy_version 37090 (0.0008) +[2023-10-08 13:15:16,288][102897] Updated weights for policy 0, policy_version 37100 (0.0007) +[2023-10-08 13:15:16,670][102897] Updated weights for policy 0, policy_version 37110 (0.0007) +[2023-10-08 13:15:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 75988992. Throughput: 0: 1792.4, 1: 1792.4. Samples: 19015752. Policy #0 lag: (min: 2.0, avg: 2.2, max: 12.0) +[2023-10-08 13:15:16,876][101941] Avg episode reward: [(0, '5.830'), (1, '6.970')] +[2023-10-08 13:15:17,050][102897] Updated weights for policy 0, policy_version 37120 (0.0007) +[2023-10-08 13:15:17,169][102898] Updated weights for policy 1, policy_version 37130 (0.0009) +[2023-10-08 13:15:17,528][102898] Updated weights for policy 1, policy_version 37140 (0.0008) +[2023-10-08 13:15:17,893][102898] Updated weights for policy 1, policy_version 37150 (0.0008) +[2023-10-08 13:15:20,642][102897] Updated weights for policy 0, policy_version 37130 (0.0009) +[2023-10-08 13:15:21,014][102897] Updated weights for policy 0, policy_version 37140 (0.0011) +[2023-10-08 13:15:21,384][102897] Updated weights for policy 0, policy_version 37150 (0.0008) +[2023-10-08 13:15:21,814][102898] Updated weights for policy 1, policy_version 37160 (0.0008) +[2023-10-08 13:15:21,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 76087296. Throughput: 0: 1774.2, 1: 1779.3. Samples: 19026066. Policy #0 lag: (min: 2.0, avg: 2.2, max: 12.0) +[2023-10-08 13:15:21,876][101941] Avg episode reward: [(0, '5.940'), (1, '6.950')] +[2023-10-08 13:15:22,182][102898] Updated weights for policy 1, policy_version 37170 (0.0008) +[2023-10-08 13:15:22,549][102898] Updated weights for policy 1, policy_version 37180 (0.0010) +[2023-10-08 13:15:25,218][102897] Updated weights for policy 0, policy_version 37160 (0.0008) +[2023-10-08 13:15:25,586][102897] Updated weights for policy 0, policy_version 37170 (0.0008) +[2023-10-08 13:15:25,961][102897] Updated weights for policy 0, policy_version 37180 (0.0007) +[2023-10-08 13:15:26,311][102898] Updated weights for policy 1, policy_version 37190 (0.0009) +[2023-10-08 13:15:26,673][102898] Updated weights for policy 1, policy_version 37200 (0.0007) +[2023-10-08 13:15:26,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 76152832. Throughput: 0: 1797.6, 1: 1788.4. Samples: 19047934. Policy #0 lag: (min: 2.0, avg: 2.2, max: 12.0) +[2023-10-08 13:15:26,876][101941] Avg episode reward: [(0, '5.590'), (1, '7.710')] +[2023-10-08 13:15:27,030][102898] Updated weights for policy 1, policy_version 37210 (0.0007) +[2023-10-08 13:15:29,656][102897] Updated weights for policy 0, policy_version 37190 (0.0007) +[2023-10-08 13:15:30,026][102897] Updated weights for policy 0, policy_version 37200 (0.0007) +[2023-10-08 13:15:30,400][102897] Updated weights for policy 0, policy_version 37210 (0.0008) +[2023-10-08 13:15:30,971][102898] Updated weights for policy 1, policy_version 37220 (0.0008) +[2023-10-08 13:15:31,339][102898] Updated weights for policy 1, policy_version 37230 (0.0008) +[2023-10-08 13:15:31,713][102898] Updated weights for policy 1, policy_version 37240 (0.0008) +[2023-10-08 13:15:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 76218368. Throughput: 0: 1781.9, 1: 1794.6. Samples: 19068570. Policy #0 lag: (min: 20.0, avg: 25.7, max: 52.0) +[2023-10-08 13:15:31,876][101941] Avg episode reward: [(0, '5.350'), (1, '7.630')] +[2023-10-08 13:15:33,990][102897] Updated weights for policy 0, policy_version 37220 (0.0007) +[2023-10-08 13:15:34,359][102897] Updated weights for policy 0, policy_version 37230 (0.0008) +[2023-10-08 13:15:34,733][102897] Updated weights for policy 0, policy_version 37240 (0.0009) +[2023-10-08 13:15:35,398][102898] Updated weights for policy 1, policy_version 37250 (0.0007) +[2023-10-08 13:15:35,760][102898] Updated weights for policy 1, policy_version 37260 (0.0008) +[2023-10-08 13:15:36,129][102898] Updated weights for policy 1, policy_version 37270 (0.0011) +[2023-10-08 13:15:36,489][102898] Updated weights for policy 1, policy_version 37280 (0.0010) +[2023-10-08 13:15:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 76316672. Throughput: 0: 1799.6, 1: 1784.4. Samples: 19079930. Policy #0 lag: (min: 20.0, avg: 25.7, max: 52.0) +[2023-10-08 13:15:36,875][101941] Avg episode reward: [(0, '5.560'), (1, '7.010')] +[2023-10-08 13:15:38,569][102897] Updated weights for policy 0, policy_version 37250 (0.0007) +[2023-10-08 13:15:38,939][102897] Updated weights for policy 0, policy_version 37260 (0.0009) +[2023-10-08 13:15:39,311][102897] Updated weights for policy 0, policy_version 37270 (0.0009) +[2023-10-08 13:15:39,672][102897] Updated weights for policy 0, policy_version 37280 (0.0008) +[2023-10-08 13:15:40,432][102898] Updated weights for policy 1, policy_version 37290 (0.0010) +[2023-10-08 13:15:40,807][102898] Updated weights for policy 1, policy_version 37300 (0.0009) +[2023-10-08 13:15:41,172][102898] Updated weights for policy 1, policy_version 37310 (0.0009) +[2023-10-08 13:15:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 76382208. Throughput: 0: 1784.3, 1: 1796.0. Samples: 19100896. Policy #0 lag: (min: 20.0, avg: 25.7, max: 52.0) +[2023-10-08 13:15:41,876][101941] Avg episode reward: [(0, '5.630'), (1, '6.990')] +[2023-10-08 13:15:43,434][102897] Updated weights for policy 0, policy_version 37290 (0.0008) +[2023-10-08 13:15:43,810][102897] Updated weights for policy 0, policy_version 37300 (0.0008) +[2023-10-08 13:15:44,183][102897] Updated weights for policy 0, policy_version 37310 (0.0007) +[2023-10-08 13:15:44,855][102898] Updated weights for policy 1, policy_version 37320 (0.0011) +[2023-10-08 13:15:45,220][102898] Updated weights for policy 1, policy_version 37330 (0.0009) +[2023-10-08 13:15:45,586][102898] Updated weights for policy 1, policy_version 37340 (0.0009) +[2023-10-08 13:15:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 76447744. Throughput: 0: 1783.7, 1: 1773.1. Samples: 19122370. Policy #0 lag: (min: 20.0, avg: 25.7, max: 52.0) +[2023-10-08 13:15:46,876][101941] Avg episode reward: [(0, '5.440'), (1, '7.260')] +[2023-10-08 13:15:47,905][102897] Updated weights for policy 0, policy_version 37320 (0.0009) +[2023-10-08 13:15:48,270][102897] Updated weights for policy 0, policy_version 37330 (0.0010) +[2023-10-08 13:15:48,658][102897] Updated weights for policy 0, policy_version 37340 (0.0008) +[2023-10-08 13:15:49,298][102898] Updated weights for policy 1, policy_version 37350 (0.0008) +[2023-10-08 13:15:49,658][102898] Updated weights for policy 1, policy_version 37360 (0.0008) +[2023-10-08 13:15:50,028][102898] Updated weights for policy 1, policy_version 37370 (0.0009) +[2023-10-08 13:15:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 76513280. Throughput: 0: 1783.6, 1: 1794.9. Samples: 19133006. Policy #0 lag: (min: 20.0, avg: 25.7, max: 52.0) +[2023-10-08 13:15:51,876][101941] Avg episode reward: [(0, '5.190'), (1, '7.860')] +[2023-10-08 13:15:52,407][102897] Updated weights for policy 0, policy_version 37350 (0.0009) +[2023-10-08 13:15:52,778][102897] Updated weights for policy 0, policy_version 37360 (0.0008) +[2023-10-08 13:15:53,150][102897] Updated weights for policy 0, policy_version 37370 (0.0007) +[2023-10-08 13:15:53,674][102898] Updated weights for policy 1, policy_version 37380 (0.0007) +[2023-10-08 13:15:54,035][102898] Updated weights for policy 1, policy_version 37390 (0.0008) +[2023-10-08 13:15:54,399][102898] Updated weights for policy 1, policy_version 37400 (0.0007) +[2023-10-08 13:15:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 76578816. Throughput: 0: 1783.6, 1: 1774.7. Samples: 19154518. Policy #0 lag: (min: 20.0, avg: 25.7, max: 52.0) +[2023-10-08 13:15:56,876][101941] Avg episode reward: [(0, '5.810'), (1, '8.120')] +[2023-10-08 13:15:56,881][102897] Updated weights for policy 0, policy_version 37380 (0.0010) +[2023-10-08 13:15:57,251][102897] Updated weights for policy 0, policy_version 37390 (0.0007) +[2023-10-08 13:15:57,633][102897] Updated weights for policy 0, policy_version 37400 (0.0009) +[2023-10-08 13:15:58,165][102898] Updated weights for policy 1, policy_version 37410 (0.0009) +[2023-10-08 13:15:58,564][102898] Updated weights for policy 1, policy_version 37420 (0.0007) +[2023-10-08 13:15:58,939][102898] Updated weights for policy 1, policy_version 37430 (0.0008) +[2023-10-08 13:15:59,300][102898] Updated weights for policy 1, policy_version 37440 (0.0009) +[2023-10-08 13:16:01,519][102897] Updated weights for policy 0, policy_version 37410 (0.0008) +[2023-10-08 13:16:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 76644352. Throughput: 0: 1800.2, 1: 1778.3. Samples: 19176784. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:01,876][101941] Avg episode reward: [(0, '6.380'), (1, '8.760')] +[2023-10-08 13:16:01,885][102760] Saving new best policy, reward=8.760! +[2023-10-08 13:16:01,935][102897] Updated weights for policy 0, policy_version 37420 (0.0007) +[2023-10-08 13:16:02,312][102897] Updated weights for policy 0, policy_version 37430 (0.0008) +[2023-10-08 13:16:02,679][102897] Updated weights for policy 0, policy_version 37440 (0.0007) +[2023-10-08 13:16:03,043][102898] Updated weights for policy 1, policy_version 37450 (0.0007) +[2023-10-08 13:16:03,414][102898] Updated weights for policy 1, policy_version 37460 (0.0008) +[2023-10-08 13:16:03,776][102898] Updated weights for policy 1, policy_version 37470 (0.0008) +[2023-10-08 13:16:06,351][102897] Updated weights for policy 0, policy_version 37450 (0.0010) +[2023-10-08 13:16:06,731][102897] Updated weights for policy 0, policy_version 37460 (0.0008) +[2023-10-08 13:16:06,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 76709888. Throughput: 0: 1784.9, 1: 1780.0. Samples: 19186490. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:06,877][101941] Avg episode reward: [(0, '6.310'), (1, '7.410')] +[2023-10-08 13:16:07,093][102897] Updated weights for policy 0, policy_version 37470 (0.0008) +[2023-10-08 13:16:07,487][102898] Updated weights for policy 1, policy_version 37480 (0.0008) +[2023-10-08 13:16:07,860][102898] Updated weights for policy 1, policy_version 37490 (0.0008) +[2023-10-08 13:16:08,227][102898] Updated weights for policy 1, policy_version 37500 (0.0008) +[2023-10-08 13:16:10,802][102897] Updated weights for policy 0, policy_version 37480 (0.0008) +[2023-10-08 13:16:11,173][102897] Updated weights for policy 0, policy_version 37490 (0.0007) +[2023-10-08 13:16:11,539][102897] Updated weights for policy 0, policy_version 37500 (0.0009) +[2023-10-08 13:16:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 76808192. Throughput: 0: 1800.2, 1: 1778.2. Samples: 19208962. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:11,875][101941] Avg episode reward: [(0, '6.620'), (1, '7.740')] +[2023-10-08 13:16:12,020][102898] Updated weights for policy 1, policy_version 37510 (0.0009) +[2023-10-08 13:16:12,387][102898] Updated weights for policy 1, policy_version 37520 (0.0010) +[2023-10-08 13:16:12,746][102898] Updated weights for policy 1, policy_version 37530 (0.0009) +[2023-10-08 13:16:15,105][102897] Updated weights for policy 0, policy_version 37510 (0.0008) +[2023-10-08 13:16:15,476][102897] Updated weights for policy 0, policy_version 37520 (0.0010) +[2023-10-08 13:16:15,861][102897] Updated weights for policy 0, policy_version 37530 (0.0011) +[2023-10-08 13:16:16,492][102898] Updated weights for policy 1, policy_version 37540 (0.0007) +[2023-10-08 13:16:16,856][102898] Updated weights for policy 1, policy_version 37550 (0.0008) +[2023-10-08 13:16:16,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 76873728. Throughput: 0: 1788.8, 1: 1797.9. Samples: 19229972. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:16,876][101941] Avg episode reward: [(0, '6.270'), (1, '7.690')] +[2023-10-08 13:16:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000037536_38436864.pth... +[2023-10-08 13:16:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000035840_36700160.pth +[2023-10-08 13:16:17,215][102898] Updated weights for policy 1, policy_version 37560 (0.0008) +[2023-10-08 13:16:17,509][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000037568_38469632.pth... +[2023-10-08 13:16:17,538][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000035872_36732928.pth +[2023-10-08 13:16:19,600][102897] Updated weights for policy 0, policy_version 37540 (0.0007) +[2023-10-08 13:16:19,978][102897] Updated weights for policy 0, policy_version 37550 (0.0007) +[2023-10-08 13:16:20,347][102897] Updated weights for policy 0, policy_version 37560 (0.0009) +[2023-10-08 13:16:21,135][102898] Updated weights for policy 1, policy_version 37570 (0.0009) +[2023-10-08 13:16:21,505][102898] Updated weights for policy 1, policy_version 37580 (0.0008) +[2023-10-08 13:16:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 76939264. Throughput: 0: 1807.8, 1: 1780.6. Samples: 19241408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:21,876][101941] Avg episode reward: [(0, '5.660'), (1, '7.090')] +[2023-10-08 13:16:21,877][102898] Updated weights for policy 1, policy_version 37590 (0.0009) +[2023-10-08 13:16:22,240][102898] Updated weights for policy 1, policy_version 37600 (0.0010) +[2023-10-08 13:16:23,935][102897] Updated weights for policy 0, policy_version 37570 (0.0009) +[2023-10-08 13:16:24,307][102897] Updated weights for policy 0, policy_version 37580 (0.0009) +[2023-10-08 13:16:24,682][102897] Updated weights for policy 0, policy_version 37590 (0.0008) +[2023-10-08 13:16:25,062][102897] Updated weights for policy 0, policy_version 37600 (0.0007) +[2023-10-08 13:16:26,110][102898] Updated weights for policy 1, policy_version 37610 (0.0009) +[2023-10-08 13:16:26,474][102898] Updated weights for policy 1, policy_version 37620 (0.0009) +[2023-10-08 13:16:26,840][102898] Updated weights for policy 1, policy_version 37630 (0.0008) +[2023-10-08 13:16:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 77004800. Throughput: 0: 1796.4, 1: 1793.4. Samples: 19262436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:26,876][101941] Avg episode reward: [(0, '5.320'), (1, '7.360')] +[2023-10-08 13:16:28,959][102897] Updated weights for policy 0, policy_version 37610 (0.0008) +[2023-10-08 13:16:29,327][102897] Updated weights for policy 0, policy_version 37620 (0.0007) +[2023-10-08 13:16:29,709][102897] Updated weights for policy 0, policy_version 37630 (0.0009) +[2023-10-08 13:16:30,575][102898] Updated weights for policy 1, policy_version 37640 (0.0007) +[2023-10-08 13:16:30,944][102898] Updated weights for policy 1, policy_version 37650 (0.0007) +[2023-10-08 13:16:31,307][102898] Updated weights for policy 1, policy_version 37660 (0.0008) +[2023-10-08 13:16:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 77103104. Throughput: 0: 1799.6, 1: 1783.3. Samples: 19283596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:31,876][101941] Avg episode reward: [(0, '5.910'), (1, '7.020')] +[2023-10-08 13:16:33,472][102897] Updated weights for policy 0, policy_version 37640 (0.0007) +[2023-10-08 13:16:33,834][102897] Updated weights for policy 0, policy_version 37650 (0.0008) +[2023-10-08 13:16:34,212][102897] Updated weights for policy 0, policy_version 37660 (0.0008) +[2023-10-08 13:16:34,874][102898] Updated weights for policy 1, policy_version 37670 (0.0008) +[2023-10-08 13:16:35,244][102898] Updated weights for policy 1, policy_version 37680 (0.0010) +[2023-10-08 13:16:35,613][102898] Updated weights for policy 1, policy_version 37690 (0.0008) +[2023-10-08 13:16:36,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14218.1). Total num frames: 77168640. Throughput: 0: 1797.4, 1: 1797.7. Samples: 19294784. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:36,876][101941] Avg episode reward: [(0, '5.490'), (1, '7.620')] +[2023-10-08 13:16:38,038][102897] Updated weights for policy 0, policy_version 37670 (0.0008) +[2023-10-08 13:16:38,411][102897] Updated weights for policy 0, policy_version 37680 (0.0011) +[2023-10-08 13:16:38,787][102897] Updated weights for policy 0, policy_version 37690 (0.0007) +[2023-10-08 13:16:39,345][102898] Updated weights for policy 1, policy_version 37700 (0.0008) +[2023-10-08 13:16:39,714][102898] Updated weights for policy 1, policy_version 37710 (0.0009) +[2023-10-08 13:16:40,090][102898] Updated weights for policy 1, policy_version 37720 (0.0008) +[2023-10-08 13:16:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 77234176. Throughput: 0: 1794.8, 1: 1786.0. Samples: 19315658. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:41,876][101941] Avg episode reward: [(0, '5.350'), (1, '7.880')] +[2023-10-08 13:16:42,550][102897] Updated weights for policy 0, policy_version 37700 (0.0008) +[2023-10-08 13:16:42,928][102897] Updated weights for policy 0, policy_version 37710 (0.0010) +[2023-10-08 13:16:43,300][102897] Updated weights for policy 0, policy_version 37720 (0.0009) +[2023-10-08 13:16:43,824][102898] Updated weights for policy 1, policy_version 37730 (0.0008) +[2023-10-08 13:16:44,233][102898] Updated weights for policy 1, policy_version 37740 (0.0008) +[2023-10-08 13:16:44,613][102898] Updated weights for policy 1, policy_version 37750 (0.0008) +[2023-10-08 13:16:44,978][102898] Updated weights for policy 1, policy_version 37760 (0.0007) +[2023-10-08 13:16:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 77299712. Throughput: 0: 1792.3, 1: 1784.7. Samples: 19337748. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:46,876][101941] Avg episode reward: [(0, '6.140'), (1, '7.480')] +[2023-10-08 13:16:47,184][102897] Updated weights for policy 0, policy_version 37730 (0.0009) +[2023-10-08 13:16:47,583][102897] Updated weights for policy 0, policy_version 37740 (0.0007) +[2023-10-08 13:16:47,950][102897] Updated weights for policy 0, policy_version 37750 (0.0007) +[2023-10-08 13:16:48,322][102897] Updated weights for policy 0, policy_version 37760 (0.0007) +[2023-10-08 13:16:48,837][102898] Updated weights for policy 1, policy_version 37770 (0.0008) +[2023-10-08 13:16:49,201][102898] Updated weights for policy 1, policy_version 37780 (0.0008) +[2023-10-08 13:16:49,572][102898] Updated weights for policy 1, policy_version 37790 (0.0008) +[2023-10-08 13:16:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 77365248. Throughput: 0: 1792.0, 1: 1794.1. Samples: 19347862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:16:51,876][101941] Avg episode reward: [(0, '6.130'), (1, '7.000')] +[2023-10-08 13:16:52,042][102897] Updated weights for policy 0, policy_version 37770 (0.0011) +[2023-10-08 13:16:52,413][102897] Updated weights for policy 0, policy_version 37780 (0.0009) +[2023-10-08 13:16:52,778][102897] Updated weights for policy 0, policy_version 37790 (0.0009) +[2023-10-08 13:16:53,333][102898] Updated weights for policy 1, policy_version 37800 (0.0007) +[2023-10-08 13:16:53,696][102898] Updated weights for policy 1, policy_version 37810 (0.0007) +[2023-10-08 13:16:54,062][102898] Updated weights for policy 1, policy_version 37820 (0.0011) +[2023-10-08 13:16:56,644][102897] Updated weights for policy 0, policy_version 37800 (0.0009) +[2023-10-08 13:16:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 77430784. Throughput: 0: 1790.3, 1: 1787.2. Samples: 19369950. Policy #0 lag: (min: 26.0, avg: 29.2, max: 56.0) +[2023-10-08 13:16:56,876][101941] Avg episode reward: [(0, '5.840'), (1, '6.750')] +[2023-10-08 13:16:57,018][102897] Updated weights for policy 0, policy_version 37810 (0.0008) +[2023-10-08 13:16:57,392][102897] Updated weights for policy 0, policy_version 37820 (0.0009) +[2023-10-08 13:16:57,769][102898] Updated weights for policy 1, policy_version 37830 (0.0008) +[2023-10-08 13:16:58,142][102898] Updated weights for policy 1, policy_version 37840 (0.0008) +[2023-10-08 13:16:58,507][102898] Updated weights for policy 1, policy_version 37850 (0.0008) +[2023-10-08 13:17:01,103][102897] Updated weights for policy 0, policy_version 37830 (0.0008) +[2023-10-08 13:17:01,473][102897] Updated weights for policy 0, policy_version 37840 (0.0008) +[2023-10-08 13:17:01,855][102897] Updated weights for policy 0, policy_version 37850 (0.0008) +[2023-10-08 13:17:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 77496320. Throughput: 0: 1802.4, 1: 1790.8. Samples: 19391664. Policy #0 lag: (min: 26.0, avg: 29.2, max: 56.0) +[2023-10-08 13:17:01,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.610')] +[2023-10-08 13:17:02,414][102898] Updated weights for policy 1, policy_version 37860 (0.0007) +[2023-10-08 13:17:02,779][102898] Updated weights for policy 1, policy_version 37870 (0.0009) +[2023-10-08 13:17:03,152][102898] Updated weights for policy 1, policy_version 37880 (0.0008) +[2023-10-08 13:17:05,629][102897] Updated weights for policy 0, policy_version 37860 (0.0008) +[2023-10-08 13:17:06,008][102897] Updated weights for policy 0, policy_version 37870 (0.0008) +[2023-10-08 13:17:06,368][102897] Updated weights for policy 0, policy_version 37880 (0.0008) +[2023-10-08 13:17:06,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 77594624. Throughput: 0: 1783.2, 1: 1786.7. Samples: 19402050. Policy #0 lag: (min: 26.0, avg: 29.2, max: 56.0) +[2023-10-08 13:17:06,875][101941] Avg episode reward: [(0, '6.370'), (1, '7.670')] +[2023-10-08 13:17:06,974][102898] Updated weights for policy 1, policy_version 37890 (0.0010) +[2023-10-08 13:17:07,344][102898] Updated weights for policy 1, policy_version 37900 (0.0007) +[2023-10-08 13:17:07,708][102898] Updated weights for policy 1, policy_version 37910 (0.0008) +[2023-10-08 13:17:08,071][102898] Updated weights for policy 1, policy_version 37920 (0.0008) +[2023-10-08 13:17:10,103][102897] Updated weights for policy 0, policy_version 37890 (0.0007) +[2023-10-08 13:17:10,469][102897] Updated weights for policy 0, policy_version 37900 (0.0007) +[2023-10-08 13:17:10,848][102897] Updated weights for policy 0, policy_version 37910 (0.0008) +[2023-10-08 13:17:11,209][102897] Updated weights for policy 0, policy_version 37920 (0.0009) +[2023-10-08 13:17:11,719][102898] Updated weights for policy 1, policy_version 37930 (0.0007) +[2023-10-08 13:17:11,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 77660160. Throughput: 0: 1798.1, 1: 1786.7. Samples: 19423752. Policy #0 lag: (min: 26.0, avg: 29.2, max: 56.0) +[2023-10-08 13:17:11,877][101941] Avg episode reward: [(0, '7.250'), (1, '7.800')] +[2023-10-08 13:17:12,084][102898] Updated weights for policy 1, policy_version 37940 (0.0008) +[2023-10-08 13:17:12,453][102898] Updated weights for policy 1, policy_version 37950 (0.0008) +[2023-10-08 13:17:14,945][102897] Updated weights for policy 0, policy_version 37930 (0.0007) +[2023-10-08 13:17:15,309][102897] Updated weights for policy 0, policy_version 37940 (0.0008) +[2023-10-08 13:17:15,683][102897] Updated weights for policy 0, policy_version 37950 (0.0009) +[2023-10-08 13:17:16,382][102898] Updated weights for policy 1, policy_version 37960 (0.0010) +[2023-10-08 13:17:16,753][102898] Updated weights for policy 1, policy_version 37970 (0.0011) +[2023-10-08 13:17:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 77725696. Throughput: 0: 1773.5, 1: 1803.0. Samples: 19444538. Policy #0 lag: (min: 26.0, avg: 29.2, max: 56.0) +[2023-10-08 13:17:16,876][101941] Avg episode reward: [(0, '6.630'), (1, '7.430')] +[2023-10-08 13:17:17,120][102898] Updated weights for policy 1, policy_version 37980 (0.0011) +[2023-10-08 13:17:19,490][102897] Updated weights for policy 0, policy_version 37960 (0.0009) +[2023-10-08 13:17:19,867][102897] Updated weights for policy 0, policy_version 37970 (0.0007) +[2023-10-08 13:17:20,243][102897] Updated weights for policy 0, policy_version 37980 (0.0008) +[2023-10-08 13:17:20,999][102898] Updated weights for policy 1, policy_version 37990 (0.0009) +[2023-10-08 13:17:21,370][102898] Updated weights for policy 1, policy_version 38000 (0.0009) +[2023-10-08 13:17:21,738][102898] Updated weights for policy 1, policy_version 38010 (0.0008) +[2023-10-08 13:17:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 77791232. Throughput: 0: 1803.7, 1: 1776.3. Samples: 19455882. Policy #0 lag: (min: 18.0, avg: 21.0, max: 50.0) +[2023-10-08 13:17:21,876][101941] Avg episode reward: [(0, '5.710'), (1, '7.600')] +[2023-10-08 13:17:23,976][102897] Updated weights for policy 0, policy_version 37990 (0.0010) +[2023-10-08 13:17:24,344][102897] Updated weights for policy 0, policy_version 38000 (0.0007) +[2023-10-08 13:17:24,719][102897] Updated weights for policy 0, policy_version 38010 (0.0007) +[2023-10-08 13:17:25,519][102898] Updated weights for policy 1, policy_version 38020 (0.0009) +[2023-10-08 13:17:25,894][102898] Updated weights for policy 1, policy_version 38030 (0.0009) +[2023-10-08 13:17:26,250][102898] Updated weights for policy 1, policy_version 38040 (0.0008) +[2023-10-08 13:17:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 77889536. Throughput: 0: 1775.2, 1: 1801.7. Samples: 19476620. Policy #0 lag: (min: 18.0, avg: 21.0, max: 50.0) +[2023-10-08 13:17:26,876][101941] Avg episode reward: [(0, '5.570'), (1, '7.880')] +[2023-10-08 13:17:28,415][102897] Updated weights for policy 0, policy_version 38020 (0.0010) +[2023-10-08 13:17:28,775][102897] Updated weights for policy 0, policy_version 38030 (0.0010) +[2023-10-08 13:17:29,152][102897] Updated weights for policy 0, policy_version 38040 (0.0008) +[2023-10-08 13:17:30,056][102898] Updated weights for policy 1, policy_version 38050 (0.0008) +[2023-10-08 13:17:30,461][102898] Updated weights for policy 1, policy_version 38060 (0.0007) +[2023-10-08 13:17:30,832][102898] Updated weights for policy 1, policy_version 38070 (0.0008) +[2023-10-08 13:17:31,194][102898] Updated weights for policy 1, policy_version 38080 (0.0009) +[2023-10-08 13:17:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 77955072. Throughput: 0: 1780.8, 1: 1771.0. Samples: 19497576. Policy #0 lag: (min: 18.0, avg: 21.0, max: 50.0) +[2023-10-08 13:17:31,876][101941] Avg episode reward: [(0, '6.390'), (1, '7.190')] +[2023-10-08 13:17:33,080][102897] Updated weights for policy 0, policy_version 38050 (0.0009) +[2023-10-08 13:17:33,493][102897] Updated weights for policy 0, policy_version 38060 (0.0009) +[2023-10-08 13:17:33,859][102897] Updated weights for policy 0, policy_version 38070 (0.0008) +[2023-10-08 13:17:34,238][102897] Updated weights for policy 0, policy_version 38080 (0.0008) +[2023-10-08 13:17:34,818][102898] Updated weights for policy 1, policy_version 38090 (0.0007) +[2023-10-08 13:17:35,189][102898] Updated weights for policy 1, policy_version 38100 (0.0008) +[2023-10-08 13:17:35,548][102898] Updated weights for policy 1, policy_version 38110 (0.0007) +[2023-10-08 13:17:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 78020608. Throughput: 0: 1775.5, 1: 1799.6. Samples: 19508742. Policy #0 lag: (min: 18.0, avg: 21.0, max: 50.0) +[2023-10-08 13:17:36,876][101941] Avg episode reward: [(0, '6.770'), (1, '7.320')] +[2023-10-08 13:17:37,987][102897] Updated weights for policy 0, policy_version 38090 (0.0007) +[2023-10-08 13:17:38,351][102897] Updated weights for policy 0, policy_version 38100 (0.0007) +[2023-10-08 13:17:38,716][102897] Updated weights for policy 0, policy_version 38110 (0.0008) +[2023-10-08 13:17:39,290][102898] Updated weights for policy 1, policy_version 38120 (0.0010) +[2023-10-08 13:17:39,656][102898] Updated weights for policy 1, policy_version 38130 (0.0011) +[2023-10-08 13:17:40,025][102898] Updated weights for policy 1, policy_version 38140 (0.0010) +[2023-10-08 13:17:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 78086144. Throughput: 0: 1772.4, 1: 1774.0. Samples: 19529540. Policy #0 lag: (min: 18.0, avg: 21.0, max: 50.0) +[2023-10-08 13:17:41,876][101941] Avg episode reward: [(0, '6.540'), (1, '8.350')] +[2023-10-08 13:17:42,598][102897] Updated weights for policy 0, policy_version 38120 (0.0007) +[2023-10-08 13:17:42,979][102897] Updated weights for policy 0, policy_version 38130 (0.0008) +[2023-10-08 13:17:43,336][102897] Updated weights for policy 0, policy_version 38140 (0.0011) +[2023-10-08 13:17:43,907][102898] Updated weights for policy 1, policy_version 38150 (0.0009) +[2023-10-08 13:17:44,278][102898] Updated weights for policy 1, policy_version 38160 (0.0009) +[2023-10-08 13:17:44,647][102898] Updated weights for policy 1, policy_version 38170 (0.0010) +[2023-10-08 13:17:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 78151680. Throughput: 0: 1787.7, 1: 1769.6. Samples: 19551744. Policy #0 lag: (min: 18.0, avg: 21.0, max: 50.0) +[2023-10-08 13:17:46,876][101941] Avg episode reward: [(0, '6.230'), (1, '7.880')] +[2023-10-08 13:17:47,043][102897] Updated weights for policy 0, policy_version 38150 (0.0009) +[2023-10-08 13:17:47,412][102897] Updated weights for policy 0, policy_version 38160 (0.0008) +[2023-10-08 13:17:47,784][102897] Updated weights for policy 0, policy_version 38170 (0.0010) +[2023-10-08 13:17:48,461][102898] Updated weights for policy 1, policy_version 38180 (0.0009) +[2023-10-08 13:17:48,828][102898] Updated weights for policy 1, policy_version 38190 (0.0008) +[2023-10-08 13:17:49,202][102898] Updated weights for policy 1, policy_version 38200 (0.0009) +[2023-10-08 13:17:51,365][102897] Updated weights for policy 0, policy_version 38180 (0.0009) +[2023-10-08 13:17:51,735][102897] Updated weights for policy 0, policy_version 38190 (0.0010) +[2023-10-08 13:17:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 78217216. Throughput: 0: 1772.4, 1: 1775.6. Samples: 19561714. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 13:17:51,876][101941] Avg episode reward: [(0, '6.590'), (1, '7.480')] +[2023-10-08 13:17:52,095][102897] Updated weights for policy 0, policy_version 38200 (0.0008) +[2023-10-08 13:17:53,050][102898] Updated weights for policy 1, policy_version 38210 (0.0007) +[2023-10-08 13:17:53,425][102898] Updated weights for policy 1, policy_version 38220 (0.0008) +[2023-10-08 13:17:53,802][102898] Updated weights for policy 1, policy_version 38230 (0.0009) +[2023-10-08 13:17:54,163][102898] Updated weights for policy 1, policy_version 38240 (0.0009) +[2023-10-08 13:17:55,791][102897] Updated weights for policy 0, policy_version 38210 (0.0009) +[2023-10-08 13:17:56,166][102897] Updated weights for policy 0, policy_version 38220 (0.0009) +[2023-10-08 13:17:56,534][102897] Updated weights for policy 0, policy_version 38230 (0.0009) +[2023-10-08 13:17:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 78282752. Throughput: 0: 1789.2, 1: 1774.2. Samples: 19584104. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 13:17:56,876][101941] Avg episode reward: [(0, '6.050'), (1, '7.430')] +[2023-10-08 13:17:56,914][102897] Updated weights for policy 0, policy_version 38240 (0.0008) +[2023-10-08 13:17:57,870][102898] Updated weights for policy 1, policy_version 38250 (0.0011) +[2023-10-08 13:17:58,233][102898] Updated weights for policy 1, policy_version 38260 (0.0011) +[2023-10-08 13:17:58,598][102898] Updated weights for policy 1, policy_version 38270 (0.0008) +[2023-10-08 13:18:00,739][102897] Updated weights for policy 0, policy_version 38250 (0.0008) +[2023-10-08 13:18:01,099][102897] Updated weights for policy 0, policy_version 38260 (0.0008) +[2023-10-08 13:18:01,476][102897] Updated weights for policy 0, policy_version 38270 (0.0010) +[2023-10-08 13:18:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 78381056. Throughput: 0: 1788.2, 1: 1783.9. Samples: 19605282. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 13:18:01,876][101941] Avg episode reward: [(0, '5.120'), (1, '7.580')] +[2023-10-08 13:18:02,399][102898] Updated weights for policy 1, policy_version 38280 (0.0010) +[2023-10-08 13:18:02,765][102898] Updated weights for policy 1, policy_version 38290 (0.0010) +[2023-10-08 13:18:03,141][102898] Updated weights for policy 1, policy_version 38300 (0.0008) +[2023-10-08 13:18:05,070][102897] Updated weights for policy 0, policy_version 38280 (0.0008) +[2023-10-08 13:18:05,443][102897] Updated weights for policy 0, policy_version 38290 (0.0007) +[2023-10-08 13:18:05,821][102897] Updated weights for policy 0, policy_version 38300 (0.0007) +[2023-10-08 13:18:06,803][102898] Updated weights for policy 1, policy_version 38310 (0.0009) +[2023-10-08 13:18:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 78446592. Throughput: 0: 1793.0, 1: 1776.0. Samples: 19616488. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 13:18:06,876][101941] Avg episode reward: [(0, '5.950'), (1, '8.140')] +[2023-10-08 13:18:07,169][102898] Updated weights for policy 1, policy_version 38320 (0.0007) +[2023-10-08 13:18:07,538][102898] Updated weights for policy 1, policy_version 38330 (0.0007) +[2023-10-08 13:18:09,564][102897] Updated weights for policy 0, policy_version 38310 (0.0010) +[2023-10-08 13:18:09,938][102897] Updated weights for policy 0, policy_version 38320 (0.0008) +[2023-10-08 13:18:10,312][102897] Updated weights for policy 0, policy_version 38330 (0.0010) +[2023-10-08 13:18:11,276][102898] Updated weights for policy 1, policy_version 38340 (0.0008) +[2023-10-08 13:18:11,645][102898] Updated weights for policy 1, policy_version 38350 (0.0009) +[2023-10-08 13:18:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 78512128. Throughput: 0: 1793.3, 1: 1786.0. Samples: 19637688. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 13:18:11,875][101941] Avg episode reward: [(0, '6.570'), (1, '7.840')] +[2023-10-08 13:18:12,013][102898] Updated weights for policy 1, policy_version 38360 (0.0008) +[2023-10-08 13:18:14,072][102897] Updated weights for policy 0, policy_version 38340 (0.0007) +[2023-10-08 13:18:14,447][102897] Updated weights for policy 0, policy_version 38350 (0.0008) +[2023-10-08 13:18:14,819][102897] Updated weights for policy 0, policy_version 38360 (0.0009) +[2023-10-08 13:18:15,804][102898] Updated weights for policy 1, policy_version 38370 (0.0009) +[2023-10-08 13:18:16,207][102898] Updated weights for policy 1, policy_version 38380 (0.0010) +[2023-10-08 13:18:16,571][102898] Updated weights for policy 1, policy_version 38390 (0.0008) +[2023-10-08 13:18:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 78577664. Throughput: 0: 1789.7, 1: 1797.6. Samples: 19659006. Policy #0 lag: (min: 16.0, avg: 36.5, max: 48.0) +[2023-10-08 13:18:16,876][101941] Avg episode reward: [(0, '6.660'), (1, '6.660')] +[2023-10-08 13:18:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000038368_39288832.pth... +[2023-10-08 13:18:16,917][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000036704_37584896.pth +[2023-10-08 13:18:16,934][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000038400_39321600.pth... +[2023-10-08 13:18:16,939][102898] Updated weights for policy 1, policy_version 38400 (0.0008) +[2023-10-08 13:18:16,962][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000036704_37584896.pth +[2023-10-08 13:18:18,581][102897] Updated weights for policy 0, policy_version 38370 (0.0009) +[2023-10-08 13:18:18,976][102897] Updated weights for policy 0, policy_version 38380 (0.0009) +[2023-10-08 13:18:19,336][102897] Updated weights for policy 0, policy_version 38390 (0.0010) +[2023-10-08 13:18:19,703][102897] Updated weights for policy 0, policy_version 38400 (0.0011) +[2023-10-08 13:18:20,656][102898] Updated weights for policy 1, policy_version 38410 (0.0008) +[2023-10-08 13:18:21,030][102898] Updated weights for policy 1, policy_version 38420 (0.0010) +[2023-10-08 13:18:21,390][102898] Updated weights for policy 1, policy_version 38430 (0.0010) +[2023-10-08 13:18:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 78675968. Throughput: 0: 1803.1, 1: 1781.5. Samples: 19670050. Policy #0 lag: (min: 16.0, avg: 36.5, max: 48.0) +[2023-10-08 13:18:21,876][101941] Avg episode reward: [(0, '5.570'), (1, '7.410')] +[2023-10-08 13:18:23,484][102897] Updated weights for policy 0, policy_version 38410 (0.0009) +[2023-10-08 13:18:23,862][102897] Updated weights for policy 0, policy_version 38420 (0.0008) +[2023-10-08 13:18:24,233][102897] Updated weights for policy 0, policy_version 38430 (0.0007) +[2023-10-08 13:18:25,340][102898] Updated weights for policy 1, policy_version 38440 (0.0008) +[2023-10-08 13:18:25,705][102898] Updated weights for policy 1, policy_version 38450 (0.0008) +[2023-10-08 13:18:26,071][102898] Updated weights for policy 1, policy_version 38460 (0.0007) +[2023-10-08 13:18:26,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 78741504. Throughput: 0: 1795.1, 1: 1802.2. Samples: 19691416. Policy #0 lag: (min: 16.0, avg: 36.5, max: 48.0) +[2023-10-08 13:18:26,876][101941] Avg episode reward: [(0, '5.090'), (1, '8.200')] +[2023-10-08 13:18:28,042][102897] Updated weights for policy 0, policy_version 38440 (0.0009) +[2023-10-08 13:18:28,412][102897] Updated weights for policy 0, policy_version 38450 (0.0011) +[2023-10-08 13:18:28,794][102897] Updated weights for policy 0, policy_version 38460 (0.0009) +[2023-10-08 13:18:29,834][102898] Updated weights for policy 1, policy_version 38470 (0.0008) +[2023-10-08 13:18:30,198][102898] Updated weights for policy 1, policy_version 38480 (0.0008) +[2023-10-08 13:18:30,570][102898] Updated weights for policy 1, policy_version 38490 (0.0008) +[2023-10-08 13:18:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 78807040. Throughput: 0: 1789.7, 1: 1781.9. Samples: 19712470. Policy #0 lag: (min: 16.0, avg: 36.5, max: 48.0) +[2023-10-08 13:18:31,876][101941] Avg episode reward: [(0, '5.490'), (1, '7.730')] +[2023-10-08 13:18:32,617][102897] Updated weights for policy 0, policy_version 38470 (0.0009) +[2023-10-08 13:18:32,989][102897] Updated weights for policy 0, policy_version 38480 (0.0010) +[2023-10-08 13:18:33,356][102897] Updated weights for policy 0, policy_version 38490 (0.0010) +[2023-10-08 13:18:34,341][102898] Updated weights for policy 1, policy_version 38500 (0.0009) +[2023-10-08 13:18:34,711][102898] Updated weights for policy 1, policy_version 38510 (0.0010) +[2023-10-08 13:18:35,073][102898] Updated weights for policy 1, policy_version 38520 (0.0011) +[2023-10-08 13:18:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 78872576. Throughput: 0: 1784.3, 1: 1799.2. Samples: 19722970. Policy #0 lag: (min: 16.0, avg: 36.5, max: 48.0) +[2023-10-08 13:18:36,876][101941] Avg episode reward: [(0, '6.340'), (1, '7.330')] +[2023-10-08 13:18:37,270][102897] Updated weights for policy 0, policy_version 38500 (0.0009) +[2023-10-08 13:18:37,638][102897] Updated weights for policy 0, policy_version 38510 (0.0007) +[2023-10-08 13:18:38,018][102897] Updated weights for policy 0, policy_version 38520 (0.0007) +[2023-10-08 13:18:38,962][102898] Updated weights for policy 1, policy_version 38530 (0.0008) +[2023-10-08 13:18:39,329][102898] Updated weights for policy 1, policy_version 38540 (0.0008) +[2023-10-08 13:18:39,689][102898] Updated weights for policy 1, policy_version 38550 (0.0010) +[2023-10-08 13:18:40,057][102898] Updated weights for policy 1, policy_version 38560 (0.0007) +[2023-10-08 13:18:41,803][102897] Updated weights for policy 0, policy_version 38530 (0.0007) +[2023-10-08 13:18:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 78938112. Throughput: 0: 1781.4, 1: 1771.2. Samples: 19743968. Policy #0 lag: (min: 16.0, avg: 36.5, max: 48.0) +[2023-10-08 13:18:41,876][101941] Avg episode reward: [(0, '6.030'), (1, '8.040')] +[2023-10-08 13:18:42,167][102897] Updated weights for policy 0, policy_version 38540 (0.0009) +[2023-10-08 13:18:42,551][102897] Updated weights for policy 0, policy_version 38550 (0.0011) +[2023-10-08 13:18:42,921][102897] Updated weights for policy 0, policy_version 38560 (0.0008) +[2023-10-08 13:18:43,835][102898] Updated weights for policy 1, policy_version 38570 (0.0008) +[2023-10-08 13:18:44,203][102898] Updated weights for policy 1, policy_version 38580 (0.0008) +[2023-10-08 13:18:44,574][102898] Updated weights for policy 1, policy_version 38590 (0.0008) +[2023-10-08 13:18:46,669][102897] Updated weights for policy 0, policy_version 38570 (0.0007) +[2023-10-08 13:18:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 79003648. Throughput: 0: 1803.6, 1: 1772.2. Samples: 19766192. Policy #0 lag: (min: 3.0, avg: 4.8, max: 31.0) +[2023-10-08 13:18:46,876][101941] Avg episode reward: [(0, '6.170'), (1, '8.210')] +[2023-10-08 13:18:47,034][102897] Updated weights for policy 0, policy_version 38580 (0.0008) +[2023-10-08 13:18:47,412][102897] Updated weights for policy 0, policy_version 38590 (0.0008) +[2023-10-08 13:18:48,369][102898] Updated weights for policy 1, policy_version 38600 (0.0009) +[2023-10-08 13:18:48,740][102898] Updated weights for policy 1, policy_version 38610 (0.0009) +[2023-10-08 13:18:49,114][102898] Updated weights for policy 1, policy_version 38620 (0.0008) +[2023-10-08 13:18:51,213][102897] Updated weights for policy 0, policy_version 38600 (0.0008) +[2023-10-08 13:18:51,586][102897] Updated weights for policy 0, policy_version 38610 (0.0010) +[2023-10-08 13:18:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 79069184. Throughput: 0: 1771.7, 1: 1772.3. Samples: 19775966. Policy #0 lag: (min: 3.0, avg: 4.8, max: 31.0) +[2023-10-08 13:18:51,876][101941] Avg episode reward: [(0, '6.740'), (1, '7.330')] +[2023-10-08 13:18:51,960][102897] Updated weights for policy 0, policy_version 38620 (0.0007) +[2023-10-08 13:18:52,839][102898] Updated weights for policy 1, policy_version 38630 (0.0007) +[2023-10-08 13:18:53,209][102898] Updated weights for policy 1, policy_version 38640 (0.0008) +[2023-10-08 13:18:53,569][102898] Updated weights for policy 1, policy_version 38650 (0.0007) +[2023-10-08 13:18:55,651][102897] Updated weights for policy 0, policy_version 38630 (0.0008) +[2023-10-08 13:18:56,017][102897] Updated weights for policy 0, policy_version 38640 (0.0007) +[2023-10-08 13:18:56,386][102897] Updated weights for policy 0, policy_version 38650 (0.0007) +[2023-10-08 13:18:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 79167488. Throughput: 0: 1803.3, 1: 1768.9. Samples: 19798438. Policy #0 lag: (min: 3.0, avg: 4.8, max: 31.0) +[2023-10-08 13:18:56,875][101941] Avg episode reward: [(0, '6.040'), (1, '7.640')] +[2023-10-08 13:18:57,394][102898] Updated weights for policy 1, policy_version 38660 (0.0009) +[2023-10-08 13:18:57,751][102898] Updated weights for policy 1, policy_version 38670 (0.0010) +[2023-10-08 13:18:58,119][102898] Updated weights for policy 1, policy_version 38680 (0.0009) +[2023-10-08 13:19:00,157][102897] Updated weights for policy 0, policy_version 38660 (0.0007) +[2023-10-08 13:19:00,527][102897] Updated weights for policy 0, policy_version 38670 (0.0007) +[2023-10-08 13:19:00,899][102897] Updated weights for policy 0, policy_version 38680 (0.0007) +[2023-10-08 13:19:01,787][102898] Updated weights for policy 1, policy_version 38690 (0.0009) +[2023-10-08 13:19:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 79233024. Throughput: 0: 1769.1, 1: 1792.4. Samples: 19819272. Policy #0 lag: (min: 3.0, avg: 4.8, max: 31.0) +[2023-10-08 13:19:01,876][101941] Avg episode reward: [(0, '5.520'), (1, '8.020')] +[2023-10-08 13:19:02,182][102898] Updated weights for policy 1, policy_version 38700 (0.0009) +[2023-10-08 13:19:02,547][102898] Updated weights for policy 1, policy_version 38710 (0.0008) +[2023-10-08 13:19:02,915][102898] Updated weights for policy 1, policy_version 38720 (0.0008) +[2023-10-08 13:19:04,808][102897] Updated weights for policy 0, policy_version 38690 (0.0009) +[2023-10-08 13:19:05,183][102897] Updated weights for policy 0, policy_version 38700 (0.0010) +[2023-10-08 13:19:05,547][102897] Updated weights for policy 0, policy_version 38710 (0.0010) +[2023-10-08 13:19:05,924][102897] Updated weights for policy 0, policy_version 38720 (0.0010) +[2023-10-08 13:19:06,741][102898] Updated weights for policy 1, policy_version 38730 (0.0007) +[2023-10-08 13:19:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 79298560. Throughput: 0: 1794.9, 1: 1766.9. Samples: 19830330. Policy #0 lag: (min: 3.0, avg: 4.8, max: 31.0) +[2023-10-08 13:19:06,875][101941] Avg episode reward: [(0, '6.240'), (1, '7.500')] +[2023-10-08 13:19:07,100][102898] Updated weights for policy 1, policy_version 38740 (0.0008) +[2023-10-08 13:19:07,463][102898] Updated weights for policy 1, policy_version 38750 (0.0007) +[2023-10-08 13:19:09,779][102897] Updated weights for policy 0, policy_version 38730 (0.0009) +[2023-10-08 13:19:10,154][102897] Updated weights for policy 0, policy_version 38740 (0.0007) +[2023-10-08 13:19:10,529][102897] Updated weights for policy 0, policy_version 38750 (0.0008) +[2023-10-08 13:19:11,247][102898] Updated weights for policy 1, policy_version 38760 (0.0010) +[2023-10-08 13:19:11,612][102898] Updated weights for policy 1, policy_version 38770 (0.0010) +[2023-10-08 13:19:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 79364096. Throughput: 0: 1777.6, 1: 1782.0. Samples: 19851596. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:19:11,876][101941] Avg episode reward: [(0, '6.750'), (1, '7.760')] +[2023-10-08 13:19:11,982][102898] Updated weights for policy 1, policy_version 38780 (0.0011) +[2023-10-08 13:19:14,413][102897] Updated weights for policy 0, policy_version 38760 (0.0008) +[2023-10-08 13:19:14,777][102897] Updated weights for policy 0, policy_version 38770 (0.0008) +[2023-10-08 13:19:15,143][102897] Updated weights for policy 0, policy_version 38780 (0.0008) +[2023-10-08 13:19:15,728][102898] Updated weights for policy 1, policy_version 38790 (0.0010) +[2023-10-08 13:19:16,109][102898] Updated weights for policy 1, policy_version 38800 (0.0008) +[2023-10-08 13:19:16,472][102898] Updated weights for policy 1, policy_version 38810 (0.0008) +[2023-10-08 13:19:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 79462400. Throughput: 0: 1767.8, 1: 1783.1. Samples: 19872258. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:19:16,876][101941] Avg episode reward: [(0, '6.320'), (1, '8.510')] +[2023-10-08 13:19:18,860][102897] Updated weights for policy 0, policy_version 38790 (0.0007) +[2023-10-08 13:19:19,225][102897] Updated weights for policy 0, policy_version 38800 (0.0008) +[2023-10-08 13:19:19,597][102897] Updated weights for policy 0, policy_version 38810 (0.0007) +[2023-10-08 13:19:20,170][102898] Updated weights for policy 1, policy_version 38820 (0.0007) +[2023-10-08 13:19:20,536][102898] Updated weights for policy 1, policy_version 38830 (0.0008) +[2023-10-08 13:19:20,905][102898] Updated weights for policy 1, policy_version 38840 (0.0009) +[2023-10-08 13:19:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 79527936. Throughput: 0: 1782.3, 1: 1787.6. Samples: 19883616. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:19:21,876][101941] Avg episode reward: [(0, '6.120'), (1, '8.900')] +[2023-10-08 13:19:21,878][102760] Saving new best policy, reward=8.900! +[2023-10-08 13:19:23,438][102897] Updated weights for policy 0, policy_version 38820 (0.0007) +[2023-10-08 13:19:23,817][102897] Updated weights for policy 0, policy_version 38830 (0.0009) +[2023-10-08 13:19:24,190][102897] Updated weights for policy 0, policy_version 38840 (0.0007) +[2023-10-08 13:19:24,814][102898] Updated weights for policy 1, policy_version 38850 (0.0008) +[2023-10-08 13:19:25,182][102898] Updated weights for policy 1, policy_version 38860 (0.0009) +[2023-10-08 13:19:25,552][102898] Updated weights for policy 1, policy_version 38870 (0.0008) +[2023-10-08 13:19:25,926][102898] Updated weights for policy 1, policy_version 38880 (0.0007) +[2023-10-08 13:19:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 79593472. Throughput: 0: 1767.4, 1: 1796.2. Samples: 19904332. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:19:26,876][101941] Avg episode reward: [(0, '6.410'), (1, '8.210')] +[2023-10-08 13:19:27,617][102897] Updated weights for policy 0, policy_version 38850 (0.0008) +[2023-10-08 13:19:27,991][102897] Updated weights for policy 0, policy_version 38860 (0.0010) +[2023-10-08 13:19:28,363][102897] Updated weights for policy 0, policy_version 38870 (0.0007) +[2023-10-08 13:19:28,739][102897] Updated weights for policy 0, policy_version 38880 (0.0007) +[2023-10-08 13:19:29,645][102898] Updated weights for policy 1, policy_version 38890 (0.0007) +[2023-10-08 13:19:30,014][102898] Updated weights for policy 1, policy_version 38900 (0.0007) +[2023-10-08 13:19:30,379][102898] Updated weights for policy 1, policy_version 38910 (0.0009) +[2023-10-08 13:19:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 79659008. Throughput: 0: 1772.2, 1: 1782.3. Samples: 19926144. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:19:31,875][101941] Avg episode reward: [(0, '6.910'), (1, '6.890')] +[2023-10-08 13:19:32,616][102897] Updated weights for policy 0, policy_version 38890 (0.0008) +[2023-10-08 13:19:32,988][102897] Updated weights for policy 0, policy_version 38900 (0.0009) +[2023-10-08 13:19:33,363][102897] Updated weights for policy 0, policy_version 38910 (0.0008) +[2023-10-08 13:19:34,075][102898] Updated weights for policy 1, policy_version 38920 (0.0009) +[2023-10-08 13:19:34,459][102898] Updated weights for policy 1, policy_version 38930 (0.0009) +[2023-10-08 13:19:34,828][102898] Updated weights for policy 1, policy_version 38940 (0.0008) +[2023-10-08 13:19:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 79724544. Throughput: 0: 1773.7, 1: 1797.0. Samples: 19936648. Policy #0 lag: (min: 31.0, avg: 36.0, max: 63.0) +[2023-10-08 13:19:36,876][101941] Avg episode reward: [(0, '6.710'), (1, '6.880')] +[2023-10-08 13:19:37,131][102897] Updated weights for policy 0, policy_version 38920 (0.0009) +[2023-10-08 13:19:37,499][102897] Updated weights for policy 0, policy_version 38930 (0.0009) +[2023-10-08 13:19:37,870][102897] Updated weights for policy 0, policy_version 38940 (0.0008) +[2023-10-08 13:19:38,479][102898] Updated weights for policy 1, policy_version 38950 (0.0009) +[2023-10-08 13:19:38,850][102898] Updated weights for policy 1, policy_version 38960 (0.0007) +[2023-10-08 13:19:39,221][102898] Updated weights for policy 1, policy_version 38970 (0.0008) +[2023-10-08 13:19:41,506][102897] Updated weights for policy 0, policy_version 38950 (0.0010) +[2023-10-08 13:19:41,870][102897] Updated weights for policy 0, policy_version 38960 (0.0009) +[2023-10-08 13:19:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 79790080. Throughput: 0: 1772.9, 1: 1784.1. Samples: 19958502. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:19:41,875][101941] Avg episode reward: [(0, '6.570'), (1, '7.150')] +[2023-10-08 13:19:42,242][102897] Updated weights for policy 0, policy_version 38970 (0.0008) +[2023-10-08 13:19:42,982][102898] Updated weights for policy 1, policy_version 38980 (0.0008) +[2023-10-08 13:19:43,349][102898] Updated weights for policy 1, policy_version 38990 (0.0007) +[2023-10-08 13:19:43,720][102898] Updated weights for policy 1, policy_version 39000 (0.0009) +[2023-10-08 13:19:46,042][102897] Updated weights for policy 0, policy_version 38980 (0.0008) +[2023-10-08 13:19:46,422][102897] Updated weights for policy 0, policy_version 38990 (0.0010) +[2023-10-08 13:19:46,802][102897] Updated weights for policy 0, policy_version 39000 (0.0008) +[2023-10-08 13:19:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 79855616. Throughput: 0: 1797.5, 1: 1782.4. Samples: 19980366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:19:46,876][101941] Avg episode reward: [(0, '6.410'), (1, '7.890')] +[2023-10-08 13:19:47,533][102898] Updated weights for policy 1, policy_version 39010 (0.0008) +[2023-10-08 13:19:47,937][102898] Updated weights for policy 1, policy_version 39020 (0.0010) +[2023-10-08 13:19:48,314][102898] Updated weights for policy 1, policy_version 39030 (0.0008) +[2023-10-08 13:19:48,669][102898] Updated weights for policy 1, policy_version 39040 (0.0007) +[2023-10-08 13:19:50,585][102897] Updated weights for policy 0, policy_version 39010 (0.0008) +[2023-10-08 13:19:50,984][102897] Updated weights for policy 0, policy_version 39020 (0.0008) +[2023-10-08 13:19:51,347][102897] Updated weights for policy 0, policy_version 39030 (0.0007) +[2023-10-08 13:19:51,716][102897] Updated weights for policy 0, policy_version 39040 (0.0007) +[2023-10-08 13:19:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 79953920. Throughput: 0: 1778.0, 1: 1783.9. Samples: 19990612. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:19:51,876][101941] Avg episode reward: [(0, '6.200'), (1, '8.040')] +[2023-10-08 13:19:52,293][102898] Updated weights for policy 1, policy_version 39050 (0.0007) +[2023-10-08 13:19:52,656][102898] Updated weights for policy 1, policy_version 39060 (0.0008) +[2023-10-08 13:19:53,027][102898] Updated weights for policy 1, policy_version 39070 (0.0009) +[2023-10-08 13:19:55,508][102897] Updated weights for policy 0, policy_version 39050 (0.0008) +[2023-10-08 13:19:55,880][102897] Updated weights for policy 0, policy_version 39060 (0.0008) +[2023-10-08 13:19:56,253][102897] Updated weights for policy 0, policy_version 39070 (0.0008) +[2023-10-08 13:19:56,765][102898] Updated weights for policy 1, policy_version 39080 (0.0009) +[2023-10-08 13:19:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 80019456. Throughput: 0: 1794.8, 1: 1782.1. Samples: 20012558. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:19:56,876][101941] Avg episode reward: [(0, '5.770'), (1, '7.220')] +[2023-10-08 13:19:57,133][102898] Updated weights for policy 1, policy_version 39090 (0.0010) +[2023-10-08 13:19:57,500][102898] Updated weights for policy 1, policy_version 39100 (0.0009) +[2023-10-08 13:19:59,934][102897] Updated weights for policy 0, policy_version 39080 (0.0009) +[2023-10-08 13:20:00,301][102897] Updated weights for policy 0, policy_version 39090 (0.0009) +[2023-10-08 13:20:00,683][102897] Updated weights for policy 0, policy_version 39100 (0.0008) +[2023-10-08 13:20:01,409][102898] Updated weights for policy 1, policy_version 39110 (0.0009) +[2023-10-08 13:20:01,770][102898] Updated weights for policy 1, policy_version 39120 (0.0010) +[2023-10-08 13:20:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 80084992. Throughput: 0: 1785.6, 1: 1797.8. Samples: 20033512. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:20:01,876][101941] Avg episode reward: [(0, '6.140'), (1, '7.050')] +[2023-10-08 13:20:02,134][102898] Updated weights for policy 1, policy_version 39130 (0.0009) +[2023-10-08 13:20:04,461][102897] Updated weights for policy 0, policy_version 39110 (0.0009) +[2023-10-08 13:20:04,833][102897] Updated weights for policy 0, policy_version 39120 (0.0010) +[2023-10-08 13:20:05,208][102897] Updated weights for policy 0, policy_version 39130 (0.0009) +[2023-10-08 13:20:06,083][102898] Updated weights for policy 1, policy_version 39140 (0.0009) +[2023-10-08 13:20:06,447][102898] Updated weights for policy 1, policy_version 39150 (0.0008) +[2023-10-08 13:20:06,814][102898] Updated weights for policy 1, policy_version 39160 (0.0007) +[2023-10-08 13:20:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 80150528. Throughput: 0: 1806.6, 1: 1780.0. Samples: 20045016. Policy #0 lag: (min: 20.0, avg: 20.1, max: 26.0) +[2023-10-08 13:20:06,876][101941] Avg episode reward: [(0, '6.740'), (1, '7.660')] +[2023-10-08 13:20:08,972][102897] Updated weights for policy 0, policy_version 39140 (0.0007) +[2023-10-08 13:20:09,343][102897] Updated weights for policy 0, policy_version 39150 (0.0007) +[2023-10-08 13:20:09,714][102897] Updated weights for policy 0, policy_version 39160 (0.0009) +[2023-10-08 13:20:10,662][102898] Updated weights for policy 1, policy_version 39170 (0.0008) +[2023-10-08 13:20:11,034][102898] Updated weights for policy 1, policy_version 39180 (0.0011) +[2023-10-08 13:20:11,407][102898] Updated weights for policy 1, policy_version 39190 (0.0009) +[2023-10-08 13:20:11,770][102898] Updated weights for policy 1, policy_version 39200 (0.0010) +[2023-10-08 13:20:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.2). Total num frames: 80248832. Throughput: 0: 1793.8, 1: 1803.3. Samples: 20066200. Policy #0 lag: (min: 20.0, avg: 20.1, max: 26.0) +[2023-10-08 13:20:11,875][101941] Avg episode reward: [(0, '7.030'), (1, '7.490')] +[2023-10-08 13:20:13,478][102897] Updated weights for policy 0, policy_version 39170 (0.0009) +[2023-10-08 13:20:13,856][102897] Updated weights for policy 0, policy_version 39180 (0.0007) +[2023-10-08 13:20:14,226][102897] Updated weights for policy 0, policy_version 39190 (0.0007) +[2023-10-08 13:20:14,594][102897] Updated weights for policy 0, policy_version 39200 (0.0007) +[2023-10-08 13:20:15,459][102898] Updated weights for policy 1, policy_version 39210 (0.0008) +[2023-10-08 13:20:15,824][102898] Updated weights for policy 1, policy_version 39220 (0.0009) +[2023-10-08 13:20:16,192][102898] Updated weights for policy 1, policy_version 39230 (0.0007) +[2023-10-08 13:20:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 80314368. Throughput: 0: 1793.8, 1: 1783.6. Samples: 20087128. Policy #0 lag: (min: 20.0, avg: 20.1, max: 26.0) +[2023-10-08 13:20:16,875][101941] Avg episode reward: [(0, '7.110'), (1, '7.680')] +[2023-10-08 13:20:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000039232_40173568.pth... +[2023-10-08 13:20:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000039200_40140800.pth... +[2023-10-08 13:20:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000037536_38436864.pth +[2023-10-08 13:20:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000037568_38469632.pth +[2023-10-08 13:20:18,360][102897] Updated weights for policy 0, policy_version 39210 (0.0010) +[2023-10-08 13:20:18,728][102897] Updated weights for policy 0, policy_version 39220 (0.0008) +[2023-10-08 13:20:19,102][102897] Updated weights for policy 0, policy_version 39230 (0.0008) +[2023-10-08 13:20:19,654][102898] Updated weights for policy 1, policy_version 39240 (0.0010) +[2023-10-08 13:20:20,032][102898] Updated weights for policy 1, policy_version 39250 (0.0010) +[2023-10-08 13:20:20,399][102898] Updated weights for policy 1, policy_version 39260 (0.0010) +[2023-10-08 13:20:21,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 80379904. Throughput: 0: 1790.8, 1: 1806.4. Samples: 20098524. Policy #0 lag: (min: 20.0, avg: 20.1, max: 26.0) +[2023-10-08 13:20:21,876][101941] Avg episode reward: [(0, '6.890'), (1, '8.060')] +[2023-10-08 13:20:22,765][102897] Updated weights for policy 0, policy_version 39240 (0.0009) +[2023-10-08 13:20:23,138][102897] Updated weights for policy 0, policy_version 39250 (0.0008) +[2023-10-08 13:20:23,520][102897] Updated weights for policy 0, policy_version 39260 (0.0007) +[2023-10-08 13:20:24,143][102898] Updated weights for policy 1, policy_version 39270 (0.0011) +[2023-10-08 13:20:24,523][102898] Updated weights for policy 1, policy_version 39280 (0.0009) +[2023-10-08 13:20:24,881][102898] Updated weights for policy 1, policy_version 39290 (0.0007) +[2023-10-08 13:20:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 80445440. Throughput: 0: 1795.0, 1: 1790.0. Samples: 20119828. Policy #0 lag: (min: 20.0, avg: 20.1, max: 26.0) +[2023-10-08 13:20:26,875][101941] Avg episode reward: [(0, '6.130'), (1, '8.420')] +[2023-10-08 13:20:27,284][102897] Updated weights for policy 0, policy_version 39270 (0.0010) +[2023-10-08 13:20:27,656][102897] Updated weights for policy 0, policy_version 39280 (0.0007) +[2023-10-08 13:20:28,040][102897] Updated weights for policy 0, policy_version 39290 (0.0009) +[2023-10-08 13:20:28,742][102898] Updated weights for policy 1, policy_version 39300 (0.0009) +[2023-10-08 13:20:29,108][102898] Updated weights for policy 1, policy_version 39310 (0.0009) +[2023-10-08 13:20:29,479][102898] Updated weights for policy 1, policy_version 39320 (0.0008) +[2023-10-08 13:20:31,765][102897] Updated weights for policy 0, policy_version 39300 (0.0009) +[2023-10-08 13:20:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 80510976. Throughput: 0: 1806.4, 1: 1788.2. Samples: 20142122. Policy #0 lag: (min: 20.0, avg: 20.1, max: 26.0) +[2023-10-08 13:20:31,876][101941] Avg episode reward: [(0, '6.180'), (1, '7.670')] +[2023-10-08 13:20:32,142][102897] Updated weights for policy 0, policy_version 39310 (0.0008) +[2023-10-08 13:20:32,516][102897] Updated weights for policy 0, policy_version 39320 (0.0008) +[2023-10-08 13:20:33,142][102898] Updated weights for policy 1, policy_version 39330 (0.0008) +[2023-10-08 13:20:33,533][102898] Updated weights for policy 1, policy_version 39340 (0.0008) +[2023-10-08 13:20:33,889][102898] Updated weights for policy 1, policy_version 39350 (0.0009) +[2023-10-08 13:20:34,262][102898] Updated weights for policy 1, policy_version 39360 (0.0008) +[2023-10-08 13:20:36,407][102897] Updated weights for policy 0, policy_version 39330 (0.0007) +[2023-10-08 13:20:36,803][102897] Updated weights for policy 0, policy_version 39340 (0.0009) +[2023-10-08 13:20:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 80576512. Throughput: 0: 1788.5, 1: 1791.5. Samples: 20151714. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:20:36,876][101941] Avg episode reward: [(0, '5.850'), (1, '7.250')] +[2023-10-08 13:20:37,162][102897] Updated weights for policy 0, policy_version 39350 (0.0008) +[2023-10-08 13:20:37,537][102897] Updated weights for policy 0, policy_version 39360 (0.0007) +[2023-10-08 13:20:38,026][102898] Updated weights for policy 1, policy_version 39370 (0.0008) +[2023-10-08 13:20:38,389][102898] Updated weights for policy 1, policy_version 39380 (0.0007) +[2023-10-08 13:20:38,762][102898] Updated weights for policy 1, policy_version 39390 (0.0008) +[2023-10-08 13:20:41,279][102897] Updated weights for policy 0, policy_version 39370 (0.0010) +[2023-10-08 13:20:41,652][102897] Updated weights for policy 0, policy_version 39380 (0.0010) +[2023-10-08 13:20:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 80642048. Throughput: 0: 1795.2, 1: 1787.5. Samples: 20173778. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:20:41,875][101941] Avg episode reward: [(0, '6.110'), (1, '7.450')] +[2023-10-08 13:20:42,022][102897] Updated weights for policy 0, policy_version 39390 (0.0009) +[2023-10-08 13:20:42,647][102898] Updated weights for policy 1, policy_version 39400 (0.0009) +[2023-10-08 13:20:43,008][102898] Updated weights for policy 1, policy_version 39410 (0.0011) +[2023-10-08 13:20:43,385][102898] Updated weights for policy 1, policy_version 39420 (0.0009) +[2023-10-08 13:20:45,701][102897] Updated weights for policy 0, policy_version 39400 (0.0009) +[2023-10-08 13:20:46,062][102897] Updated weights for policy 0, policy_version 39410 (0.0008) +[2023-10-08 13:20:46,440][102897] Updated weights for policy 0, policy_version 39420 (0.0008) +[2023-10-08 13:20:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 80740352. Throughput: 0: 1794.8, 1: 1795.0. Samples: 20195052. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:20:46,876][101941] Avg episode reward: [(0, '6.440'), (1, '7.420')] +[2023-10-08 13:20:47,055][102898] Updated weights for policy 1, policy_version 39430 (0.0007) +[2023-10-08 13:20:47,409][102898] Updated weights for policy 1, policy_version 39440 (0.0007) +[2023-10-08 13:20:47,771][102898] Updated weights for policy 1, policy_version 39450 (0.0008) +[2023-10-08 13:20:50,264][102897] Updated weights for policy 0, policy_version 39430 (0.0009) +[2023-10-08 13:20:50,625][102897] Updated weights for policy 0, policy_version 39440 (0.0008) +[2023-10-08 13:20:51,004][102897] Updated weights for policy 0, policy_version 39450 (0.0007) +[2023-10-08 13:20:51,570][102898] Updated weights for policy 1, policy_version 39460 (0.0009) +[2023-10-08 13:20:51,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 80805888. Throughput: 0: 1786.9, 1: 1786.6. Samples: 20205824. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:20:51,876][101941] Avg episode reward: [(0, '6.230'), (1, '7.660')] +[2023-10-08 13:20:51,949][102898] Updated weights for policy 1, policy_version 39470 (0.0008) +[2023-10-08 13:20:52,312][102898] Updated weights for policy 1, policy_version 39480 (0.0009) +[2023-10-08 13:20:54,719][102897] Updated weights for policy 0, policy_version 39460 (0.0007) +[2023-10-08 13:20:55,090][102897] Updated weights for policy 0, policy_version 39470 (0.0008) +[2023-10-08 13:20:55,465][102897] Updated weights for policy 0, policy_version 39480 (0.0009) +[2023-10-08 13:20:56,190][102898] Updated weights for policy 1, policy_version 39490 (0.0007) +[2023-10-08 13:20:56,568][102898] Updated weights for policy 1, policy_version 39500 (0.0007) +[2023-10-08 13:20:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 80871424. Throughput: 0: 1794.4, 1: 1783.2. Samples: 20227196. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:20:56,876][101941] Avg episode reward: [(0, '6.360'), (1, '8.280')] +[2023-10-08 13:20:56,924][102898] Updated weights for policy 1, policy_version 39510 (0.0007) +[2023-10-08 13:20:57,293][102898] Updated weights for policy 1, policy_version 39520 (0.0008) +[2023-10-08 13:20:59,300][102897] Updated weights for policy 0, policy_version 39490 (0.0009) +[2023-10-08 13:20:59,666][102897] Updated weights for policy 0, policy_version 39500 (0.0007) +[2023-10-08 13:21:00,033][102897] Updated weights for policy 0, policy_version 39510 (0.0007) +[2023-10-08 13:21:00,407][102897] Updated weights for policy 0, policy_version 39520 (0.0010) +[2023-10-08 13:21:01,104][102898] Updated weights for policy 1, policy_version 39530 (0.0008) +[2023-10-08 13:21:01,483][102898] Updated weights for policy 1, policy_version 39540 (0.0009) +[2023-10-08 13:21:01,851][102898] Updated weights for policy 1, policy_version 39550 (0.0009) +[2023-10-08 13:21:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 80936960. Throughput: 0: 1776.9, 1: 1798.9. Samples: 20248042. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 13:21:01,876][101941] Avg episode reward: [(0, '7.120'), (1, '8.270')] +[2023-10-08 13:21:04,182][102897] Updated weights for policy 0, policy_version 39530 (0.0009) +[2023-10-08 13:21:04,553][102897] Updated weights for policy 0, policy_version 39540 (0.0010) +[2023-10-08 13:21:04,922][102897] Updated weights for policy 0, policy_version 39550 (0.0009) +[2023-10-08 13:21:05,539][102898] Updated weights for policy 1, policy_version 39560 (0.0011) +[2023-10-08 13:21:05,917][102898] Updated weights for policy 1, policy_version 39570 (0.0009) +[2023-10-08 13:21:06,292][102898] Updated weights for policy 1, policy_version 39580 (0.0007) +[2023-10-08 13:21:06,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 81035264. Throughput: 0: 1793.2, 1: 1786.0. Samples: 20259586. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 13:21:06,876][101941] Avg episode reward: [(0, '6.720'), (1, '7.620')] +[2023-10-08 13:21:08,633][102897] Updated weights for policy 0, policy_version 39560 (0.0009) +[2023-10-08 13:21:09,002][102897] Updated weights for policy 0, policy_version 39570 (0.0007) +[2023-10-08 13:21:09,379][102897] Updated weights for policy 0, policy_version 39580 (0.0008) +[2023-10-08 13:21:10,091][102898] Updated weights for policy 1, policy_version 39590 (0.0007) +[2023-10-08 13:21:10,462][102898] Updated weights for policy 1, policy_version 39600 (0.0008) +[2023-10-08 13:21:10,833][102898] Updated weights for policy 1, policy_version 39610 (0.0007) +[2023-10-08 13:21:11,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 81100800. Throughput: 0: 1771.4, 1: 1802.3. Samples: 20280646. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 13:21:11,876][101941] Avg episode reward: [(0, '6.300'), (1, '7.780')] +[2023-10-08 13:21:13,097][102897] Updated weights for policy 0, policy_version 39590 (0.0010) +[2023-10-08 13:21:13,477][102897] Updated weights for policy 0, policy_version 39600 (0.0010) +[2023-10-08 13:21:13,844][102897] Updated weights for policy 0, policy_version 39610 (0.0010) +[2023-10-08 13:21:14,754][102898] Updated weights for policy 1, policy_version 39620 (0.0009) +[2023-10-08 13:21:15,116][102898] Updated weights for policy 1, policy_version 39630 (0.0010) +[2023-10-08 13:21:15,485][102898] Updated weights for policy 1, policy_version 39640 (0.0008) +[2023-10-08 13:21:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 81166336. Throughput: 0: 1777.2, 1: 1784.0. Samples: 20302376. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 13:21:16,875][101941] Avg episode reward: [(0, '6.760'), (1, '8.370')] +[2023-10-08 13:21:17,450][102897] Updated weights for policy 0, policy_version 39620 (0.0008) +[2023-10-08 13:21:17,821][102897] Updated weights for policy 0, policy_version 39630 (0.0007) +[2023-10-08 13:21:18,190][102897] Updated weights for policy 0, policy_version 39640 (0.0008) +[2023-10-08 13:21:19,086][102898] Updated weights for policy 1, policy_version 39650 (0.0008) +[2023-10-08 13:21:19,503][102898] Updated weights for policy 1, policy_version 39660 (0.0008) +[2023-10-08 13:21:19,870][102898] Updated weights for policy 1, policy_version 39670 (0.0008) +[2023-10-08 13:21:20,226][102898] Updated weights for policy 1, policy_version 39680 (0.0008) +[2023-10-08 13:21:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 81231872. Throughput: 0: 1779.7, 1: 1807.7. Samples: 20313146. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 13:21:21,875][101941] Avg episode reward: [(0, '7.090'), (1, '8.140')] +[2023-10-08 13:21:21,905][102897] Updated weights for policy 0, policy_version 39650 (0.0008) +[2023-10-08 13:21:22,272][102897] Updated weights for policy 0, policy_version 39660 (0.0008) +[2023-10-08 13:21:22,645][102897] Updated weights for policy 0, policy_version 39670 (0.0010) +[2023-10-08 13:21:23,016][102897] Updated weights for policy 0, policy_version 39680 (0.0009) +[2023-10-08 13:21:23,837][102898] Updated weights for policy 1, policy_version 39690 (0.0008) +[2023-10-08 13:21:24,210][102898] Updated weights for policy 1, policy_version 39700 (0.0011) +[2023-10-08 13:21:24,580][102898] Updated weights for policy 1, policy_version 39710 (0.0008) +[2023-10-08 13:21:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 81297408. Throughput: 0: 1787.1, 1: 1784.3. Samples: 20334492. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 13:21:26,876][101941] Avg episode reward: [(0, '6.830'), (1, '7.750')] +[2023-10-08 13:21:26,906][102897] Updated weights for policy 0, policy_version 39690 (0.0009) +[2023-10-08 13:21:27,273][102897] Updated weights for policy 0, policy_version 39700 (0.0009) +[2023-10-08 13:21:27,638][102897] Updated weights for policy 0, policy_version 39710 (0.0007) +[2023-10-08 13:21:28,407][102898] Updated weights for policy 1, policy_version 39720 (0.0008) +[2023-10-08 13:21:28,774][102898] Updated weights for policy 1, policy_version 39730 (0.0008) +[2023-10-08 13:21:29,143][102898] Updated weights for policy 1, policy_version 39740 (0.0010) +[2023-10-08 13:21:31,499][102897] Updated weights for policy 0, policy_version 39720 (0.0008) +[2023-10-08 13:21:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 81362944. Throughput: 0: 1805.3, 1: 1788.0. Samples: 20356754. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:21:31,875][101941] Avg episode reward: [(0, '6.710'), (1, '7.920')] +[2023-10-08 13:21:31,877][102897] Updated weights for policy 0, policy_version 39730 (0.0012) +[2023-10-08 13:21:32,248][102897] Updated weights for policy 0, policy_version 39740 (0.0009) +[2023-10-08 13:21:32,932][102898] Updated weights for policy 1, policy_version 39750 (0.0011) +[2023-10-08 13:21:33,303][102898] Updated weights for policy 1, policy_version 39760 (0.0008) +[2023-10-08 13:21:33,669][102898] Updated weights for policy 1, policy_version 39770 (0.0007) +[2023-10-08 13:21:36,030][102897] Updated weights for policy 0, policy_version 39750 (0.0009) +[2023-10-08 13:21:36,397][102897] Updated weights for policy 0, policy_version 39760 (0.0007) +[2023-10-08 13:21:36,765][102897] Updated weights for policy 0, policy_version 39770 (0.0008) +[2023-10-08 13:21:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 81428480. Throughput: 0: 1788.1, 1: 1788.8. Samples: 20366788. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:21:36,876][101941] Avg episode reward: [(0, '6.310'), (1, '7.860')] +[2023-10-08 13:21:37,501][102898] Updated weights for policy 1, policy_version 39780 (0.0007) +[2023-10-08 13:21:37,871][102898] Updated weights for policy 1, policy_version 39790 (0.0008) +[2023-10-08 13:21:38,234][102898] Updated weights for policy 1, policy_version 39800 (0.0010) +[2023-10-08 13:21:40,462][102897] Updated weights for policy 0, policy_version 39780 (0.0007) +[2023-10-08 13:21:40,833][102897] Updated weights for policy 0, policy_version 39790 (0.0008) +[2023-10-08 13:21:41,195][102897] Updated weights for policy 0, policy_version 39800 (0.0009) +[2023-10-08 13:21:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 81526784. Throughput: 0: 1813.7, 1: 1790.7. Samples: 20389392. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:21:41,876][101941] Avg episode reward: [(0, '6.480'), (1, '6.940')] +[2023-10-08 13:21:42,010][102898] Updated weights for policy 1, policy_version 39810 (0.0008) +[2023-10-08 13:21:42,365][102898] Updated weights for policy 1, policy_version 39820 (0.0008) +[2023-10-08 13:21:42,731][102898] Updated weights for policy 1, policy_version 39830 (0.0008) +[2023-10-08 13:21:43,107][102898] Updated weights for policy 1, policy_version 39840 (0.0008) +[2023-10-08 13:21:44,856][102897] Updated weights for policy 0, policy_version 39810 (0.0008) +[2023-10-08 13:21:45,229][102897] Updated weights for policy 0, policy_version 39820 (0.0010) +[2023-10-08 13:21:45,588][102897] Updated weights for policy 0, policy_version 39830 (0.0007) +[2023-10-08 13:21:45,960][102897] Updated weights for policy 0, policy_version 39840 (0.0010) +[2023-10-08 13:21:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 81592320. Throughput: 0: 1798.1, 1: 1808.4. Samples: 20410336. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:21:46,876][101941] Avg episode reward: [(0, '6.860'), (1, '7.110')] +[2023-10-08 13:21:46,912][102898] Updated weights for policy 1, policy_version 39850 (0.0008) +[2023-10-08 13:21:47,285][102898] Updated weights for policy 1, policy_version 39860 (0.0010) +[2023-10-08 13:21:47,641][102898] Updated weights for policy 1, policy_version 39870 (0.0009) +[2023-10-08 13:21:49,893][102897] Updated weights for policy 0, policy_version 39850 (0.0008) +[2023-10-08 13:21:50,261][102897] Updated weights for policy 0, policy_version 39860 (0.0008) +[2023-10-08 13:21:50,636][102897] Updated weights for policy 0, policy_version 39870 (0.0008) +[2023-10-08 13:21:51,444][102898] Updated weights for policy 1, policy_version 39880 (0.0010) +[2023-10-08 13:21:51,816][102898] Updated weights for policy 1, policy_version 39890 (0.0010) +[2023-10-08 13:21:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 81657856. Throughput: 0: 1813.2, 1: 1783.0. Samples: 20421414. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:21:51,875][101941] Avg episode reward: [(0, '6.530'), (1, '7.030')] +[2023-10-08 13:21:52,174][102898] Updated weights for policy 1, policy_version 39900 (0.0007) +[2023-10-08 13:21:54,337][102897] Updated weights for policy 0, policy_version 39880 (0.0008) +[2023-10-08 13:21:54,708][102897] Updated weights for policy 0, policy_version 39890 (0.0008) +[2023-10-08 13:21:55,078][102897] Updated weights for policy 0, policy_version 39900 (0.0007) +[2023-10-08 13:21:55,890][102898] Updated weights for policy 1, policy_version 39910 (0.0008) +[2023-10-08 13:21:56,248][102898] Updated weights for policy 1, policy_version 39920 (0.0008) +[2023-10-08 13:21:56,628][102898] Updated weights for policy 1, policy_version 39930 (0.0007) +[2023-10-08 13:21:56,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 81756160. Throughput: 0: 1795.0, 1: 1795.4. Samples: 20442212. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 13:21:56,876][101941] Avg episode reward: [(0, '6.220'), (1, '7.490')] +[2023-10-08 13:21:58,761][102897] Updated weights for policy 0, policy_version 39910 (0.0009) +[2023-10-08 13:21:59,130][102897] Updated weights for policy 0, policy_version 39920 (0.0009) +[2023-10-08 13:21:59,506][102897] Updated weights for policy 0, policy_version 39930 (0.0007) +[2023-10-08 13:22:00,202][102898] Updated weights for policy 1, policy_version 39940 (0.0008) +[2023-10-08 13:22:00,578][102898] Updated weights for policy 1, policy_version 39950 (0.0007) +[2023-10-08 13:22:00,949][102898] Updated weights for policy 1, policy_version 39960 (0.0007) +[2023-10-08 13:22:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 81821696. Throughput: 0: 1791.7, 1: 1785.7. Samples: 20463362. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 13:22:01,876][101941] Avg episode reward: [(0, '6.590'), (1, '7.670')] +[2023-10-08 13:22:03,208][102897] Updated weights for policy 0, policy_version 39940 (0.0009) +[2023-10-08 13:22:03,578][102897] Updated weights for policy 0, policy_version 39950 (0.0009) +[2023-10-08 13:22:03,952][102897] Updated weights for policy 0, policy_version 39960 (0.0009) +[2023-10-08 13:22:04,807][102898] Updated weights for policy 1, policy_version 39970 (0.0008) +[2023-10-08 13:22:05,184][102898] Updated weights for policy 1, policy_version 39980 (0.0007) +[2023-10-08 13:22:05,549][102898] Updated weights for policy 1, policy_version 39990 (0.0010) +[2023-10-08 13:22:05,913][102898] Updated weights for policy 1, policy_version 40000 (0.0008) +[2023-10-08 13:22:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 81887232. Throughput: 0: 1791.7, 1: 1791.8. Samples: 20474404. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 13:22:06,876][101941] Avg episode reward: [(0, '6.710'), (1, '6.860')] +[2023-10-08 13:22:07,860][102897] Updated weights for policy 0, policy_version 39970 (0.0009) +[2023-10-08 13:22:08,248][102897] Updated weights for policy 0, policy_version 39980 (0.0007) +[2023-10-08 13:22:08,622][102897] Updated weights for policy 0, policy_version 39990 (0.0009) +[2023-10-08 13:22:08,993][102897] Updated weights for policy 0, policy_version 40000 (0.0009) +[2023-10-08 13:22:09,620][102898] Updated weights for policy 1, policy_version 40010 (0.0007) +[2023-10-08 13:22:09,984][102898] Updated weights for policy 1, policy_version 40020 (0.0007) +[2023-10-08 13:22:10,357][102898] Updated weights for policy 1, policy_version 40030 (0.0009) +[2023-10-08 13:22:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 81952768. Throughput: 0: 1787.3, 1: 1791.6. Samples: 20495546. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 13:22:11,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.450')] +[2023-10-08 13:22:12,741][102897] Updated weights for policy 0, policy_version 40010 (0.0008) +[2023-10-08 13:22:13,111][102897] Updated weights for policy 0, policy_version 40020 (0.0009) +[2023-10-08 13:22:13,478][102897] Updated weights for policy 0, policy_version 40030 (0.0007) +[2023-10-08 13:22:14,262][102898] Updated weights for policy 1, policy_version 40040 (0.0010) +[2023-10-08 13:22:14,635][102898] Updated weights for policy 1, policy_version 40050 (0.0010) +[2023-10-08 13:22:15,010][102898] Updated weights for policy 1, policy_version 40060 (0.0010) +[2023-10-08 13:22:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 82018304. Throughput: 0: 1787.2, 1: 1783.2. Samples: 20517424. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 13:22:16,876][101941] Avg episode reward: [(0, '6.340'), (1, '8.120')] +[2023-10-08 13:22:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000040064_41025536.pth... +[2023-10-08 13:22:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000040032_40992768.pth... +[2023-10-08 13:22:16,918][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000038400_39321600.pth +[2023-10-08 13:22:16,930][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000038368_39288832.pth +[2023-10-08 13:22:17,457][102897] Updated weights for policy 0, policy_version 40040 (0.0007) +[2023-10-08 13:22:17,839][102897] Updated weights for policy 0, policy_version 40050 (0.0007) +[2023-10-08 13:22:18,218][102897] Updated weights for policy 0, policy_version 40060 (0.0009) +[2023-10-08 13:22:18,657][102898] Updated weights for policy 1, policy_version 40070 (0.0010) +[2023-10-08 13:22:19,025][102898] Updated weights for policy 1, policy_version 40080 (0.0010) +[2023-10-08 13:22:19,387][102898] Updated weights for policy 1, policy_version 40090 (0.0007) +[2023-10-08 13:22:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 82083840. Throughput: 0: 1777.7, 1: 1787.3. Samples: 20527212. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 13:22:21,876][101941] Avg episode reward: [(0, '6.220'), (1, '8.010')] +[2023-10-08 13:22:22,021][102897] Updated weights for policy 0, policy_version 40070 (0.0008) +[2023-10-08 13:22:22,389][102897] Updated weights for policy 0, policy_version 40080 (0.0008) +[2023-10-08 13:22:22,769][102897] Updated weights for policy 0, policy_version 40090 (0.0007) +[2023-10-08 13:22:23,214][102898] Updated weights for policy 1, policy_version 40100 (0.0007) +[2023-10-08 13:22:23,578][102898] Updated weights for policy 1, policy_version 40110 (0.0008) +[2023-10-08 13:22:23,941][102898] Updated weights for policy 1, policy_version 40120 (0.0008) +[2023-10-08 13:22:26,302][102897] Updated weights for policy 0, policy_version 40100 (0.0010) +[2023-10-08 13:22:26,680][102897] Updated weights for policy 0, policy_version 40110 (0.0010) +[2023-10-08 13:22:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 82149376. Throughput: 0: 1775.9, 1: 1778.9. Samples: 20549360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:22:26,875][101941] Avg episode reward: [(0, '6.280'), (1, '6.940')] +[2023-10-08 13:22:27,058][102897] Updated weights for policy 0, policy_version 40120 (0.0009) +[2023-10-08 13:22:27,690][102898] Updated weights for policy 1, policy_version 40130 (0.0009) +[2023-10-08 13:22:28,065][102898] Updated weights for policy 1, policy_version 40140 (0.0010) +[2023-10-08 13:22:28,439][102898] Updated weights for policy 1, policy_version 40150 (0.0009) +[2023-10-08 13:22:28,804][102898] Updated weights for policy 1, policy_version 40160 (0.0007) +[2023-10-08 13:22:30,718][102897] Updated weights for policy 0, policy_version 40130 (0.0008) +[2023-10-08 13:22:31,086][102897] Updated weights for policy 0, policy_version 40140 (0.0009) +[2023-10-08 13:22:31,461][102897] Updated weights for policy 0, policy_version 40150 (0.0008) +[2023-10-08 13:22:31,838][102897] Updated weights for policy 0, policy_version 40160 (0.0007) +[2023-10-08 13:22:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 82247680. Throughput: 0: 1787.2, 1: 1785.9. Samples: 20571122. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:22:31,876][101941] Avg episode reward: [(0, '6.440'), (1, '7.270')] +[2023-10-08 13:22:32,495][102898] Updated weights for policy 1, policy_version 40170 (0.0011) +[2023-10-08 13:22:32,865][102898] Updated weights for policy 1, policy_version 40180 (0.0010) +[2023-10-08 13:22:33,224][102898] Updated weights for policy 1, policy_version 40190 (0.0009) +[2023-10-08 13:22:35,766][102897] Updated weights for policy 0, policy_version 40170 (0.0008) +[2023-10-08 13:22:36,140][102897] Updated weights for policy 0, policy_version 40180 (0.0008) +[2023-10-08 13:22:36,516][102897] Updated weights for policy 0, policy_version 40190 (0.0009) +[2023-10-08 13:22:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 82313216. Throughput: 0: 1772.8, 1: 1788.0. Samples: 20581648. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:22:36,876][101941] Avg episode reward: [(0, '6.730'), (1, '7.570')] +[2023-10-08 13:22:36,979][102898] Updated weights for policy 1, policy_version 40200 (0.0008) +[2023-10-08 13:22:37,341][102898] Updated weights for policy 1, policy_version 40210 (0.0008) +[2023-10-08 13:22:37,711][102898] Updated weights for policy 1, policy_version 40220 (0.0007) +[2023-10-08 13:22:40,356][102897] Updated weights for policy 0, policy_version 40200 (0.0008) +[2023-10-08 13:22:40,722][102897] Updated weights for policy 0, policy_version 40210 (0.0007) +[2023-10-08 13:22:41,091][102897] Updated weights for policy 0, policy_version 40220 (0.0007) +[2023-10-08 13:22:41,466][102898] Updated weights for policy 1, policy_version 40230 (0.0008) +[2023-10-08 13:22:41,828][102898] Updated weights for policy 1, policy_version 40240 (0.0008) +[2023-10-08 13:22:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 82378752. Throughput: 0: 1798.4, 1: 1791.5. Samples: 20603758. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:22:41,876][101941] Avg episode reward: [(0, '6.930'), (1, '7.780')] +[2023-10-08 13:22:42,203][102898] Updated weights for policy 1, policy_version 40250 (0.0011) +[2023-10-08 13:22:44,676][102897] Updated weights for policy 0, policy_version 40230 (0.0007) +[2023-10-08 13:22:45,041][102897] Updated weights for policy 0, policy_version 40240 (0.0007) +[2023-10-08 13:22:45,411][102897] Updated weights for policy 0, policy_version 40250 (0.0007) +[2023-10-08 13:22:46,098][102898] Updated weights for policy 1, policy_version 40260 (0.0007) +[2023-10-08 13:22:46,463][102898] Updated weights for policy 1, policy_version 40270 (0.0008) +[2023-10-08 13:22:46,823][102898] Updated weights for policy 1, policy_version 40280 (0.0009) +[2023-10-08 13:22:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 82444288. Throughput: 0: 1775.8, 1: 1805.2. Samples: 20624508. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:22:46,876][101941] Avg episode reward: [(0, '6.890'), (1, '7.560')] +[2023-10-08 13:22:49,192][102897] Updated weights for policy 0, policy_version 40260 (0.0009) +[2023-10-08 13:22:49,569][102897] Updated weights for policy 0, policy_version 40270 (0.0008) +[2023-10-08 13:22:49,935][102897] Updated weights for policy 0, policy_version 40280 (0.0009) +[2023-10-08 13:22:50,655][102898] Updated weights for policy 1, policy_version 40290 (0.0009) +[2023-10-08 13:22:51,022][102898] Updated weights for policy 1, policy_version 40300 (0.0008) +[2023-10-08 13:22:51,398][102898] Updated weights for policy 1, policy_version 40310 (0.0008) +[2023-10-08 13:22:51,758][102898] Updated weights for policy 1, policy_version 40320 (0.0008) +[2023-10-08 13:22:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 82542592. Throughput: 0: 1800.1, 1: 1785.2. Samples: 20635740. Policy #0 lag: (min: 2.0, avg: 4.9, max: 34.0) +[2023-10-08 13:22:51,876][101941] Avg episode reward: [(0, '6.500'), (1, '7.660')] +[2023-10-08 13:22:53,755][102897] Updated weights for policy 0, policy_version 40290 (0.0010) +[2023-10-08 13:22:54,143][102897] Updated weights for policy 0, policy_version 40300 (0.0007) +[2023-10-08 13:22:54,517][102897] Updated weights for policy 0, policy_version 40310 (0.0009) +[2023-10-08 13:22:54,897][102897] Updated weights for policy 0, policy_version 40320 (0.0008) +[2023-10-08 13:22:55,488][102898] Updated weights for policy 1, policy_version 40330 (0.0009) +[2023-10-08 13:22:55,852][102898] Updated weights for policy 1, policy_version 40340 (0.0010) +[2023-10-08 13:22:56,216][102898] Updated weights for policy 1, policy_version 40350 (0.0009) +[2023-10-08 13:22:56,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 82608128. Throughput: 0: 1777.7, 1: 1803.4. Samples: 20656694. Policy #0 lag: (min: 2.0, avg: 4.9, max: 34.0) +[2023-10-08 13:22:56,875][101941] Avg episode reward: [(0, '6.450'), (1, '8.290')] +[2023-10-08 13:22:58,488][102897] Updated weights for policy 0, policy_version 40330 (0.0009) +[2023-10-08 13:22:58,861][102897] Updated weights for policy 0, policy_version 40340 (0.0009) +[2023-10-08 13:22:59,230][102897] Updated weights for policy 0, policy_version 40350 (0.0008) +[2023-10-08 13:23:00,126][102898] Updated weights for policy 1, policy_version 40360 (0.0008) +[2023-10-08 13:23:00,494][102898] Updated weights for policy 1, policy_version 40370 (0.0010) +[2023-10-08 13:23:00,861][102898] Updated weights for policy 1, policy_version 40380 (0.0009) +[2023-10-08 13:23:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 82673664. Throughput: 0: 1789.1, 1: 1785.7. Samples: 20678292. Policy #0 lag: (min: 2.0, avg: 4.9, max: 34.0) +[2023-10-08 13:23:01,875][101941] Avg episode reward: [(0, '6.450'), (1, '8.190')] +[2023-10-08 13:23:03,005][102897] Updated weights for policy 0, policy_version 40360 (0.0007) +[2023-10-08 13:23:03,381][102897] Updated weights for policy 0, policy_version 40370 (0.0008) +[2023-10-08 13:23:03,757][102897] Updated weights for policy 0, policy_version 40380 (0.0008) +[2023-10-08 13:23:04,508][102898] Updated weights for policy 1, policy_version 40390 (0.0009) +[2023-10-08 13:23:04,876][102898] Updated weights for policy 1, policy_version 40400 (0.0008) +[2023-10-08 13:23:05,238][102898] Updated weights for policy 1, policy_version 40410 (0.0010) +[2023-10-08 13:23:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 82739200. Throughput: 0: 1791.3, 1: 1813.1. Samples: 20689408. Policy #0 lag: (min: 2.0, avg: 4.9, max: 34.0) +[2023-10-08 13:23:06,876][101941] Avg episode reward: [(0, '6.930'), (1, '8.280')] +[2023-10-08 13:23:07,643][102897] Updated weights for policy 0, policy_version 40390 (0.0009) +[2023-10-08 13:23:08,018][102897] Updated weights for policy 0, policy_version 40400 (0.0010) +[2023-10-08 13:23:08,384][102897] Updated weights for policy 0, policy_version 40410 (0.0009) +[2023-10-08 13:23:08,860][102898] Updated weights for policy 1, policy_version 40420 (0.0011) +[2023-10-08 13:23:09,238][102898] Updated weights for policy 1, policy_version 40430 (0.0007) +[2023-10-08 13:23:09,604][102898] Updated weights for policy 1, policy_version 40440 (0.0009) +[2023-10-08 13:23:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 82804736. Throughput: 0: 1783.3, 1: 1798.4. Samples: 20710538. Policy #0 lag: (min: 2.0, avg: 4.9, max: 34.0) +[2023-10-08 13:23:11,876][101941] Avg episode reward: [(0, '7.540'), (1, '7.170')] +[2023-10-08 13:23:12,126][102897] Updated weights for policy 0, policy_version 40420 (0.0008) +[2023-10-08 13:23:12,493][102897] Updated weights for policy 0, policy_version 40430 (0.0009) +[2023-10-08 13:23:12,875][102897] Updated weights for policy 0, policy_version 40440 (0.0008) +[2023-10-08 13:23:13,275][102898] Updated weights for policy 1, policy_version 40450 (0.0008) +[2023-10-08 13:23:13,651][102898] Updated weights for policy 1, policy_version 40460 (0.0009) +[2023-10-08 13:23:14,011][102898] Updated weights for policy 1, policy_version 40470 (0.0008) +[2023-10-08 13:23:14,375][102898] Updated weights for policy 1, policy_version 40480 (0.0007) +[2023-10-08 13:23:16,688][102897] Updated weights for policy 0, policy_version 40450 (0.0009) +[2023-10-08 13:23:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 82870272. Throughput: 0: 1797.4, 1: 1797.1. Samples: 20732874. Policy #0 lag: (min: 2.0, avg: 4.9, max: 34.0) +[2023-10-08 13:23:16,876][101941] Avg episode reward: [(0, '7.740'), (1, '7.220')] +[2023-10-08 13:23:17,066][102897] Updated weights for policy 0, policy_version 40460 (0.0008) +[2023-10-08 13:23:17,435][102897] Updated weights for policy 0, policy_version 40470 (0.0008) +[2023-10-08 13:23:17,803][102897] Updated weights for policy 0, policy_version 40480 (0.0010) +[2023-10-08 13:23:18,135][102898] Updated weights for policy 1, policy_version 40490 (0.0010) +[2023-10-08 13:23:18,511][102898] Updated weights for policy 1, policy_version 40500 (0.0011) +[2023-10-08 13:23:18,880][102898] Updated weights for policy 1, policy_version 40510 (0.0008) +[2023-10-08 13:23:21,543][102897] Updated weights for policy 0, policy_version 40490 (0.0007) +[2023-10-08 13:23:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 82935808. Throughput: 0: 1781.7, 1: 1795.3. Samples: 20742612. Policy #0 lag: (min: 17.0, avg: 27.3, max: 49.0) +[2023-10-08 13:23:21,876][101941] Avg episode reward: [(0, '6.430'), (1, '7.770')] +[2023-10-08 13:23:21,904][102897] Updated weights for policy 0, policy_version 40500 (0.0009) +[2023-10-08 13:23:22,268][102897] Updated weights for policy 0, policy_version 40510 (0.0010) +[2023-10-08 13:23:22,518][102898] Updated weights for policy 1, policy_version 40520 (0.0008) +[2023-10-08 13:23:22,884][102898] Updated weights for policy 1, policy_version 40530 (0.0009) +[2023-10-08 13:23:23,242][102898] Updated weights for policy 1, policy_version 40540 (0.0008) +[2023-10-08 13:23:26,099][102897] Updated weights for policy 0, policy_version 40520 (0.0010) +[2023-10-08 13:23:26,466][102897] Updated weights for policy 0, policy_version 40530 (0.0010) +[2023-10-08 13:23:26,840][102897] Updated weights for policy 0, policy_version 40540 (0.0010) +[2023-10-08 13:23:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 83001344. Throughput: 0: 1787.2, 1: 1789.4. Samples: 20764704. Policy #0 lag: (min: 17.0, avg: 27.3, max: 49.0) +[2023-10-08 13:23:26,876][101941] Avg episode reward: [(0, '5.950'), (1, '7.480')] +[2023-10-08 13:23:27,060][102898] Updated weights for policy 1, policy_version 40550 (0.0009) +[2023-10-08 13:23:27,413][102898] Updated weights for policy 1, policy_version 40560 (0.0010) +[2023-10-08 13:23:27,775][102898] Updated weights for policy 1, policy_version 40570 (0.0009) +[2023-10-08 13:23:30,552][102897] Updated weights for policy 0, policy_version 40550 (0.0009) +[2023-10-08 13:23:30,924][102897] Updated weights for policy 0, policy_version 40560 (0.0008) +[2023-10-08 13:23:31,294][102897] Updated weights for policy 0, policy_version 40570 (0.0009) +[2023-10-08 13:23:31,539][102898] Updated weights for policy 1, policy_version 40580 (0.0009) +[2023-10-08 13:23:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 83099648. Throughput: 0: 1778.5, 1: 1805.0. Samples: 20785762. Policy #0 lag: (min: 17.0, avg: 27.3, max: 49.0) +[2023-10-08 13:23:31,875][101941] Avg episode reward: [(0, '6.350'), (1, '7.260')] +[2023-10-08 13:23:31,901][102898] Updated weights for policy 1, policy_version 40590 (0.0009) +[2023-10-08 13:23:32,273][102898] Updated weights for policy 1, policy_version 40600 (0.0009) +[2023-10-08 13:23:35,072][102897] Updated weights for policy 0, policy_version 40580 (0.0009) +[2023-10-08 13:23:35,445][102897] Updated weights for policy 0, policy_version 40590 (0.0008) +[2023-10-08 13:23:35,812][102897] Updated weights for policy 0, policy_version 40600 (0.0011) +[2023-10-08 13:23:36,195][102898] Updated weights for policy 1, policy_version 40610 (0.0009) +[2023-10-08 13:23:36,615][102898] Updated weights for policy 1, policy_version 40620 (0.0009) +[2023-10-08 13:23:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 83165184. Throughput: 0: 1778.9, 1: 1795.8. Samples: 20796602. Policy #0 lag: (min: 17.0, avg: 27.3, max: 49.0) +[2023-10-08 13:23:36,876][101941] Avg episode reward: [(0, '6.430'), (1, '7.310')] +[2023-10-08 13:23:36,997][102898] Updated weights for policy 1, policy_version 40630 (0.0010) +[2023-10-08 13:23:37,358][102898] Updated weights for policy 1, policy_version 40640 (0.0009) +[2023-10-08 13:23:39,596][102897] Updated weights for policy 0, policy_version 40610 (0.0009) +[2023-10-08 13:23:39,974][102897] Updated weights for policy 0, policy_version 40620 (0.0009) +[2023-10-08 13:23:40,342][102897] Updated weights for policy 0, policy_version 40630 (0.0007) +[2023-10-08 13:23:40,711][102897] Updated weights for policy 0, policy_version 40640 (0.0008) +[2023-10-08 13:23:41,236][102898] Updated weights for policy 1, policy_version 40650 (0.0007) +[2023-10-08 13:23:41,611][102898] Updated weights for policy 1, policy_version 40660 (0.0009) +[2023-10-08 13:23:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 83230720. Throughput: 0: 1777.8, 1: 1795.7. Samples: 20817502. Policy #0 lag: (min: 17.0, avg: 27.3, max: 49.0) +[2023-10-08 13:23:41,876][101941] Avg episode reward: [(0, '7.490'), (1, '6.870')] +[2023-10-08 13:23:41,970][102898] Updated weights for policy 1, policy_version 40670 (0.0009) +[2023-10-08 13:23:44,524][102897] Updated weights for policy 0, policy_version 40650 (0.0009) +[2023-10-08 13:23:44,909][102897] Updated weights for policy 0, policy_version 40660 (0.0007) +[2023-10-08 13:23:45,285][102897] Updated weights for policy 0, policy_version 40670 (0.0010) +[2023-10-08 13:23:45,843][102898] Updated weights for policy 1, policy_version 40680 (0.0008) +[2023-10-08 13:23:46,208][102898] Updated weights for policy 1, policy_version 40690 (0.0008) +[2023-10-08 13:23:46,587][102898] Updated weights for policy 1, policy_version 40700 (0.0009) +[2023-10-08 13:23:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 83329024. Throughput: 0: 1767.6, 1: 1790.4. Samples: 20838402. Policy #0 lag: (min: 18.0, avg: 21.2, max: 50.0) +[2023-10-08 13:23:46,875][101941] Avg episode reward: [(0, '7.610'), (1, '6.980')] +[2023-10-08 13:23:49,246][102897] Updated weights for policy 0, policy_version 40680 (0.0008) +[2023-10-08 13:23:49,610][102897] Updated weights for policy 0, policy_version 40690 (0.0009) +[2023-10-08 13:23:49,975][102897] Updated weights for policy 0, policy_version 40700 (0.0007) +[2023-10-08 13:23:50,342][102898] Updated weights for policy 1, policy_version 40710 (0.0009) +[2023-10-08 13:23:50,697][102898] Updated weights for policy 1, policy_version 40720 (0.0007) +[2023-10-08 13:23:51,067][102898] Updated weights for policy 1, policy_version 40730 (0.0008) +[2023-10-08 13:23:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 83394560. Throughput: 0: 1785.4, 1: 1780.7. Samples: 20849880. Policy #0 lag: (min: 18.0, avg: 21.2, max: 50.0) +[2023-10-08 13:23:51,876][101941] Avg episode reward: [(0, '6.660'), (1, '7.610')] +[2023-10-08 13:23:53,832][102897] Updated weights for policy 0, policy_version 40710 (0.0008) +[2023-10-08 13:23:54,202][102897] Updated weights for policy 0, policy_version 40720 (0.0011) +[2023-10-08 13:23:54,569][102897] Updated weights for policy 0, policy_version 40730 (0.0009) +[2023-10-08 13:23:54,911][102898] Updated weights for policy 1, policy_version 40740 (0.0007) +[2023-10-08 13:23:55,271][102898] Updated weights for policy 1, policy_version 40750 (0.0008) +[2023-10-08 13:23:55,640][102898] Updated weights for policy 1, policy_version 40760 (0.0009) +[2023-10-08 13:23:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 83460096. Throughput: 0: 1767.0, 1: 1786.3. Samples: 20870438. Policy #0 lag: (min: 18.0, avg: 21.2, max: 50.0) +[2023-10-08 13:23:56,876][101941] Avg episode reward: [(0, '6.670'), (1, '7.420')] +[2023-10-08 13:23:58,249][102897] Updated weights for policy 0, policy_version 40740 (0.0008) +[2023-10-08 13:23:58,625][102897] Updated weights for policy 0, policy_version 40750 (0.0008) +[2023-10-08 13:23:58,987][102897] Updated weights for policy 0, policy_version 40760 (0.0008) +[2023-10-08 13:23:59,392][102898] Updated weights for policy 1, policy_version 40770 (0.0008) +[2023-10-08 13:23:59,763][102898] Updated weights for policy 1, policy_version 40780 (0.0007) +[2023-10-08 13:24:00,129][102898] Updated weights for policy 1, policy_version 40790 (0.0011) +[2023-10-08 13:24:00,492][102898] Updated weights for policy 1, policy_version 40800 (0.0008) +[2023-10-08 13:24:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 83525632. Throughput: 0: 1771.6, 1: 1764.3. Samples: 20891988. Policy #0 lag: (min: 18.0, avg: 21.2, max: 50.0) +[2023-10-08 13:24:01,876][101941] Avg episode reward: [(0, '7.110'), (1, '7.370')] +[2023-10-08 13:24:02,731][102897] Updated weights for policy 0, policy_version 40770 (0.0009) +[2023-10-08 13:24:03,108][102897] Updated weights for policy 0, policy_version 40780 (0.0010) +[2023-10-08 13:24:03,482][102897] Updated weights for policy 0, policy_version 40790 (0.0010) +[2023-10-08 13:24:03,847][102897] Updated weights for policy 0, policy_version 40800 (0.0008) +[2023-10-08 13:24:04,232][102898] Updated weights for policy 1, policy_version 40810 (0.0008) +[2023-10-08 13:24:04,596][102898] Updated weights for policy 1, policy_version 40820 (0.0007) +[2023-10-08 13:24:04,973][102898] Updated weights for policy 1, policy_version 40830 (0.0007) +[2023-10-08 13:24:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 83591168. Throughput: 0: 1767.2, 1: 1785.9. Samples: 20902502. Policy #0 lag: (min: 18.0, avg: 21.2, max: 50.0) +[2023-10-08 13:24:06,876][101941] Avg episode reward: [(0, '7.060'), (1, '7.890')] +[2023-10-08 13:24:07,718][102897] Updated weights for policy 0, policy_version 40810 (0.0011) +[2023-10-08 13:24:08,087][102897] Updated weights for policy 0, policy_version 40820 (0.0010) +[2023-10-08 13:24:08,453][102897] Updated weights for policy 0, policy_version 40830 (0.0008) +[2023-10-08 13:24:08,616][102898] Updated weights for policy 1, policy_version 40840 (0.0007) +[2023-10-08 13:24:08,995][102898] Updated weights for policy 1, policy_version 40850 (0.0007) +[2023-10-08 13:24:09,352][102898] Updated weights for policy 1, policy_version 40860 (0.0010) +[2023-10-08 13:24:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 83656704. Throughput: 0: 1773.2, 1: 1777.4. Samples: 20924480. Policy #0 lag: (min: 18.0, avg: 21.2, max: 50.0) +[2023-10-08 13:24:11,876][101941] Avg episode reward: [(0, '7.000'), (1, '7.960')] +[2023-10-08 13:24:12,162][102897] Updated weights for policy 0, policy_version 40840 (0.0008) +[2023-10-08 13:24:12,529][102897] Updated weights for policy 0, policy_version 40850 (0.0007) +[2023-10-08 13:24:12,909][102897] Updated weights for policy 0, policy_version 40860 (0.0008) +[2023-10-08 13:24:13,070][102898] Updated weights for policy 1, policy_version 40870 (0.0009) +[2023-10-08 13:24:13,444][102898] Updated weights for policy 1, policy_version 40880 (0.0007) +[2023-10-08 13:24:13,818][102898] Updated weights for policy 1, policy_version 40890 (0.0011) +[2023-10-08 13:24:16,674][102897] Updated weights for policy 0, policy_version 40870 (0.0007) +[2023-10-08 13:24:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 83722240. Throughput: 0: 1798.3, 1: 1774.5. Samples: 20946538. Policy #0 lag: (min: 0.0, avg: 28.9, max: 32.0) +[2023-10-08 13:24:16,876][101941] Avg episode reward: [(0, '6.850'), (1, '7.240')] +[2023-10-08 13:24:16,882][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000040896_41877504.pth... +[2023-10-08 13:24:16,915][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000039232_40173568.pth +[2023-10-08 13:24:17,047][102897] Updated weights for policy 0, policy_version 40880 (0.0007) +[2023-10-08 13:24:17,418][102897] Updated weights for policy 0, policy_version 40890 (0.0007) +[2023-10-08 13:24:17,638][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000040896_41877504.pth... +[2023-10-08 13:24:17,666][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000039200_40140800.pth +[2023-10-08 13:24:17,694][102898] Updated weights for policy 1, policy_version 40900 (0.0010) +[2023-10-08 13:24:18,074][102898] Updated weights for policy 1, policy_version 40910 (0.0011) +[2023-10-08 13:24:18,438][102898] Updated weights for policy 1, policy_version 40920 (0.0011) +[2023-10-08 13:24:21,280][102897] Updated weights for policy 0, policy_version 40900 (0.0009) +[2023-10-08 13:24:21,649][102897] Updated weights for policy 0, policy_version 40910 (0.0008) +[2023-10-08 13:24:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 83787776. Throughput: 0: 1770.8, 1: 1772.5. Samples: 20956048. Policy #0 lag: (min: 0.0, avg: 28.9, max: 32.0) +[2023-10-08 13:24:21,876][101941] Avg episode reward: [(0, '6.380'), (1, '7.210')] +[2023-10-08 13:24:22,029][102897] Updated weights for policy 0, policy_version 40920 (0.0008) +[2023-10-08 13:24:22,349][102898] Updated weights for policy 1, policy_version 40930 (0.0008) +[2023-10-08 13:24:22,716][102898] Updated weights for policy 1, policy_version 40940 (0.0011) +[2023-10-08 13:24:23,096][102898] Updated weights for policy 1, policy_version 40950 (0.0008) +[2023-10-08 13:24:23,461][102898] Updated weights for policy 1, policy_version 40960 (0.0009) +[2023-10-08 13:24:25,871][102897] Updated weights for policy 0, policy_version 40930 (0.0008) +[2023-10-08 13:24:26,285][102897] Updated weights for policy 0, policy_version 40940 (0.0007) +[2023-10-08 13:24:26,649][102897] Updated weights for policy 0, policy_version 40950 (0.0007) +[2023-10-08 13:24:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 83853312. Throughput: 0: 1792.5, 1: 1773.8. Samples: 20977986. Policy #0 lag: (min: 0.0, avg: 28.9, max: 32.0) +[2023-10-08 13:24:26,875][101941] Avg episode reward: [(0, '6.530'), (1, '7.790')] +[2023-10-08 13:24:27,017][102897] Updated weights for policy 0, policy_version 40960 (0.0007) +[2023-10-08 13:24:27,338][102898] Updated weights for policy 1, policy_version 40970 (0.0010) +[2023-10-08 13:24:27,697][102898] Updated weights for policy 1, policy_version 40980 (0.0009) +[2023-10-08 13:24:28,067][102898] Updated weights for policy 1, policy_version 40990 (0.0010) +[2023-10-08 13:24:30,557][102897] Updated weights for policy 0, policy_version 40970 (0.0008) +[2023-10-08 13:24:30,926][102897] Updated weights for policy 0, policy_version 40980 (0.0007) +[2023-10-08 13:24:31,299][102897] Updated weights for policy 0, policy_version 40990 (0.0007) +[2023-10-08 13:24:31,815][102898] Updated weights for policy 1, policy_version 41000 (0.0009) +[2023-10-08 13:24:31,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 83951616. Throughput: 0: 1773.2, 1: 1799.7. Samples: 20999182. Policy #0 lag: (min: 0.0, avg: 28.9, max: 32.0) +[2023-10-08 13:24:31,875][101941] Avg episode reward: [(0, '6.750'), (1, '7.690')] +[2023-10-08 13:24:32,175][102898] Updated weights for policy 1, policy_version 41010 (0.0008) +[2023-10-08 13:24:32,545][102898] Updated weights for policy 1, policy_version 41020 (0.0007) +[2023-10-08 13:24:35,158][102897] Updated weights for policy 0, policy_version 41000 (0.0010) +[2023-10-08 13:24:35,529][102897] Updated weights for policy 0, policy_version 41010 (0.0010) +[2023-10-08 13:24:35,905][102897] Updated weights for policy 0, policy_version 41020 (0.0008) +[2023-10-08 13:24:36,212][102898] Updated weights for policy 1, policy_version 41030 (0.0007) +[2023-10-08 13:24:36,578][102898] Updated weights for policy 1, policy_version 41040 (0.0008) +[2023-10-08 13:24:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 84017152. Throughput: 0: 1787.7, 1: 1780.1. Samples: 21010428. Policy #0 lag: (min: 0.0, avg: 28.9, max: 32.0) +[2023-10-08 13:24:36,875][101941] Avg episode reward: [(0, '6.480'), (1, '7.540')] +[2023-10-08 13:24:36,949][102898] Updated weights for policy 1, policy_version 41050 (0.0008) +[2023-10-08 13:24:39,554][102897] Updated weights for policy 0, policy_version 41030 (0.0009) +[2023-10-08 13:24:39,917][102897] Updated weights for policy 0, policy_version 41040 (0.0007) +[2023-10-08 13:24:40,291][102897] Updated weights for policy 0, policy_version 41050 (0.0009) +[2023-10-08 13:24:40,633][102898] Updated weights for policy 1, policy_version 41060 (0.0009) +[2023-10-08 13:24:41,002][102898] Updated weights for policy 1, policy_version 41070 (0.0008) +[2023-10-08 13:24:41,368][102898] Updated weights for policy 1, policy_version 41080 (0.0009) +[2023-10-08 13:24:41,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 84115456. Throughput: 0: 1788.2, 1: 1802.0. Samples: 21031996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:24:41,876][101941] Avg episode reward: [(0, '6.760'), (1, '7.150')] +[2023-10-08 13:24:44,010][102897] Updated weights for policy 0, policy_version 41060 (0.0007) +[2023-10-08 13:24:44,398][102897] Updated weights for policy 0, policy_version 41070 (0.0009) +[2023-10-08 13:24:44,761][102897] Updated weights for policy 0, policy_version 41080 (0.0008) +[2023-10-08 13:24:44,969][102898] Updated weights for policy 1, policy_version 41090 (0.0008) +[2023-10-08 13:24:45,341][102898] Updated weights for policy 1, policy_version 41100 (0.0007) +[2023-10-08 13:24:45,708][102898] Updated weights for policy 1, policy_version 41110 (0.0009) +[2023-10-08 13:24:46,069][102898] Updated weights for policy 1, policy_version 41120 (0.0007) +[2023-10-08 13:24:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 84180992. Throughput: 0: 1782.9, 1: 1793.3. Samples: 21052918. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:24:46,876][101941] Avg episode reward: [(0, '6.840'), (1, '7.810')] +[2023-10-08 13:24:48,445][102897] Updated weights for policy 0, policy_version 41090 (0.0008) +[2023-10-08 13:24:48,808][102897] Updated weights for policy 0, policy_version 41100 (0.0009) +[2023-10-08 13:24:49,182][102897] Updated weights for policy 0, policy_version 41110 (0.0011) +[2023-10-08 13:24:49,553][102897] Updated weights for policy 0, policy_version 41120 (0.0009) +[2023-10-08 13:24:49,910][102898] Updated weights for policy 1, policy_version 41130 (0.0010) +[2023-10-08 13:24:50,290][102898] Updated weights for policy 1, policy_version 41140 (0.0011) +[2023-10-08 13:24:50,653][102898] Updated weights for policy 1, policy_version 41150 (0.0008) +[2023-10-08 13:24:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 84246528. Throughput: 0: 1793.2, 1: 1804.6. Samples: 21064400. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:24:51,876][101941] Avg episode reward: [(0, '6.730'), (1, '7.740')] +[2023-10-08 13:24:53,439][102897] Updated weights for policy 0, policy_version 41130 (0.0008) +[2023-10-08 13:24:53,810][102897] Updated weights for policy 0, policy_version 41140 (0.0009) +[2023-10-08 13:24:54,182][102897] Updated weights for policy 0, policy_version 41150 (0.0007) +[2023-10-08 13:24:54,401][102898] Updated weights for policy 1, policy_version 41160 (0.0008) +[2023-10-08 13:24:54,766][102898] Updated weights for policy 1, policy_version 41170 (0.0007) +[2023-10-08 13:24:55,141][102898] Updated weights for policy 1, policy_version 41180 (0.0009) +[2023-10-08 13:24:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 84312064. Throughput: 0: 1778.8, 1: 1781.3. Samples: 21084680. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:24:56,876][101941] Avg episode reward: [(0, '6.650'), (1, '8.130')] +[2023-10-08 13:24:58,021][102897] Updated weights for policy 0, policy_version 41160 (0.0007) +[2023-10-08 13:24:58,390][102897] Updated weights for policy 0, policy_version 41170 (0.0008) +[2023-10-08 13:24:58,752][102897] Updated weights for policy 0, policy_version 41180 (0.0008) +[2023-10-08 13:24:58,785][102898] Updated weights for policy 1, policy_version 41190 (0.0008) +[2023-10-08 13:24:59,153][102898] Updated weights for policy 1, policy_version 41200 (0.0007) +[2023-10-08 13:24:59,510][102898] Updated weights for policy 1, policy_version 41210 (0.0007) +[2023-10-08 13:25:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 84377600. Throughput: 0: 1781.3, 1: 1784.5. Samples: 21106996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:01,875][101941] Avg episode reward: [(0, '6.020'), (1, '8.180')] +[2023-10-08 13:25:02,619][102897] Updated weights for policy 0, policy_version 41190 (0.0008) +[2023-10-08 13:25:02,991][102897] Updated weights for policy 0, policy_version 41200 (0.0008) +[2023-10-08 13:25:03,364][102897] Updated weights for policy 0, policy_version 41210 (0.0007) +[2023-10-08 13:25:03,397][102898] Updated weights for policy 1, policy_version 41220 (0.0010) +[2023-10-08 13:25:03,769][102898] Updated weights for policy 1, policy_version 41230 (0.0008) +[2023-10-08 13:25:04,139][102898] Updated weights for policy 1, policy_version 41240 (0.0008) +[2023-10-08 13:25:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 84443136. Throughput: 0: 1784.2, 1: 1788.0. Samples: 21116798. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:06,876][101941] Avg episode reward: [(0, '6.060'), (1, '8.410')] +[2023-10-08 13:25:07,285][102897] Updated weights for policy 0, policy_version 41220 (0.0007) +[2023-10-08 13:25:07,660][102897] Updated weights for policy 0, policy_version 41230 (0.0010) +[2023-10-08 13:25:07,906][102898] Updated weights for policy 1, policy_version 41250 (0.0009) +[2023-10-08 13:25:08,030][102897] Updated weights for policy 0, policy_version 41240 (0.0009) +[2023-10-08 13:25:08,266][102898] Updated weights for policy 1, policy_version 41260 (0.0008) +[2023-10-08 13:25:08,640][102898] Updated weights for policy 1, policy_version 41270 (0.0008) +[2023-10-08 13:25:09,003][102898] Updated weights for policy 1, policy_version 41280 (0.0010) +[2023-10-08 13:25:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 84508672. Throughput: 0: 1784.0, 1: 1793.2. Samples: 21138964. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:11,875][101941] Avg episode reward: [(0, '6.090'), (1, '8.000')] +[2023-10-08 13:25:11,910][102897] Updated weights for policy 0, policy_version 41250 (0.0007) +[2023-10-08 13:25:12,324][102897] Updated weights for policy 0, policy_version 41260 (0.0007) +[2023-10-08 13:25:12,687][102897] Updated weights for policy 0, policy_version 41270 (0.0008) +[2023-10-08 13:25:12,789][102898] Updated weights for policy 1, policy_version 41290 (0.0008) +[2023-10-08 13:25:13,061][102897] Updated weights for policy 0, policy_version 41280 (0.0007) +[2023-10-08 13:25:13,157][102898] Updated weights for policy 1, policy_version 41300 (0.0009) +[2023-10-08 13:25:13,523][102898] Updated weights for policy 1, policy_version 41310 (0.0008) +[2023-10-08 13:25:16,723][102897] Updated weights for policy 0, policy_version 41290 (0.0007) +[2023-10-08 13:25:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 84574208. Throughput: 0: 1807.2, 1: 1794.7. Samples: 21161266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:16,875][101941] Avg episode reward: [(0, '6.690'), (1, '7.120')] +[2023-10-08 13:25:17,099][102897] Updated weights for policy 0, policy_version 41300 (0.0007) +[2023-10-08 13:25:17,209][102898] Updated weights for policy 1, policy_version 41320 (0.0008) +[2023-10-08 13:25:17,461][102897] Updated weights for policy 0, policy_version 41310 (0.0007) +[2023-10-08 13:25:17,570][102898] Updated weights for policy 1, policy_version 41330 (0.0008) +[2023-10-08 13:25:17,950][102898] Updated weights for policy 1, policy_version 41340 (0.0008) +[2023-10-08 13:25:21,170][102897] Updated weights for policy 0, policy_version 41320 (0.0009) +[2023-10-08 13:25:21,532][102897] Updated weights for policy 0, policy_version 41330 (0.0008) +[2023-10-08 13:25:21,761][102898] Updated weights for policy 1, policy_version 41350 (0.0011) +[2023-10-08 13:25:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 84639744. Throughput: 0: 1775.3, 1: 1794.5. Samples: 21171068. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:21,876][101941] Avg episode reward: [(0, '6.440'), (1, '7.680')] +[2023-10-08 13:25:21,911][102897] Updated weights for policy 0, policy_version 41340 (0.0008) +[2023-10-08 13:25:22,137][102898] Updated weights for policy 1, policy_version 41360 (0.0007) +[2023-10-08 13:25:22,499][102898] Updated weights for policy 1, policy_version 41370 (0.0007) +[2023-10-08 13:25:25,612][102897] Updated weights for policy 0, policy_version 41350 (0.0007) +[2023-10-08 13:25:25,984][102897] Updated weights for policy 0, policy_version 41360 (0.0008) +[2023-10-08 13:25:26,227][102898] Updated weights for policy 1, policy_version 41380 (0.0008) +[2023-10-08 13:25:26,349][102897] Updated weights for policy 0, policy_version 41370 (0.0009) +[2023-10-08 13:25:26,592][102898] Updated weights for policy 1, policy_version 41390 (0.0009) +[2023-10-08 13:25:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 84738048. Throughput: 0: 1796.9, 1: 1788.2. Samples: 21193326. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:26,876][101941] Avg episode reward: [(0, '6.820'), (1, '7.500')] +[2023-10-08 13:25:26,959][102898] Updated weights for policy 1, policy_version 41400 (0.0008) +[2023-10-08 13:25:30,064][102897] Updated weights for policy 0, policy_version 41380 (0.0008) +[2023-10-08 13:25:30,437][102897] Updated weights for policy 0, policy_version 41390 (0.0008) +[2023-10-08 13:25:30,618][102898] Updated weights for policy 1, policy_version 41410 (0.0008) +[2023-10-08 13:25:30,801][102897] Updated weights for policy 0, policy_version 41400 (0.0007) +[2023-10-08 13:25:30,977][102898] Updated weights for policy 1, policy_version 41420 (0.0007) +[2023-10-08 13:25:31,349][102898] Updated weights for policy 1, policy_version 41430 (0.0009) +[2023-10-08 13:25:31,718][102898] Updated weights for policy 1, policy_version 41440 (0.0008) +[2023-10-08 13:25:31,875][101941] Fps is (10 sec: 19661.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 84836352. Throughput: 0: 1771.6, 1: 1796.9. Samples: 21213502. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:25:31,875][101941] Avg episode reward: [(0, '6.430'), (1, '7.770')] +[2023-10-08 13:25:34,470][102897] Updated weights for policy 0, policy_version 41410 (0.0007) +[2023-10-08 13:25:34,842][102897] Updated weights for policy 0, policy_version 41420 (0.0007) +[2023-10-08 13:25:35,216][102897] Updated weights for policy 0, policy_version 41430 (0.0007) +[2023-10-08 13:25:35,548][102898] Updated weights for policy 1, policy_version 41450 (0.0010) +[2023-10-08 13:25:35,582][102897] Updated weights for policy 0, policy_version 41440 (0.0008) +[2023-10-08 13:25:35,909][102898] Updated weights for policy 1, policy_version 41460 (0.0008) +[2023-10-08 13:25:36,280][102898] Updated weights for policy 1, policy_version 41470 (0.0010) +[2023-10-08 13:25:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 84901888. Throughput: 0: 1801.3, 1: 1787.7. Samples: 21225904. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 13:25:36,875][101941] Avg episode reward: [(0, '7.090'), (1, '8.330')] +[2023-10-08 13:25:39,426][102897] Updated weights for policy 0, policy_version 41450 (0.0007) +[2023-10-08 13:25:39,802][102897] Updated weights for policy 0, policy_version 41460 (0.0008) +[2023-10-08 13:25:40,119][102898] Updated weights for policy 1, policy_version 41480 (0.0008) +[2023-10-08 13:25:40,171][102897] Updated weights for policy 0, policy_version 41470 (0.0008) +[2023-10-08 13:25:40,489][102898] Updated weights for policy 1, policy_version 41490 (0.0008) +[2023-10-08 13:25:40,851][102898] Updated weights for policy 1, policy_version 41500 (0.0009) +[2023-10-08 13:25:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 84967424. Throughput: 0: 1780.4, 1: 1805.1. Samples: 21246026. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 13:25:41,876][101941] Avg episode reward: [(0, '7.280'), (1, '8.090')] +[2023-10-08 13:25:43,870][102897] Updated weights for policy 0, policy_version 41480 (0.0007) +[2023-10-08 13:25:44,236][102897] Updated weights for policy 0, policy_version 41490 (0.0009) +[2023-10-08 13:25:44,595][102898] Updated weights for policy 1, policy_version 41510 (0.0007) +[2023-10-08 13:25:44,608][102897] Updated weights for policy 0, policy_version 41500 (0.0007) +[2023-10-08 13:25:44,965][102898] Updated weights for policy 1, policy_version 41520 (0.0007) +[2023-10-08 13:25:45,339][102898] Updated weights for policy 1, policy_version 41530 (0.0007) +[2023-10-08 13:25:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 85032960. Throughput: 0: 1777.8, 1: 1793.0. Samples: 21267682. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 13:25:46,876][101941] Avg episode reward: [(0, '7.040'), (1, '7.620')] +[2023-10-08 13:25:48,516][102897] Updated weights for policy 0, policy_version 41510 (0.0008) +[2023-10-08 13:25:48,880][102897] Updated weights for policy 0, policy_version 41520 (0.0010) +[2023-10-08 13:25:49,046][102898] Updated weights for policy 1, policy_version 41540 (0.0007) +[2023-10-08 13:25:49,254][102897] Updated weights for policy 0, policy_version 41530 (0.0008) +[2023-10-08 13:25:49,404][102898] Updated weights for policy 1, policy_version 41550 (0.0008) +[2023-10-08 13:25:49,776][102898] Updated weights for policy 1, policy_version 41560 (0.0010) +[2023-10-08 13:25:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 85098496. Throughput: 0: 1782.3, 1: 1807.3. Samples: 21278328. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 13:25:51,876][101941] Avg episode reward: [(0, '6.750'), (1, '7.970')] +[2023-10-08 13:25:53,084][102897] Updated weights for policy 0, policy_version 41540 (0.0007) +[2023-10-08 13:25:53,456][102897] Updated weights for policy 0, policy_version 41550 (0.0007) +[2023-10-08 13:25:53,571][102898] Updated weights for policy 1, policy_version 41570 (0.0008) +[2023-10-08 13:25:53,812][102897] Updated weights for policy 0, policy_version 41560 (0.0007) +[2023-10-08 13:25:53,944][102898] Updated weights for policy 1, policy_version 41580 (0.0008) +[2023-10-08 13:25:54,312][102898] Updated weights for policy 1, policy_version 41590 (0.0007) +[2023-10-08 13:25:54,684][102898] Updated weights for policy 1, policy_version 41600 (0.0009) +[2023-10-08 13:25:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 85164032. Throughput: 0: 1779.6, 1: 1787.9. Samples: 21299500. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 13:25:56,875][101941] Avg episode reward: [(0, '7.090'), (1, '7.450')] +[2023-10-08 13:25:57,698][102897] Updated weights for policy 0, policy_version 41570 (0.0008) +[2023-10-08 13:25:58,093][102897] Updated weights for policy 0, policy_version 41580 (0.0009) +[2023-10-08 13:25:58,466][102897] Updated weights for policy 0, policy_version 41590 (0.0007) +[2023-10-08 13:25:58,574][102898] Updated weights for policy 1, policy_version 41610 (0.0009) +[2023-10-08 13:25:58,828][102897] Updated weights for policy 0, policy_version 41600 (0.0008) +[2023-10-08 13:25:58,945][102898] Updated weights for policy 1, policy_version 41620 (0.0009) +[2023-10-08 13:25:59,304][102898] Updated weights for policy 1, policy_version 41630 (0.0011) +[2023-10-08 13:26:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 85229568. Throughput: 0: 1782.3, 1: 1781.4. Samples: 21321630. Policy #0 lag: (min: 17.0, avg: 33.0, max: 49.0) +[2023-10-08 13:26:01,876][101941] Avg episode reward: [(0, '7.020'), (1, '6.820')] +[2023-10-08 13:26:02,438][102897] Updated weights for policy 0, policy_version 41610 (0.0007) +[2023-10-08 13:26:02,816][102897] Updated weights for policy 0, policy_version 41620 (0.0009) +[2023-10-08 13:26:03,046][102898] Updated weights for policy 1, policy_version 41640 (0.0009) +[2023-10-08 13:26:03,185][102897] Updated weights for policy 0, policy_version 41630 (0.0007) +[2023-10-08 13:26:03,411][102898] Updated weights for policy 1, policy_version 41650 (0.0007) +[2023-10-08 13:26:03,783][102898] Updated weights for policy 1, policy_version 41660 (0.0009) +[2023-10-08 13:26:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 85295104. Throughput: 0: 1784.6, 1: 1779.4. Samples: 21331450. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 13:26:06,875][101941] Avg episode reward: [(0, '6.580'), (1, '7.660')] +[2023-10-08 13:26:07,032][102897] Updated weights for policy 0, policy_version 41640 (0.0007) +[2023-10-08 13:26:07,404][102897] Updated weights for policy 0, policy_version 41650 (0.0007) +[2023-10-08 13:26:07,655][102898] Updated weights for policy 1, policy_version 41670 (0.0008) +[2023-10-08 13:26:07,764][102897] Updated weights for policy 0, policy_version 41660 (0.0009) +[2023-10-08 13:26:08,023][102898] Updated weights for policy 1, policy_version 41680 (0.0008) +[2023-10-08 13:26:08,397][102898] Updated weights for policy 1, policy_version 41690 (0.0009) +[2023-10-08 13:26:11,568][102897] Updated weights for policy 0, policy_version 41670 (0.0009) +[2023-10-08 13:26:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 85360640. Throughput: 0: 1783.2, 1: 1778.6. Samples: 21353610. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 13:26:11,876][101941] Avg episode reward: [(0, '6.790'), (1, '7.850')] +[2023-10-08 13:26:11,935][102897] Updated weights for policy 0, policy_version 41680 (0.0008) +[2023-10-08 13:26:12,249][102898] Updated weights for policy 1, policy_version 41700 (0.0008) +[2023-10-08 13:26:12,300][102897] Updated weights for policy 0, policy_version 41690 (0.0007) +[2023-10-08 13:26:12,618][102898] Updated weights for policy 1, policy_version 41710 (0.0007) +[2023-10-08 13:26:12,986][102898] Updated weights for policy 1, policy_version 41720 (0.0007) +[2023-10-08 13:26:15,868][102897] Updated weights for policy 0, policy_version 41700 (0.0009) +[2023-10-08 13:26:16,239][102897] Updated weights for policy 0, policy_version 41710 (0.0011) +[2023-10-08 13:26:16,620][102897] Updated weights for policy 0, policy_version 41720 (0.0010) +[2023-10-08 13:26:16,745][102898] Updated weights for policy 1, policy_version 41730 (0.0008) +[2023-10-08 13:26:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 85426176. Throughput: 0: 1799.5, 1: 1792.4. Samples: 21375136. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 13:26:16,876][101941] Avg episode reward: [(0, '6.800'), (1, '7.670')] +[2023-10-08 13:26:16,911][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000041728_42729472.pth... +[2023-10-08 13:26:16,939][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000040032_40992768.pth +[2023-10-08 13:26:16,943][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000041728_42729472.pth +[2023-10-08 13:26:17,122][102898] Updated weights for policy 1, policy_version 41740 (0.0009) +[2023-10-08 13:26:17,479][102898] Updated weights for policy 1, policy_version 41750 (0.0008) +[2023-10-08 13:26:17,853][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000041760_42762240.pth... +[2023-10-08 13:26:17,854][102898] Updated weights for policy 1, policy_version 41760 (0.0008) +[2023-10-08 13:26:17,884][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000040064_41025536.pth +[2023-10-08 13:26:17,888][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000041760_42762240.pth +[2023-10-08 13:26:20,180][102897] Updated weights for policy 0, policy_version 41730 (0.0009) +[2023-10-08 13:26:20,544][102897] Updated weights for policy 0, policy_version 41740 (0.0007) +[2023-10-08 13:26:20,919][102897] Updated weights for policy 0, policy_version 41750 (0.0007) +[2023-10-08 13:26:21,285][102897] Updated weights for policy 0, policy_version 41760 (0.0008) +[2023-10-08 13:26:21,758][102898] Updated weights for policy 1, policy_version 41770 (0.0009) +[2023-10-08 13:26:21,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 85524480. Throughput: 0: 1784.4, 1: 1764.6. Samples: 21385608. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 13:26:21,875][101941] Avg episode reward: [(0, '6.250'), (1, '7.910')] +[2023-10-08 13:26:22,128][102898] Updated weights for policy 1, policy_version 41780 (0.0009) +[2023-10-08 13:26:22,502][102898] Updated weights for policy 1, policy_version 41790 (0.0007) +[2023-10-08 13:26:25,198][102897] Updated weights for policy 0, policy_version 41770 (0.0008) +[2023-10-08 13:26:25,567][102897] Updated weights for policy 0, policy_version 41780 (0.0008) +[2023-10-08 13:26:25,934][102897] Updated weights for policy 0, policy_version 41790 (0.0008) +[2023-10-08 13:26:26,353][102898] Updated weights for policy 1, policy_version 41800 (0.0008) +[2023-10-08 13:26:26,723][102898] Updated weights for policy 1, policy_version 41810 (0.0007) +[2023-10-08 13:26:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 85590016. Throughput: 0: 1801.7, 1: 1785.8. Samples: 21407464. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 13:26:26,875][101941] Avg episode reward: [(0, '6.210'), (1, '7.350')] +[2023-10-08 13:26:27,095][102898] Updated weights for policy 1, policy_version 41820 (0.0008) +[2023-10-08 13:26:29,664][102897] Updated weights for policy 0, policy_version 41800 (0.0008) +[2023-10-08 13:26:30,041][102897] Updated weights for policy 0, policy_version 41810 (0.0009) +[2023-10-08 13:26:30,417][102897] Updated weights for policy 0, policy_version 41820 (0.0007) +[2023-10-08 13:26:30,797][102898] Updated weights for policy 1, policy_version 41830 (0.0008) +[2023-10-08 13:26:31,164][102898] Updated weights for policy 1, policy_version 41840 (0.0007) +[2023-10-08 13:26:31,526][102898] Updated weights for policy 1, policy_version 41850 (0.0008) +[2023-10-08 13:26:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 85688320. Throughput: 0: 1790.4, 1: 1776.5. Samples: 21428192. Policy #0 lag: (min: 31.0, avg: 32.9, max: 61.0) +[2023-10-08 13:26:31,876][101941] Avg episode reward: [(0, '6.560'), (1, '7.520')] +[2023-10-08 13:26:34,080][102897] Updated weights for policy 0, policy_version 41830 (0.0008) +[2023-10-08 13:26:34,456][102897] Updated weights for policy 0, policy_version 41840 (0.0007) +[2023-10-08 13:26:34,827][102897] Updated weights for policy 0, policy_version 41850 (0.0008) +[2023-10-08 13:26:35,254][102898] Updated weights for policy 1, policy_version 41860 (0.0009) +[2023-10-08 13:26:35,622][102898] Updated weights for policy 1, policy_version 41870 (0.0009) +[2023-10-08 13:26:35,984][102898] Updated weights for policy 1, policy_version 41880 (0.0009) +[2023-10-08 13:26:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 85753856. Throughput: 0: 1805.5, 1: 1781.5. Samples: 21439742. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:26:36,876][101941] Avg episode reward: [(0, '6.830'), (1, '8.430')] +[2023-10-08 13:26:38,711][102897] Updated weights for policy 0, policy_version 41860 (0.0008) +[2023-10-08 13:26:39,083][102897] Updated weights for policy 0, policy_version 41870 (0.0008) +[2023-10-08 13:26:39,465][102897] Updated weights for policy 0, policy_version 41880 (0.0010) +[2023-10-08 13:26:39,622][102898] Updated weights for policy 1, policy_version 41890 (0.0007) +[2023-10-08 13:26:39,996][102898] Updated weights for policy 1, policy_version 41900 (0.0010) +[2023-10-08 13:26:40,366][102898] Updated weights for policy 1, policy_version 41910 (0.0008) +[2023-10-08 13:26:40,724][102898] Updated weights for policy 1, policy_version 41920 (0.0008) +[2023-10-08 13:26:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 85819392. Throughput: 0: 1786.0, 1: 1783.5. Samples: 21460128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:26:41,875][101941] Avg episode reward: [(0, '7.080'), (1, '8.260')] +[2023-10-08 13:26:43,460][102897] Updated weights for policy 0, policy_version 41890 (0.0009) +[2023-10-08 13:26:43,851][102897] Updated weights for policy 0, policy_version 41900 (0.0010) +[2023-10-08 13:26:44,221][102897] Updated weights for policy 0, policy_version 41910 (0.0008) +[2023-10-08 13:26:44,563][102898] Updated weights for policy 1, policy_version 41930 (0.0007) +[2023-10-08 13:26:44,597][102897] Updated weights for policy 0, policy_version 41920 (0.0007) +[2023-10-08 13:26:44,935][102898] Updated weights for policy 1, policy_version 41940 (0.0008) +[2023-10-08 13:26:45,301][102898] Updated weights for policy 1, policy_version 41950 (0.0008) +[2023-10-08 13:26:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 85884928. Throughput: 0: 1777.7, 1: 1772.5. Samples: 21481388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:26:46,876][101941] Avg episode reward: [(0, '6.810'), (1, '8.180')] +[2023-10-08 13:26:48,304][102897] Updated weights for policy 0, policy_version 41930 (0.0010) +[2023-10-08 13:26:48,679][102897] Updated weights for policy 0, policy_version 41940 (0.0008) +[2023-10-08 13:26:49,040][102897] Updated weights for policy 0, policy_version 41950 (0.0009) +[2023-10-08 13:26:49,155][102898] Updated weights for policy 1, policy_version 41960 (0.0009) +[2023-10-08 13:26:49,531][102898] Updated weights for policy 1, policy_version 41970 (0.0008) +[2023-10-08 13:26:49,898][102898] Updated weights for policy 1, policy_version 41980 (0.0008) +[2023-10-08 13:26:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 85950464. Throughput: 0: 1773.6, 1: 1790.0. Samples: 21491814. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:26:51,876][101941] Avg episode reward: [(0, '6.710'), (1, '8.160')] +[2023-10-08 13:26:52,825][102897] Updated weights for policy 0, policy_version 41960 (0.0007) +[2023-10-08 13:26:53,201][102897] Updated weights for policy 0, policy_version 41970 (0.0008) +[2023-10-08 13:26:53,566][102897] Updated weights for policy 0, policy_version 41980 (0.0007) +[2023-10-08 13:26:53,670][102898] Updated weights for policy 1, policy_version 41990 (0.0007) +[2023-10-08 13:26:54,035][102898] Updated weights for policy 1, policy_version 42000 (0.0010) +[2023-10-08 13:26:54,407][102898] Updated weights for policy 1, policy_version 42010 (0.0008) +[2023-10-08 13:26:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86016000. Throughput: 0: 1776.9, 1: 1776.0. Samples: 21513488. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:26:56,876][101941] Avg episode reward: [(0, '6.900'), (1, '7.780')] +[2023-10-08 13:26:57,393][102897] Updated weights for policy 0, policy_version 41990 (0.0008) +[2023-10-08 13:26:57,764][102897] Updated weights for policy 0, policy_version 42000 (0.0008) +[2023-10-08 13:26:58,026][102898] Updated weights for policy 1, policy_version 42020 (0.0008) +[2023-10-08 13:26:58,135][102897] Updated weights for policy 0, policy_version 42010 (0.0008) +[2023-10-08 13:26:58,394][102898] Updated weights for policy 1, policy_version 42030 (0.0009) +[2023-10-08 13:26:58,760][102898] Updated weights for policy 1, policy_version 42040 (0.0007) +[2023-10-08 13:27:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86081536. Throughput: 0: 1786.3, 1: 1782.2. Samples: 21535716. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:01,876][101941] Avg episode reward: [(0, '7.290'), (1, '7.420')] +[2023-10-08 13:27:02,005][102897] Updated weights for policy 0, policy_version 42020 (0.0009) +[2023-10-08 13:27:02,378][102897] Updated weights for policy 0, policy_version 42030 (0.0008) +[2023-10-08 13:27:02,521][102898] Updated weights for policy 1, policy_version 42050 (0.0009) +[2023-10-08 13:27:02,760][102897] Updated weights for policy 0, policy_version 42040 (0.0008) +[2023-10-08 13:27:02,898][102898] Updated weights for policy 1, policy_version 42060 (0.0009) +[2023-10-08 13:27:03,253][102898] Updated weights for policy 1, policy_version 42070 (0.0010) +[2023-10-08 13:27:03,624][102898] Updated weights for policy 1, policy_version 42080 (0.0008) +[2023-10-08 13:27:06,523][102897] Updated weights for policy 0, policy_version 42050 (0.0008) +[2023-10-08 13:27:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86147072. Throughput: 0: 1767.0, 1: 1785.4. Samples: 21545466. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:06,876][101941] Avg episode reward: [(0, '6.760'), (1, '7.360')] +[2023-10-08 13:27:06,901][102897] Updated weights for policy 0, policy_version 42060 (0.0010) +[2023-10-08 13:27:07,273][102897] Updated weights for policy 0, policy_version 42070 (0.0007) +[2023-10-08 13:27:07,539][102898] Updated weights for policy 1, policy_version 42090 (0.0007) +[2023-10-08 13:27:07,633][102897] Updated weights for policy 0, policy_version 42080 (0.0007) +[2023-10-08 13:27:07,901][102898] Updated weights for policy 1, policy_version 42100 (0.0009) +[2023-10-08 13:27:08,270][102898] Updated weights for policy 1, policy_version 42110 (0.0008) +[2023-10-08 13:27:11,469][102897] Updated weights for policy 0, policy_version 42090 (0.0008) +[2023-10-08 13:27:11,848][102897] Updated weights for policy 0, policy_version 42100 (0.0011) +[2023-10-08 13:27:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86212608. Throughput: 0: 1783.5, 1: 1777.2. Samples: 21567696. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:11,876][101941] Avg episode reward: [(0, '6.060'), (1, '7.430')] +[2023-10-08 13:27:12,094][102898] Updated weights for policy 1, policy_version 42120 (0.0009) +[2023-10-08 13:27:12,213][102897] Updated weights for policy 0, policy_version 42110 (0.0009) +[2023-10-08 13:27:12,461][102898] Updated weights for policy 1, policy_version 42130 (0.0009) +[2023-10-08 13:27:12,821][102898] Updated weights for policy 1, policy_version 42140 (0.0011) +[2023-10-08 13:27:15,863][102897] Updated weights for policy 0, policy_version 42120 (0.0008) +[2023-10-08 13:27:16,246][102897] Updated weights for policy 0, policy_version 42130 (0.0008) +[2023-10-08 13:27:16,436][102898] Updated weights for policy 1, policy_version 42150 (0.0007) +[2023-10-08 13:27:16,622][102897] Updated weights for policy 0, policy_version 42140 (0.0007) +[2023-10-08 13:27:16,809][102898] Updated weights for policy 1, policy_version 42160 (0.0008) +[2023-10-08 13:27:16,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 86310912. Throughput: 0: 1783.0, 1: 1794.7. Samples: 21589190. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:16,876][101941] Avg episode reward: [(0, '6.750'), (1, '7.230')] +[2023-10-08 13:27:17,176][102898] Updated weights for policy 1, policy_version 42170 (0.0008) +[2023-10-08 13:27:20,269][102897] Updated weights for policy 0, policy_version 42150 (0.0007) +[2023-10-08 13:27:20,634][102897] Updated weights for policy 0, policy_version 42160 (0.0008) +[2023-10-08 13:27:21,003][102897] Updated weights for policy 0, policy_version 42170 (0.0009) +[2023-10-08 13:27:21,144][102898] Updated weights for policy 1, policy_version 42180 (0.0007) +[2023-10-08 13:27:21,519][102898] Updated weights for policy 1, policy_version 42190 (0.0010) +[2023-10-08 13:27:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 86376448. Throughput: 0: 1789.5, 1: 1776.2. Samples: 21600200. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:21,876][101941] Avg episode reward: [(0, '7.160'), (1, '7.070')] +[2023-10-08 13:27:21,880][102898] Updated weights for policy 1, policy_version 42200 (0.0010) +[2023-10-08 13:27:24,971][102897] Updated weights for policy 0, policy_version 42180 (0.0008) +[2023-10-08 13:27:25,335][102897] Updated weights for policy 0, policy_version 42190 (0.0007) +[2023-10-08 13:27:25,709][102897] Updated weights for policy 0, policy_version 42200 (0.0009) +[2023-10-08 13:27:25,716][102898] Updated weights for policy 1, policy_version 42210 (0.0009) +[2023-10-08 13:27:26,078][102898] Updated weights for policy 1, policy_version 42220 (0.0007) +[2023-10-08 13:27:26,440][102898] Updated weights for policy 1, policy_version 42230 (0.0007) +[2023-10-08 13:27:26,810][102898] Updated weights for policy 1, policy_version 42240 (0.0007) +[2023-10-08 13:27:26,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 86474752. Throughput: 0: 1798.0, 1: 1789.2. Samples: 21621552. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:26,876][101941] Avg episode reward: [(0, '7.570'), (1, '7.190')] +[2023-10-08 13:27:29,394][102897] Updated weights for policy 0, policy_version 42210 (0.0008) +[2023-10-08 13:27:29,776][102897] Updated weights for policy 0, policy_version 42220 (0.0007) +[2023-10-08 13:27:30,151][102897] Updated weights for policy 0, policy_version 42230 (0.0007) +[2023-10-08 13:27:30,512][102897] Updated weights for policy 0, policy_version 42240 (0.0007) +[2023-10-08 13:27:30,703][102898] Updated weights for policy 1, policy_version 42250 (0.0007) +[2023-10-08 13:27:31,062][102898] Updated weights for policy 1, policy_version 42260 (0.0008) +[2023-10-08 13:27:31,428][102898] Updated weights for policy 1, policy_version 42270 (0.0010) +[2023-10-08 13:27:31,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 86540288. Throughput: 0: 1789.1, 1: 1773.3. Samples: 21641692. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:27:31,875][101941] Avg episode reward: [(0, '7.750'), (1, '7.710')] +[2023-10-08 13:27:34,045][102897] Updated weights for policy 0, policy_version 42250 (0.0007) +[2023-10-08 13:27:34,414][102897] Updated weights for policy 0, policy_version 42260 (0.0007) +[2023-10-08 13:27:34,788][102897] Updated weights for policy 0, policy_version 42270 (0.0007) +[2023-10-08 13:27:35,262][102898] Updated weights for policy 1, policy_version 42280 (0.0010) +[2023-10-08 13:27:35,625][102898] Updated weights for policy 1, policy_version 42290 (0.0009) +[2023-10-08 13:27:35,997][102898] Updated weights for policy 1, policy_version 42300 (0.0011) +[2023-10-08 13:27:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 86605824. Throughput: 0: 1807.3, 1: 1782.6. Samples: 21653358. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:27:36,876][101941] Avg episode reward: [(0, '7.080'), (1, '7.760')] +[2023-10-08 13:27:38,630][102897] Updated weights for policy 0, policy_version 42280 (0.0009) +[2023-10-08 13:27:38,998][102897] Updated weights for policy 0, policy_version 42290 (0.0008) +[2023-10-08 13:27:39,365][102897] Updated weights for policy 0, policy_version 42300 (0.0009) +[2023-10-08 13:27:39,675][102898] Updated weights for policy 1, policy_version 42310 (0.0009) +[2023-10-08 13:27:40,041][102898] Updated weights for policy 1, policy_version 42320 (0.0009) +[2023-10-08 13:27:40,406][102898] Updated weights for policy 1, policy_version 42330 (0.0008) +[2023-10-08 13:27:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 86671360. Throughput: 0: 1788.1, 1: 1776.8. Samples: 21673910. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:27:41,876][101941] Avg episode reward: [(0, '6.010'), (1, '7.870')] +[2023-10-08 13:27:43,183][102897] Updated weights for policy 0, policy_version 42310 (0.0008) +[2023-10-08 13:27:43,565][102897] Updated weights for policy 0, policy_version 42320 (0.0007) +[2023-10-08 13:27:43,928][102897] Updated weights for policy 0, policy_version 42330 (0.0007) +[2023-10-08 13:27:44,157][102898] Updated weights for policy 1, policy_version 42340 (0.0007) +[2023-10-08 13:27:44,515][102898] Updated weights for policy 1, policy_version 42350 (0.0008) +[2023-10-08 13:27:44,885][102898] Updated weights for policy 1, policy_version 42360 (0.0007) +[2023-10-08 13:27:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86736896. Throughput: 0: 1788.3, 1: 1774.1. Samples: 21696022. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:27:46,876][101941] Avg episode reward: [(0, '6.440'), (1, '7.420')] +[2023-10-08 13:27:47,766][102897] Updated weights for policy 0, policy_version 42340 (0.0009) +[2023-10-08 13:27:48,134][102897] Updated weights for policy 0, policy_version 42350 (0.0008) +[2023-10-08 13:27:48,507][102897] Updated weights for policy 0, policy_version 42360 (0.0009) +[2023-10-08 13:27:48,549][102898] Updated weights for policy 1, policy_version 42370 (0.0007) +[2023-10-08 13:27:48,919][102898] Updated weights for policy 1, policy_version 42380 (0.0008) +[2023-10-08 13:27:49,279][102898] Updated weights for policy 1, policy_version 42390 (0.0008) +[2023-10-08 13:27:49,660][102898] Updated weights for policy 1, policy_version 42400 (0.0007) +[2023-10-08 13:27:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86802432. Throughput: 0: 1782.5, 1: 1783.4. Samples: 21705934. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:27:51,875][101941] Avg episode reward: [(0, '6.980'), (1, '7.950')] +[2023-10-08 13:27:52,398][102897] Updated weights for policy 0, policy_version 42370 (0.0008) +[2023-10-08 13:27:52,771][102897] Updated weights for policy 0, policy_version 42380 (0.0010) +[2023-10-08 13:27:53,141][102897] Updated weights for policy 0, policy_version 42390 (0.0008) +[2023-10-08 13:27:53,508][102898] Updated weights for policy 1, policy_version 42410 (0.0007) +[2023-10-08 13:27:53,514][102897] Updated weights for policy 0, policy_version 42400 (0.0008) +[2023-10-08 13:27:53,866][102898] Updated weights for policy 1, policy_version 42420 (0.0010) +[2023-10-08 13:27:54,232][102898] Updated weights for policy 1, policy_version 42430 (0.0010) +[2023-10-08 13:27:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 86867968. Throughput: 0: 1776.4, 1: 1777.3. Samples: 21727614. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:27:56,876][101941] Avg episode reward: [(0, '7.040'), (1, '8.520')] +[2023-10-08 13:27:57,316][102897] Updated weights for policy 0, policy_version 42410 (0.0007) +[2023-10-08 13:27:57,687][102897] Updated weights for policy 0, policy_version 42420 (0.0008) +[2023-10-08 13:27:58,054][102897] Updated weights for policy 0, policy_version 42430 (0.0007) +[2023-10-08 13:27:58,102][102898] Updated weights for policy 1, policy_version 42440 (0.0008) +[2023-10-08 13:27:58,481][102898] Updated weights for policy 1, policy_version 42450 (0.0010) +[2023-10-08 13:27:58,849][102898] Updated weights for policy 1, policy_version 42460 (0.0010) +[2023-10-08 13:28:01,796][102897] Updated weights for policy 0, policy_version 42440 (0.0010) +[2023-10-08 13:28:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86933504. Throughput: 0: 1789.5, 1: 1776.5. Samples: 21749660. Policy #0 lag: (min: 31.0, avg: 34.0, max: 63.0) +[2023-10-08 13:28:01,876][101941] Avg episode reward: [(0, '6.710'), (1, '8.370')] +[2023-10-08 13:28:02,177][102897] Updated weights for policy 0, policy_version 42450 (0.0009) +[2023-10-08 13:28:02,549][102897] Updated weights for policy 0, policy_version 42460 (0.0010) +[2023-10-08 13:28:02,574][102898] Updated weights for policy 1, policy_version 42470 (0.0009) +[2023-10-08 13:28:02,939][102898] Updated weights for policy 1, policy_version 42480 (0.0008) +[2023-10-08 13:28:03,302][102898] Updated weights for policy 1, policy_version 42490 (0.0008) +[2023-10-08 13:28:06,343][102897] Updated weights for policy 0, policy_version 42470 (0.0009) +[2023-10-08 13:28:06,724][102897] Updated weights for policy 0, policy_version 42480 (0.0009) +[2023-10-08 13:28:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 86999040. Throughput: 0: 1762.8, 1: 1772.9. Samples: 21759304. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 13:28:06,876][101941] Avg episode reward: [(0, '6.740'), (1, '8.070')] +[2023-10-08 13:28:06,955][102898] Updated weights for policy 1, policy_version 42500 (0.0008) +[2023-10-08 13:28:07,094][102897] Updated weights for policy 0, policy_version 42490 (0.0008) +[2023-10-08 13:28:07,327][102898] Updated weights for policy 1, policy_version 42510 (0.0008) +[2023-10-08 13:28:07,697][102898] Updated weights for policy 1, policy_version 42520 (0.0009) +[2023-10-08 13:28:10,816][102897] Updated weights for policy 0, policy_version 42500 (0.0009) +[2023-10-08 13:28:11,182][102897] Updated weights for policy 0, policy_version 42510 (0.0008) +[2023-10-08 13:28:11,505][102898] Updated weights for policy 1, policy_version 42530 (0.0009) +[2023-10-08 13:28:11,559][102897] Updated weights for policy 0, policy_version 42520 (0.0007) +[2023-10-08 13:28:11,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 87097344. Throughput: 0: 1780.2, 1: 1776.7. Samples: 21781610. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 13:28:11,875][101941] Avg episode reward: [(0, '6.670'), (1, '7.780')] +[2023-10-08 13:28:11,877][102898] Updated weights for policy 1, policy_version 42540 (0.0010) +[2023-10-08 13:28:12,249][102898] Updated weights for policy 1, policy_version 42550 (0.0007) +[2023-10-08 13:28:12,618][102898] Updated weights for policy 1, policy_version 42560 (0.0007) +[2023-10-08 13:28:15,470][102897] Updated weights for policy 0, policy_version 42530 (0.0008) +[2023-10-08 13:28:15,873][102897] Updated weights for policy 0, policy_version 42540 (0.0007) +[2023-10-08 13:28:16,243][102897] Updated weights for policy 0, policy_version 42550 (0.0007) +[2023-10-08 13:28:16,477][102898] Updated weights for policy 1, policy_version 42570 (0.0009) +[2023-10-08 13:28:16,614][102897] Updated weights for policy 0, policy_version 42560 (0.0007) +[2023-10-08 13:28:16,847][102898] Updated weights for policy 1, policy_version 42580 (0.0009) +[2023-10-08 13:28:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 87162880. Throughput: 0: 1767.7, 1: 1798.6. Samples: 21802176. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 13:28:16,875][101941] Avg episode reward: [(0, '6.540'), (1, '7.780')] +[2023-10-08 13:28:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000042560_43581440.pth... +[2023-10-08 13:28:16,926][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000040896_41877504.pth +[2023-10-08 13:28:17,205][102898] Updated weights for policy 1, policy_version 42590 (0.0008) +[2023-10-08 13:28:17,279][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000042592_43614208.pth... +[2023-10-08 13:28:17,308][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000040896_41877504.pth +[2023-10-08 13:28:20,355][102897] Updated weights for policy 0, policy_version 42570 (0.0011) +[2023-10-08 13:28:20,722][102897] Updated weights for policy 0, policy_version 42580 (0.0009) +[2023-10-08 13:28:20,979][102898] Updated weights for policy 1, policy_version 42600 (0.0009) +[2023-10-08 13:28:21,094][102897] Updated weights for policy 0, policy_version 42590 (0.0007) +[2023-10-08 13:28:21,349][102898] Updated weights for policy 1, policy_version 42610 (0.0008) +[2023-10-08 13:28:21,724][102898] Updated weights for policy 1, policy_version 42620 (0.0009) +[2023-10-08 13:28:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 87261184. Throughput: 0: 1773.9, 1: 1780.7. Samples: 21813312. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 13:28:21,876][101941] Avg episode reward: [(0, '6.140'), (1, '7.920')] +[2023-10-08 13:28:24,906][102897] Updated weights for policy 0, policy_version 42600 (0.0007) +[2023-10-08 13:28:25,270][102897] Updated weights for policy 0, policy_version 42610 (0.0008) +[2023-10-08 13:28:25,530][102898] Updated weights for policy 1, policy_version 42630 (0.0008) +[2023-10-08 13:28:25,642][102897] Updated weights for policy 0, policy_version 42620 (0.0009) +[2023-10-08 13:28:25,893][102898] Updated weights for policy 1, policy_version 42640 (0.0010) +[2023-10-08 13:28:26,263][102898] Updated weights for policy 1, policy_version 42650 (0.0009) +[2023-10-08 13:28:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 87326720. Throughput: 0: 1768.1, 1: 1799.4. Samples: 21834446. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 13:28:26,876][101941] Avg episode reward: [(0, '6.220'), (1, '7.470')] +[2023-10-08 13:28:29,282][102897] Updated weights for policy 0, policy_version 42630 (0.0008) +[2023-10-08 13:28:29,652][102897] Updated weights for policy 0, policy_version 42640 (0.0007) +[2023-10-08 13:28:30,023][102897] Updated weights for policy 0, policy_version 42650 (0.0008) +[2023-10-08 13:28:30,129][102898] Updated weights for policy 1, policy_version 42660 (0.0008) +[2023-10-08 13:28:30,496][102898] Updated weights for policy 1, policy_version 42670 (0.0008) +[2023-10-08 13:28:30,856][102898] Updated weights for policy 1, policy_version 42680 (0.0007) +[2023-10-08 13:28:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 87392256. Throughput: 0: 1764.1, 1: 1769.2. Samples: 21855020. Policy #0 lag: (min: 31.0, avg: 36.2, max: 63.0) +[2023-10-08 13:28:31,875][101941] Avg episode reward: [(0, '6.640'), (1, '7.630')] +[2023-10-08 13:28:33,732][102897] Updated weights for policy 0, policy_version 42660 (0.0008) +[2023-10-08 13:28:34,102][102897] Updated weights for policy 0, policy_version 42670 (0.0008) +[2023-10-08 13:28:34,482][102897] Updated weights for policy 0, policy_version 42680 (0.0009) +[2023-10-08 13:28:34,618][102898] Updated weights for policy 1, policy_version 42690 (0.0009) +[2023-10-08 13:28:34,985][102898] Updated weights for policy 1, policy_version 42700 (0.0008) +[2023-10-08 13:28:35,350][102898] Updated weights for policy 1, policy_version 42710 (0.0008) +[2023-10-08 13:28:35,722][102898] Updated weights for policy 1, policy_version 42720 (0.0009) +[2023-10-08 13:28:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 87457792. Throughput: 0: 1779.6, 1: 1792.6. Samples: 21866684. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:28:36,875][101941] Avg episode reward: [(0, '6.580'), (1, '7.940')] +[2023-10-08 13:28:38,215][102897] Updated weights for policy 0, policy_version 42690 (0.0010) +[2023-10-08 13:28:38,591][102897] Updated weights for policy 0, policy_version 42700 (0.0009) +[2023-10-08 13:28:38,959][102897] Updated weights for policy 0, policy_version 42710 (0.0009) +[2023-10-08 13:28:39,332][102897] Updated weights for policy 0, policy_version 42720 (0.0009) +[2023-10-08 13:28:39,683][102898] Updated weights for policy 1, policy_version 42730 (0.0008) +[2023-10-08 13:28:40,064][102898] Updated weights for policy 1, policy_version 42740 (0.0008) +[2023-10-08 13:28:40,436][102898] Updated weights for policy 1, policy_version 42750 (0.0011) +[2023-10-08 13:28:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 87523328. Throughput: 0: 1779.5, 1: 1772.4. Samples: 21887452. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:28:41,875][101941] Avg episode reward: [(0, '6.350'), (1, '8.000')] +[2023-10-08 13:28:43,025][102897] Updated weights for policy 0, policy_version 42730 (0.0008) +[2023-10-08 13:28:43,407][102897] Updated weights for policy 0, policy_version 42740 (0.0009) +[2023-10-08 13:28:43,776][102897] Updated weights for policy 0, policy_version 42750 (0.0009) +[2023-10-08 13:28:44,174][102898] Updated weights for policy 1, policy_version 42760 (0.0010) +[2023-10-08 13:28:44,546][102898] Updated weights for policy 1, policy_version 42770 (0.0007) +[2023-10-08 13:28:44,921][102898] Updated weights for policy 1, policy_version 42780 (0.0008) +[2023-10-08 13:28:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 87588864. Throughput: 0: 1787.5, 1: 1778.2. Samples: 21910118. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:28:46,876][101941] Avg episode reward: [(0, '6.250'), (1, '7.490')] +[2023-10-08 13:28:47,406][102897] Updated weights for policy 0, policy_version 42760 (0.0008) +[2023-10-08 13:28:47,772][102897] Updated weights for policy 0, policy_version 42770 (0.0008) +[2023-10-08 13:28:48,147][102897] Updated weights for policy 0, policy_version 42780 (0.0008) +[2023-10-08 13:28:48,647][102898] Updated weights for policy 1, policy_version 42790 (0.0007) +[2023-10-08 13:28:49,022][102898] Updated weights for policy 1, policy_version 42800 (0.0009) +[2023-10-08 13:28:49,387][102898] Updated weights for policy 1, policy_version 42810 (0.0007) +[2023-10-08 13:28:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 87654400. Throughput: 0: 1788.2, 1: 1784.4. Samples: 21920072. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:28:51,875][101941] Avg episode reward: [(0, '6.870'), (1, '7.120')] +[2023-10-08 13:28:51,933][102897] Updated weights for policy 0, policy_version 42790 (0.0007) +[2023-10-08 13:28:52,300][102897] Updated weights for policy 0, policy_version 42800 (0.0008) +[2023-10-08 13:28:52,671][102897] Updated weights for policy 0, policy_version 42810 (0.0007) +[2023-10-08 13:28:53,134][102898] Updated weights for policy 1, policy_version 42820 (0.0009) +[2023-10-08 13:28:53,510][102898] Updated weights for policy 1, policy_version 42830 (0.0010) +[2023-10-08 13:28:53,873][102898] Updated weights for policy 1, policy_version 42840 (0.0009) +[2023-10-08 13:28:56,556][102897] Updated weights for policy 0, policy_version 42820 (0.0007) +[2023-10-08 13:28:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 87719936. Throughput: 0: 1785.4, 1: 1777.2. Samples: 21941924. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:28:56,876][101941] Avg episode reward: [(0, '6.820'), (1, '7.940')] +[2023-10-08 13:28:56,920][102897] Updated weights for policy 0, policy_version 42830 (0.0007) +[2023-10-08 13:28:57,297][102897] Updated weights for policy 0, policy_version 42840 (0.0007) +[2023-10-08 13:28:57,663][102898] Updated weights for policy 1, policy_version 42850 (0.0009) +[2023-10-08 13:28:58,030][102898] Updated weights for policy 1, policy_version 42860 (0.0008) +[2023-10-08 13:28:58,402][102898] Updated weights for policy 1, policy_version 42870 (0.0009) +[2023-10-08 13:28:58,769][102898] Updated weights for policy 1, policy_version 42880 (0.0008) +[2023-10-08 13:29:01,218][102897] Updated weights for policy 0, policy_version 42850 (0.0007) +[2023-10-08 13:29:01,615][102897] Updated weights for policy 0, policy_version 42860 (0.0007) +[2023-10-08 13:29:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 87785472. Throughput: 0: 1802.7, 1: 1789.1. Samples: 21963808. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:01,876][101941] Avg episode reward: [(0, '6.870'), (1, '8.280')] +[2023-10-08 13:29:01,984][102897] Updated weights for policy 0, policy_version 42870 (0.0009) +[2023-10-08 13:29:02,357][102897] Updated weights for policy 0, policy_version 42880 (0.0009) +[2023-10-08 13:29:02,606][102898] Updated weights for policy 1, policy_version 42890 (0.0008) +[2023-10-08 13:29:02,974][102898] Updated weights for policy 1, policy_version 42900 (0.0008) +[2023-10-08 13:29:03,341][102898] Updated weights for policy 1, policy_version 42910 (0.0008) +[2023-10-08 13:29:06,041][102897] Updated weights for policy 0, policy_version 42890 (0.0008) +[2023-10-08 13:29:06,401][102897] Updated weights for policy 0, policy_version 42900 (0.0008) +[2023-10-08 13:29:06,782][102897] Updated weights for policy 0, policy_version 42910 (0.0008) +[2023-10-08 13:29:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 87883776. Throughput: 0: 1787.0, 1: 1777.7. Samples: 21973722. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:06,876][101941] Avg episode reward: [(0, '6.620'), (1, '8.760')] +[2023-10-08 13:29:07,125][102898] Updated weights for policy 1, policy_version 42920 (0.0007) +[2023-10-08 13:29:07,489][102898] Updated weights for policy 1, policy_version 42930 (0.0009) +[2023-10-08 13:29:07,859][102898] Updated weights for policy 1, policy_version 42940 (0.0008) +[2023-10-08 13:29:10,661][102897] Updated weights for policy 0, policy_version 42920 (0.0008) +[2023-10-08 13:29:11,027][102897] Updated weights for policy 0, policy_version 42930 (0.0008) +[2023-10-08 13:29:11,396][102897] Updated weights for policy 0, policy_version 42940 (0.0008) +[2023-10-08 13:29:11,594][102898] Updated weights for policy 1, policy_version 42950 (0.0009) +[2023-10-08 13:29:11,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 87949312. Throughput: 0: 1807.6, 1: 1778.4. Samples: 21995816. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:11,876][101941] Avg episode reward: [(0, '6.990'), (1, '8.650')] +[2023-10-08 13:29:11,968][102898] Updated weights for policy 1, policy_version 42960 (0.0010) +[2023-10-08 13:29:12,333][102898] Updated weights for policy 1, policy_version 42970 (0.0008) +[2023-10-08 13:29:15,059][102897] Updated weights for policy 0, policy_version 42950 (0.0008) +[2023-10-08 13:29:15,427][102897] Updated weights for policy 0, policy_version 42960 (0.0007) +[2023-10-08 13:29:15,809][102897] Updated weights for policy 0, policy_version 42970 (0.0009) +[2023-10-08 13:29:15,976][102898] Updated weights for policy 1, policy_version 42980 (0.0009) +[2023-10-08 13:29:16,345][102898] Updated weights for policy 1, policy_version 42990 (0.0009) +[2023-10-08 13:29:16,705][102898] Updated weights for policy 1, policy_version 43000 (0.0008) +[2023-10-08 13:29:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 88014848. Throughput: 0: 1786.1, 1: 1796.0. Samples: 22016214. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:16,876][101941] Avg episode reward: [(0, '6.650'), (1, '7.700')] +[2023-10-08 13:29:19,480][102897] Updated weights for policy 0, policy_version 42980 (0.0007) +[2023-10-08 13:29:19,851][102897] Updated weights for policy 0, policy_version 42990 (0.0009) +[2023-10-08 13:29:20,232][102897] Updated weights for policy 0, policy_version 43000 (0.0009) +[2023-10-08 13:29:20,484][102898] Updated weights for policy 1, policy_version 43010 (0.0009) +[2023-10-08 13:29:20,849][102898] Updated weights for policy 1, policy_version 43020 (0.0010) +[2023-10-08 13:29:21,225][102898] Updated weights for policy 1, policy_version 43030 (0.0009) +[2023-10-08 13:29:21,594][102898] Updated weights for policy 1, policy_version 43040 (0.0009) +[2023-10-08 13:29:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 88113152. Throughput: 0: 1807.7, 1: 1777.2. Samples: 22028006. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:21,875][101941] Avg episode reward: [(0, '6.170'), (1, '7.560')] +[2023-10-08 13:29:24,030][102897] Updated weights for policy 0, policy_version 43010 (0.0008) +[2023-10-08 13:29:24,398][102897] Updated weights for policy 0, policy_version 43020 (0.0007) +[2023-10-08 13:29:24,759][102897] Updated weights for policy 0, policy_version 43030 (0.0009) +[2023-10-08 13:29:25,126][102897] Updated weights for policy 0, policy_version 43040 (0.0008) +[2023-10-08 13:29:25,355][102898] Updated weights for policy 1, policy_version 43050 (0.0009) +[2023-10-08 13:29:25,717][102898] Updated weights for policy 1, policy_version 43060 (0.0007) +[2023-10-08 13:29:26,091][102898] Updated weights for policy 1, policy_version 43070 (0.0008) +[2023-10-08 13:29:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 88178688. Throughput: 0: 1778.4, 1: 1794.0. Samples: 22048214. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:26,876][101941] Avg episode reward: [(0, '6.430'), (1, '8.390')] +[2023-10-08 13:29:28,831][102897] Updated weights for policy 0, policy_version 43050 (0.0007) +[2023-10-08 13:29:29,207][102897] Updated weights for policy 0, policy_version 43060 (0.0008) +[2023-10-08 13:29:29,576][102897] Updated weights for policy 0, policy_version 43070 (0.0008) +[2023-10-08 13:29:29,989][102898] Updated weights for policy 1, policy_version 43080 (0.0007) +[2023-10-08 13:29:30,357][102898] Updated weights for policy 1, policy_version 43090 (0.0007) +[2023-10-08 13:29:30,719][102898] Updated weights for policy 1, policy_version 43100 (0.0007) +[2023-10-08 13:29:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 88244224. Throughput: 0: 1777.1, 1: 1777.0. Samples: 22070050. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:31,875][101941] Avg episode reward: [(0, '6.950'), (1, '8.600')] +[2023-10-08 13:29:33,350][102897] Updated weights for policy 0, policy_version 43080 (0.0008) +[2023-10-08 13:29:33,716][102897] Updated weights for policy 0, policy_version 43090 (0.0009) +[2023-10-08 13:29:34,082][102897] Updated weights for policy 0, policy_version 43100 (0.0007) +[2023-10-08 13:29:34,369][102898] Updated weights for policy 1, policy_version 43110 (0.0008) +[2023-10-08 13:29:34,735][102898] Updated weights for policy 1, policy_version 43120 (0.0008) +[2023-10-08 13:29:35,092][102898] Updated weights for policy 1, policy_version 43130 (0.0009) +[2023-10-08 13:29:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 88309760. Throughput: 0: 1775.6, 1: 1795.7. Samples: 22080780. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:29:36,876][101941] Avg episode reward: [(0, '6.820'), (1, '7.530')] +[2023-10-08 13:29:37,913][102897] Updated weights for policy 0, policy_version 43110 (0.0010) +[2023-10-08 13:29:38,281][102897] Updated weights for policy 0, policy_version 43120 (0.0008) +[2023-10-08 13:29:38,651][102897] Updated weights for policy 0, policy_version 43130 (0.0009) +[2023-10-08 13:29:38,902][102898] Updated weights for policy 1, policy_version 43140 (0.0009) +[2023-10-08 13:29:39,270][102898] Updated weights for policy 1, policy_version 43150 (0.0009) +[2023-10-08 13:29:39,637][102898] Updated weights for policy 1, policy_version 43160 (0.0007) +[2023-10-08 13:29:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 88375296. Throughput: 0: 1779.2, 1: 1779.8. Samples: 22102076. Policy #0 lag: (min: 16.0, avg: 44.6, max: 48.0) +[2023-10-08 13:29:41,876][101941] Avg episode reward: [(0, '6.630'), (1, '7.620')] +[2023-10-08 13:29:42,307][102897] Updated weights for policy 0, policy_version 43140 (0.0009) +[2023-10-08 13:29:42,679][102897] Updated weights for policy 0, policy_version 43150 (0.0008) +[2023-10-08 13:29:43,053][102897] Updated weights for policy 0, policy_version 43160 (0.0009) +[2023-10-08 13:29:43,406][102898] Updated weights for policy 1, policy_version 43170 (0.0008) +[2023-10-08 13:29:43,778][102898] Updated weights for policy 1, policy_version 43180 (0.0008) +[2023-10-08 13:29:44,142][102898] Updated weights for policy 1, policy_version 43190 (0.0008) +[2023-10-08 13:29:44,502][102898] Updated weights for policy 1, policy_version 43200 (0.0010) +[2023-10-08 13:29:46,714][102897] Updated weights for policy 0, policy_version 43170 (0.0009) +[2023-10-08 13:29:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 88440832. Throughput: 0: 1796.5, 1: 1772.9. Samples: 22124430. Policy #0 lag: (min: 16.0, avg: 44.6, max: 48.0) +[2023-10-08 13:29:46,876][101941] Avg episode reward: [(0, '6.950'), (1, '8.010')] +[2023-10-08 13:29:47,123][102897] Updated weights for policy 0, policy_version 43180 (0.0010) +[2023-10-08 13:29:47,499][102897] Updated weights for policy 0, policy_version 43190 (0.0009) +[2023-10-08 13:29:47,869][102897] Updated weights for policy 0, policy_version 43200 (0.0009) +[2023-10-08 13:29:48,418][102898] Updated weights for policy 1, policy_version 43210 (0.0009) +[2023-10-08 13:29:48,786][102898] Updated weights for policy 1, policy_version 43220 (0.0009) +[2023-10-08 13:29:49,152][102898] Updated weights for policy 1, policy_version 43230 (0.0010) +[2023-10-08 13:29:51,733][102897] Updated weights for policy 0, policy_version 43210 (0.0007) +[2023-10-08 13:29:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 88506368. Throughput: 0: 1788.9, 1: 1774.5. Samples: 22134074. Policy #0 lag: (min: 16.0, avg: 44.6, max: 48.0) +[2023-10-08 13:29:51,875][101941] Avg episode reward: [(0, '6.840'), (1, '8.100')] +[2023-10-08 13:29:52,095][102897] Updated weights for policy 0, policy_version 43220 (0.0010) +[2023-10-08 13:29:52,470][102897] Updated weights for policy 0, policy_version 43230 (0.0010) +[2023-10-08 13:29:52,840][102898] Updated weights for policy 1, policy_version 43240 (0.0009) +[2023-10-08 13:29:53,206][102898] Updated weights for policy 1, policy_version 43250 (0.0009) +[2023-10-08 13:29:53,576][102898] Updated weights for policy 1, policy_version 43260 (0.0008) +[2023-10-08 13:29:56,287][102897] Updated weights for policy 0, policy_version 43240 (0.0008) +[2023-10-08 13:29:56,652][102897] Updated weights for policy 0, policy_version 43250 (0.0009) +[2023-10-08 13:29:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 88571904. Throughput: 0: 1787.7, 1: 1776.2. Samples: 22156192. Policy #0 lag: (min: 16.0, avg: 44.6, max: 48.0) +[2023-10-08 13:29:56,875][101941] Avg episode reward: [(0, '7.110'), (1, '8.140')] +[2023-10-08 13:29:57,021][102897] Updated weights for policy 0, policy_version 43260 (0.0008) +[2023-10-08 13:29:57,460][102898] Updated weights for policy 1, policy_version 43270 (0.0010) +[2023-10-08 13:29:57,843][102898] Updated weights for policy 1, policy_version 43280 (0.0009) +[2023-10-08 13:29:58,207][102898] Updated weights for policy 1, policy_version 43290 (0.0008) +[2023-10-08 13:30:00,804][102897] Updated weights for policy 0, policy_version 43270 (0.0008) +[2023-10-08 13:30:01,181][102897] Updated weights for policy 0, policy_version 43280 (0.0007) +[2023-10-08 13:30:01,557][102897] Updated weights for policy 0, policy_version 43290 (0.0007) +[2023-10-08 13:30:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 88670208. Throughput: 0: 1795.4, 1: 1786.9. Samples: 22177416. Policy #0 lag: (min: 16.0, avg: 44.6, max: 48.0) +[2023-10-08 13:30:01,876][101941] Avg episode reward: [(0, '7.070'), (1, '8.430')] +[2023-10-08 13:30:02,037][102898] Updated weights for policy 1, policy_version 43300 (0.0009) +[2023-10-08 13:30:02,414][102898] Updated weights for policy 1, policy_version 43310 (0.0009) +[2023-10-08 13:30:02,780][102898] Updated weights for policy 1, policy_version 43320 (0.0007) +[2023-10-08 13:30:05,224][102897] Updated weights for policy 0, policy_version 43300 (0.0009) +[2023-10-08 13:30:05,599][102897] Updated weights for policy 0, policy_version 43310 (0.0007) +[2023-10-08 13:30:05,964][102897] Updated weights for policy 0, policy_version 43320 (0.0008) +[2023-10-08 13:30:06,426][102898] Updated weights for policy 1, policy_version 43330 (0.0007) +[2023-10-08 13:30:06,798][102898] Updated weights for policy 1, policy_version 43340 (0.0008) +[2023-10-08 13:30:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 88735744. Throughput: 0: 1783.5, 1: 1777.9. Samples: 22188270. Policy #0 lag: (min: 16.0, avg: 44.6, max: 48.0) +[2023-10-08 13:30:06,876][101941] Avg episode reward: [(0, '6.850'), (1, '8.850')] +[2023-10-08 13:30:07,161][102898] Updated weights for policy 1, policy_version 43350 (0.0009) +[2023-10-08 13:30:07,526][102898] Updated weights for policy 1, policy_version 43360 (0.0008) +[2023-10-08 13:30:09,787][102897] Updated weights for policy 0, policy_version 43330 (0.0007) +[2023-10-08 13:30:10,161][102897] Updated weights for policy 0, policy_version 43340 (0.0008) +[2023-10-08 13:30:10,530][102897] Updated weights for policy 0, policy_version 43350 (0.0007) +[2023-10-08 13:30:10,903][102897] Updated weights for policy 0, policy_version 43360 (0.0007) +[2023-10-08 13:30:11,481][102898] Updated weights for policy 1, policy_version 43370 (0.0007) +[2023-10-08 13:30:11,844][102898] Updated weights for policy 1, policy_version 43380 (0.0007) +[2023-10-08 13:30:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 88801280. Throughput: 0: 1803.7, 1: 1789.1. Samples: 22209888. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:11,876][101941] Avg episode reward: [(0, '7.180'), (1, '8.990')] +[2023-10-08 13:30:12,210][102898] Updated weights for policy 1, policy_version 43390 (0.0007) +[2023-10-08 13:30:12,275][102760] Saving new best policy, reward=8.990! +[2023-10-08 13:30:14,478][102897] Updated weights for policy 0, policy_version 43370 (0.0007) +[2023-10-08 13:30:14,849][102897] Updated weights for policy 0, policy_version 43380 (0.0010) +[2023-10-08 13:30:15,225][102897] Updated weights for policy 0, policy_version 43390 (0.0008) +[2023-10-08 13:30:15,953][102898] Updated weights for policy 1, policy_version 43400 (0.0007) +[2023-10-08 13:30:16,323][102898] Updated weights for policy 1, policy_version 43410 (0.0008) +[2023-10-08 13:30:16,684][102898] Updated weights for policy 1, policy_version 43420 (0.0009) +[2023-10-08 13:30:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 88899584. Throughput: 0: 1788.8, 1: 1786.0. Samples: 22230918. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:16,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.520')] +[2023-10-08 13:30:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000043424_44466176.pth... +[2023-10-08 13:30:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000043392_44433408.pth... +[2023-10-08 13:30:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000041760_42762240.pth +[2023-10-08 13:30:16,926][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000041728_42729472.pth +[2023-10-08 13:30:18,810][102897] Updated weights for policy 0, policy_version 43400 (0.0007) +[2023-10-08 13:30:19,179][102897] Updated weights for policy 0, policy_version 43410 (0.0008) +[2023-10-08 13:30:19,551][102897] Updated weights for policy 0, policy_version 43420 (0.0009) +[2023-10-08 13:30:20,433][102898] Updated weights for policy 1, policy_version 43430 (0.0008) +[2023-10-08 13:30:20,798][102898] Updated weights for policy 1, policy_version 43440 (0.0008) +[2023-10-08 13:30:21,169][102898] Updated weights for policy 1, policy_version 43450 (0.0010) +[2023-10-08 13:30:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 88965120. Throughput: 0: 1807.7, 1: 1779.3. Samples: 22242196. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:21,876][101941] Avg episode reward: [(0, '7.110'), (1, '7.970')] +[2023-10-08 13:30:23,503][102897] Updated weights for policy 0, policy_version 43430 (0.0010) +[2023-10-08 13:30:23,874][102897] Updated weights for policy 0, policy_version 43440 (0.0009) +[2023-10-08 13:30:24,242][102897] Updated weights for policy 0, policy_version 43450 (0.0011) +[2023-10-08 13:30:24,950][102898] Updated weights for policy 1, policy_version 43460 (0.0009) +[2023-10-08 13:30:25,318][102898] Updated weights for policy 1, policy_version 43470 (0.0008) +[2023-10-08 13:30:25,685][102898] Updated weights for policy 1, policy_version 43480 (0.0011) +[2023-10-08 13:30:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 89030656. Throughput: 0: 1794.4, 1: 1785.5. Samples: 22263172. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:26,876][101941] Avg episode reward: [(0, '6.670'), (1, '7.990')] +[2023-10-08 13:30:27,980][102897] Updated weights for policy 0, policy_version 43460 (0.0008) +[2023-10-08 13:30:28,358][102897] Updated weights for policy 0, policy_version 43470 (0.0008) +[2023-10-08 13:30:28,734][102897] Updated weights for policy 0, policy_version 43480 (0.0008) +[2023-10-08 13:30:29,512][102898] Updated weights for policy 1, policy_version 43490 (0.0009) +[2023-10-08 13:30:29,873][102898] Updated weights for policy 1, policy_version 43500 (0.0007) +[2023-10-08 13:30:30,238][102898] Updated weights for policy 1, policy_version 43510 (0.0008) +[2023-10-08 13:30:30,601][102898] Updated weights for policy 1, policy_version 43520 (0.0007) +[2023-10-08 13:30:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 89096192. Throughput: 0: 1787.9, 1: 1776.5. Samples: 22284830. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:31,876][101941] Avg episode reward: [(0, '7.170'), (1, '8.650')] +[2023-10-08 13:30:32,622][102897] Updated weights for policy 0, policy_version 43490 (0.0007) +[2023-10-08 13:30:33,021][102897] Updated weights for policy 0, policy_version 43500 (0.0008) +[2023-10-08 13:30:33,389][102897] Updated weights for policy 0, policy_version 43510 (0.0010) +[2023-10-08 13:30:33,765][102897] Updated weights for policy 0, policy_version 43520 (0.0008) +[2023-10-08 13:30:34,542][102898] Updated weights for policy 1, policy_version 43530 (0.0009) +[2023-10-08 13:30:34,907][102898] Updated weights for policy 1, policy_version 43540 (0.0007) +[2023-10-08 13:30:35,276][102898] Updated weights for policy 1, policy_version 43550 (0.0008) +[2023-10-08 13:30:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 89161728. Throughput: 0: 1784.8, 1: 1795.1. Samples: 22295168. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:36,876][101941] Avg episode reward: [(0, '6.860'), (1, '8.230')] +[2023-10-08 13:30:37,503][102897] Updated weights for policy 0, policy_version 43530 (0.0011) +[2023-10-08 13:30:37,868][102897] Updated weights for policy 0, policy_version 43540 (0.0010) +[2023-10-08 13:30:38,231][102897] Updated weights for policy 0, policy_version 43550 (0.0010) +[2023-10-08 13:30:39,142][102898] Updated weights for policy 1, policy_version 43560 (0.0008) +[2023-10-08 13:30:39,514][102898] Updated weights for policy 1, policy_version 43570 (0.0008) +[2023-10-08 13:30:39,878][102898] Updated weights for policy 1, policy_version 43580 (0.0009) +[2023-10-08 13:30:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 89227264. Throughput: 0: 1788.8, 1: 1765.0. Samples: 22316116. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 13:30:41,876][101941] Avg episode reward: [(0, '6.610'), (1, '7.670')] +[2023-10-08 13:30:42,051][102897] Updated weights for policy 0, policy_version 43560 (0.0008) +[2023-10-08 13:30:42,419][102897] Updated weights for policy 0, policy_version 43570 (0.0007) +[2023-10-08 13:30:42,793][102897] Updated weights for policy 0, policy_version 43580 (0.0008) +[2023-10-08 13:30:43,680][102898] Updated weights for policy 1, policy_version 43590 (0.0008) +[2023-10-08 13:30:44,052][102898] Updated weights for policy 1, policy_version 43600 (0.0010) +[2023-10-08 13:30:44,421][102898] Updated weights for policy 1, policy_version 43610 (0.0008) +[2023-10-08 13:30:46,513][102897] Updated weights for policy 0, policy_version 43590 (0.0007) +[2023-10-08 13:30:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 89292800. Throughput: 0: 1807.8, 1: 1765.7. Samples: 22338224. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:30:46,876][101941] Avg episode reward: [(0, '6.470'), (1, '7.910')] +[2023-10-08 13:30:46,881][102897] Updated weights for policy 0, policy_version 43600 (0.0008) +[2023-10-08 13:30:47,250][102897] Updated weights for policy 0, policy_version 43610 (0.0007) +[2023-10-08 13:30:48,246][102898] Updated weights for policy 1, policy_version 43620 (0.0009) +[2023-10-08 13:30:48,613][102898] Updated weights for policy 1, policy_version 43630 (0.0010) +[2023-10-08 13:30:48,975][102898] Updated weights for policy 1, policy_version 43640 (0.0010) +[2023-10-08 13:30:51,005][102897] Updated weights for policy 0, policy_version 43620 (0.0009) +[2023-10-08 13:30:51,379][102897] Updated weights for policy 0, policy_version 43630 (0.0008) +[2023-10-08 13:30:51,752][102897] Updated weights for policy 0, policy_version 43640 (0.0008) +[2023-10-08 13:30:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 89358336. Throughput: 0: 1790.4, 1: 1761.3. Samples: 22348096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:30:51,876][101941] Avg episode reward: [(0, '6.310'), (1, '7.710')] +[2023-10-08 13:30:52,688][102898] Updated weights for policy 1, policy_version 43650 (0.0011) +[2023-10-08 13:30:53,058][102898] Updated weights for policy 1, policy_version 43660 (0.0010) +[2023-10-08 13:30:53,433][102898] Updated weights for policy 1, policy_version 43670 (0.0010) +[2023-10-08 13:30:53,804][102898] Updated weights for policy 1, policy_version 43680 (0.0010) +[2023-10-08 13:30:55,501][102897] Updated weights for policy 0, policy_version 43650 (0.0007) +[2023-10-08 13:30:55,870][102897] Updated weights for policy 0, policy_version 43660 (0.0009) +[2023-10-08 13:30:56,243][102897] Updated weights for policy 0, policy_version 43670 (0.0008) +[2023-10-08 13:30:56,609][102897] Updated weights for policy 0, policy_version 43680 (0.0008) +[2023-10-08 13:30:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 89456640. Throughput: 0: 1800.6, 1: 1764.9. Samples: 22370336. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:30:56,876][101941] Avg episode reward: [(0, '7.120'), (1, '7.530')] +[2023-10-08 13:30:57,505][102898] Updated weights for policy 1, policy_version 43690 (0.0011) +[2023-10-08 13:30:57,886][102898] Updated weights for policy 1, policy_version 43700 (0.0010) +[2023-10-08 13:30:58,252][102898] Updated weights for policy 1, policy_version 43710 (0.0008) +[2023-10-08 13:31:00,417][102897] Updated weights for policy 0, policy_version 43690 (0.0009) +[2023-10-08 13:31:00,785][102897] Updated weights for policy 0, policy_version 43700 (0.0008) +[2023-10-08 13:31:01,167][102897] Updated weights for policy 0, policy_version 43710 (0.0009) +[2023-10-08 13:31:01,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 89522176. Throughput: 0: 1775.6, 1: 1793.3. Samples: 22391516. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:01,876][101941] Avg episode reward: [(0, '7.270'), (1, '7.620')] +[2023-10-08 13:31:02,013][102898] Updated weights for policy 1, policy_version 43720 (0.0008) +[2023-10-08 13:31:02,383][102898] Updated weights for policy 1, policy_version 43730 (0.0008) +[2023-10-08 13:31:02,756][102898] Updated weights for policy 1, policy_version 43740 (0.0008) +[2023-10-08 13:31:04,853][102897] Updated weights for policy 0, policy_version 43720 (0.0008) +[2023-10-08 13:31:05,226][102897] Updated weights for policy 0, policy_version 43730 (0.0008) +[2023-10-08 13:31:05,600][102897] Updated weights for policy 0, policy_version 43740 (0.0009) +[2023-10-08 13:31:06,476][102898] Updated weights for policy 1, policy_version 43750 (0.0010) +[2023-10-08 13:31:06,834][102898] Updated weights for policy 1, policy_version 43760 (0.0009) +[2023-10-08 13:31:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 89587712. Throughput: 0: 1796.5, 1: 1773.9. Samples: 22402862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:06,876][101941] Avg episode reward: [(0, '7.030'), (1, '8.150')] +[2023-10-08 13:31:07,212][102898] Updated weights for policy 1, policy_version 43770 (0.0009) +[2023-10-08 13:31:09,285][102897] Updated weights for policy 0, policy_version 43750 (0.0009) +[2023-10-08 13:31:09,659][102897] Updated weights for policy 0, policy_version 43760 (0.0007) +[2023-10-08 13:31:10,029][102897] Updated weights for policy 0, policy_version 43770 (0.0008) +[2023-10-08 13:31:10,838][102898] Updated weights for policy 1, policy_version 43780 (0.0008) +[2023-10-08 13:31:11,206][102898] Updated weights for policy 1, policy_version 43790 (0.0007) +[2023-10-08 13:31:11,571][102898] Updated weights for policy 1, policy_version 43800 (0.0007) +[2023-10-08 13:31:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 89686016. Throughput: 0: 1779.7, 1: 1799.9. Samples: 22424256. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:11,875][101941] Avg episode reward: [(0, '7.640'), (1, '7.360')] +[2023-10-08 13:31:13,777][102897] Updated weights for policy 0, policy_version 43780 (0.0008) +[2023-10-08 13:31:14,148][102897] Updated weights for policy 0, policy_version 43790 (0.0009) +[2023-10-08 13:31:14,521][102897] Updated weights for policy 0, policy_version 43800 (0.0007) +[2023-10-08 13:31:15,412][102898] Updated weights for policy 1, policy_version 43810 (0.0009) +[2023-10-08 13:31:15,773][102898] Updated weights for policy 1, policy_version 43820 (0.0008) +[2023-10-08 13:31:16,139][102898] Updated weights for policy 1, policy_version 43830 (0.0008) +[2023-10-08 13:31:16,503][102898] Updated weights for policy 1, policy_version 43840 (0.0007) +[2023-10-08 13:31:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 89751552. Throughput: 0: 1786.2, 1: 1784.9. Samples: 22445528. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:16,876][101941] Avg episode reward: [(0, '7.560'), (1, '6.930')] +[2023-10-08 13:31:18,218][102897] Updated weights for policy 0, policy_version 43810 (0.0007) +[2023-10-08 13:31:18,607][102897] Updated weights for policy 0, policy_version 43820 (0.0009) +[2023-10-08 13:31:18,988][102897] Updated weights for policy 0, policy_version 43830 (0.0010) +[2023-10-08 13:31:19,355][102897] Updated weights for policy 0, policy_version 43840 (0.0011) +[2023-10-08 13:31:20,322][102898] Updated weights for policy 1, policy_version 43850 (0.0008) +[2023-10-08 13:31:20,695][102898] Updated weights for policy 1, policy_version 43860 (0.0009) +[2023-10-08 13:31:21,053][102898] Updated weights for policy 1, policy_version 43870 (0.0007) +[2023-10-08 13:31:21,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 89817088. Throughput: 0: 1793.5, 1: 1799.2. Samples: 22456842. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:21,876][101941] Avg episode reward: [(0, '6.940'), (1, '8.070')] +[2023-10-08 13:31:23,058][102897] Updated weights for policy 0, policy_version 43850 (0.0009) +[2023-10-08 13:31:23,417][102897] Updated weights for policy 0, policy_version 43860 (0.0007) +[2023-10-08 13:31:23,786][102897] Updated weights for policy 0, policy_version 43870 (0.0007) +[2023-10-08 13:31:24,640][102898] Updated weights for policy 1, policy_version 43880 (0.0007) +[2023-10-08 13:31:25,006][102898] Updated weights for policy 1, policy_version 43890 (0.0008) +[2023-10-08 13:31:25,368][102898] Updated weights for policy 1, policy_version 43900 (0.0007) +[2023-10-08 13:31:26,876][101941] Fps is (10 sec: 13106.3, 60 sec: 14199.3, 300 sec: 14217.9). Total num frames: 89882624. Throughput: 0: 1790.5, 1: 1803.7. Samples: 22477860. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:26,877][101941] Avg episode reward: [(0, '6.360'), (1, '7.760')] +[2023-10-08 13:31:27,556][102897] Updated weights for policy 0, policy_version 43880 (0.0008) +[2023-10-08 13:31:27,935][102897] Updated weights for policy 0, policy_version 43890 (0.0007) +[2023-10-08 13:31:28,307][102897] Updated weights for policy 0, policy_version 43900 (0.0008) +[2023-10-08 13:31:29,166][102898] Updated weights for policy 1, policy_version 43910 (0.0008) +[2023-10-08 13:31:29,526][102898] Updated weights for policy 1, policy_version 43920 (0.0007) +[2023-10-08 13:31:29,899][102898] Updated weights for policy 1, policy_version 43930 (0.0007) +[2023-10-08 13:31:31,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 89948160. Throughput: 0: 1796.4, 1: 1804.6. Samples: 22500266. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:31,875][101941] Avg episode reward: [(0, '6.160'), (1, '7.030')] +[2023-10-08 13:31:32,048][102897] Updated weights for policy 0, policy_version 43910 (0.0007) +[2023-10-08 13:31:32,425][102897] Updated weights for policy 0, policy_version 43920 (0.0007) +[2023-10-08 13:31:32,790][102897] Updated weights for policy 0, policy_version 43930 (0.0007) +[2023-10-08 13:31:33,555][102898] Updated weights for policy 1, policy_version 43940 (0.0007) +[2023-10-08 13:31:33,922][102898] Updated weights for policy 1, policy_version 43950 (0.0008) +[2023-10-08 13:31:34,296][102898] Updated weights for policy 1, policy_version 43960 (0.0009) +[2023-10-08 13:31:36,542][102897] Updated weights for policy 0, policy_version 43940 (0.0009) +[2023-10-08 13:31:36,875][101941] Fps is (10 sec: 13108.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 90013696. Throughput: 0: 1793.0, 1: 1810.4. Samples: 22510250. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:36,876][101941] Avg episode reward: [(0, '6.170'), (1, '7.440')] +[2023-10-08 13:31:36,901][102897] Updated weights for policy 0, policy_version 43950 (0.0009) +[2023-10-08 13:31:37,273][102897] Updated weights for policy 0, policy_version 43960 (0.0008) +[2023-10-08 13:31:38,247][102898] Updated weights for policy 1, policy_version 43970 (0.0008) +[2023-10-08 13:31:38,611][102898] Updated weights for policy 1, policy_version 43980 (0.0009) +[2023-10-08 13:31:38,972][102898] Updated weights for policy 1, policy_version 43990 (0.0008) +[2023-10-08 13:31:39,340][102898] Updated weights for policy 1, policy_version 44000 (0.0007) +[2023-10-08 13:31:41,029][102897] Updated weights for policy 0, policy_version 43970 (0.0009) +[2023-10-08 13:31:41,395][102897] Updated weights for policy 0, policy_version 43980 (0.0007) +[2023-10-08 13:31:41,769][102897] Updated weights for policy 0, policy_version 43990 (0.0008) +[2023-10-08 13:31:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 90079232. Throughput: 0: 1796.4, 1: 1800.7. Samples: 22532204. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:41,875][101941] Avg episode reward: [(0, '6.810'), (1, '7.210')] +[2023-10-08 13:31:42,149][102897] Updated weights for policy 0, policy_version 44000 (0.0008) +[2023-10-08 13:31:43,279][102898] Updated weights for policy 1, policy_version 44010 (0.0008) +[2023-10-08 13:31:43,637][102898] Updated weights for policy 1, policy_version 44020 (0.0007) +[2023-10-08 13:31:44,001][102898] Updated weights for policy 1, policy_version 44030 (0.0007) +[2023-10-08 13:31:45,937][102897] Updated weights for policy 0, policy_version 44010 (0.0008) +[2023-10-08 13:31:46,310][102897] Updated weights for policy 0, policy_version 44020 (0.0007) +[2023-10-08 13:31:46,681][102897] Updated weights for policy 0, policy_version 44030 (0.0008) +[2023-10-08 13:31:46,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 90177536. Throughput: 0: 1808.8, 1: 1790.2. Samples: 22553468. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:46,875][101941] Avg episode reward: [(0, '6.540'), (1, '8.060')] +[2023-10-08 13:31:47,708][102898] Updated weights for policy 1, policy_version 44040 (0.0008) +[2023-10-08 13:31:48,071][102898] Updated weights for policy 1, policy_version 44050 (0.0009) +[2023-10-08 13:31:48,431][102898] Updated weights for policy 1, policy_version 44060 (0.0011) +[2023-10-08 13:31:50,437][102897] Updated weights for policy 0, policy_version 44040 (0.0007) +[2023-10-08 13:31:50,819][102897] Updated weights for policy 0, policy_version 44050 (0.0007) +[2023-10-08 13:31:51,186][102897] Updated weights for policy 0, policy_version 44060 (0.0009) +[2023-10-08 13:31:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 90243072. Throughput: 0: 1795.8, 1: 1792.5. Samples: 22564336. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:51,875][101941] Avg episode reward: [(0, '7.300'), (1, '7.910')] +[2023-10-08 13:31:52,172][102898] Updated weights for policy 1, policy_version 44070 (0.0011) +[2023-10-08 13:31:52,539][102898] Updated weights for policy 1, policy_version 44080 (0.0008) +[2023-10-08 13:31:52,904][102898] Updated weights for policy 1, policy_version 44090 (0.0009) +[2023-10-08 13:31:54,926][102897] Updated weights for policy 0, policy_version 44070 (0.0008) +[2023-10-08 13:31:55,303][102897] Updated weights for policy 0, policy_version 44080 (0.0009) +[2023-10-08 13:31:55,673][102897] Updated weights for policy 0, policy_version 44090 (0.0011) +[2023-10-08 13:31:56,664][102898] Updated weights for policy 1, policy_version 44100 (0.0009) +[2023-10-08 13:31:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 90308608. Throughput: 0: 1803.2, 1: 1785.8. Samples: 22585760. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:31:56,875][101941] Avg episode reward: [(0, '6.800'), (1, '7.430')] +[2023-10-08 13:31:57,023][102898] Updated weights for policy 1, policy_version 44110 (0.0007) +[2023-10-08 13:31:57,392][102898] Updated weights for policy 1, policy_version 44120 (0.0009) +[2023-10-08 13:31:59,600][102897] Updated weights for policy 0, policy_version 44100 (0.0009) +[2023-10-08 13:31:59,967][102897] Updated weights for policy 0, policy_version 44110 (0.0010) +[2023-10-08 13:32:00,333][102897] Updated weights for policy 0, policy_version 44120 (0.0009) +[2023-10-08 13:32:01,014][102898] Updated weights for policy 1, policy_version 44130 (0.0008) +[2023-10-08 13:32:01,391][102898] Updated weights for policy 1, policy_version 44140 (0.0009) +[2023-10-08 13:32:01,763][102898] Updated weights for policy 1, policy_version 44150 (0.0010) +[2023-10-08 13:32:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 90374144. Throughput: 0: 1779.4, 1: 1802.9. Samples: 22606732. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:32:01,876][101941] Avg episode reward: [(0, '6.650'), (1, '7.640')] +[2023-10-08 13:32:02,132][102898] Updated weights for policy 1, policy_version 44160 (0.0008) +[2023-10-08 13:32:04,240][102897] Updated weights for policy 0, policy_version 44130 (0.0010) +[2023-10-08 13:32:04,622][102897] Updated weights for policy 0, policy_version 44140 (0.0010) +[2023-10-08 13:32:04,983][102897] Updated weights for policy 0, policy_version 44150 (0.0008) +[2023-10-08 13:32:05,356][102897] Updated weights for policy 0, policy_version 44160 (0.0007) +[2023-10-08 13:32:05,927][102898] Updated weights for policy 1, policy_version 44170 (0.0009) +[2023-10-08 13:32:06,295][102898] Updated weights for policy 1, policy_version 44180 (0.0009) +[2023-10-08 13:32:06,659][102898] Updated weights for policy 1, policy_version 44190 (0.0008) +[2023-10-08 13:32:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 90472448. Throughput: 0: 1800.0, 1: 1787.4. Samples: 22618274. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:32:06,876][101941] Avg episode reward: [(0, '7.340'), (1, '8.450')] +[2023-10-08 13:32:09,075][102897] Updated weights for policy 0, policy_version 44170 (0.0010) +[2023-10-08 13:32:09,457][102897] Updated weights for policy 0, policy_version 44180 (0.0009) +[2023-10-08 13:32:09,826][102897] Updated weights for policy 0, policy_version 44190 (0.0008) +[2023-10-08 13:32:10,417][102898] Updated weights for policy 1, policy_version 44200 (0.0008) +[2023-10-08 13:32:10,782][102898] Updated weights for policy 1, policy_version 44210 (0.0008) +[2023-10-08 13:32:11,150][102898] Updated weights for policy 1, policy_version 44220 (0.0007) +[2023-10-08 13:32:11,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 90537984. Throughput: 0: 1775.4, 1: 1804.2. Samples: 22638936. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:32:11,876][101941] Avg episode reward: [(0, '7.670'), (1, '8.040')] +[2023-10-08 13:32:13,623][102897] Updated weights for policy 0, policy_version 44200 (0.0008) +[2023-10-08 13:32:14,008][102897] Updated weights for policy 0, policy_version 44210 (0.0009) +[2023-10-08 13:32:14,374][102897] Updated weights for policy 0, policy_version 44220 (0.0007) +[2023-10-08 13:32:14,838][102898] Updated weights for policy 1, policy_version 44230 (0.0009) +[2023-10-08 13:32:15,213][102898] Updated weights for policy 1, policy_version 44240 (0.0007) +[2023-10-08 13:32:15,565][102898] Updated weights for policy 1, policy_version 44250 (0.0007) +[2023-10-08 13:32:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 90603520. Throughput: 0: 1777.9, 1: 1788.9. Samples: 22660772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:32:16,876][101941] Avg episode reward: [(0, '7.210'), (1, '7.960')] +[2023-10-08 13:32:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000044224_45285376.pth... +[2023-10-08 13:32:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000044256_45318144.pth... +[2023-10-08 13:32:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000042560_43581440.pth +[2023-10-08 13:32:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000042592_43614208.pth +[2023-10-08 13:32:18,085][102897] Updated weights for policy 0, policy_version 44230 (0.0008) +[2023-10-08 13:32:18,457][102897] Updated weights for policy 0, policy_version 44240 (0.0007) +[2023-10-08 13:32:18,832][102897] Updated weights for policy 0, policy_version 44250 (0.0007) +[2023-10-08 13:32:19,031][102898] Updated weights for policy 1, policy_version 44260 (0.0007) +[2023-10-08 13:32:19,398][102898] Updated weights for policy 1, policy_version 44270 (0.0010) +[2023-10-08 13:32:19,759][102898] Updated weights for policy 1, policy_version 44280 (0.0008) +[2023-10-08 13:32:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 90669056. Throughput: 0: 1777.6, 1: 1805.7. Samples: 22671498. Policy #0 lag: (min: 24.0, avg: 39.1, max: 40.0) +[2023-10-08 13:32:21,876][101941] Avg episode reward: [(0, '7.300'), (1, '8.290')] +[2023-10-08 13:32:22,592][102897] Updated weights for policy 0, policy_version 44260 (0.0008) +[2023-10-08 13:32:22,963][102897] Updated weights for policy 0, policy_version 44270 (0.0010) +[2023-10-08 13:32:23,332][102897] Updated weights for policy 0, policy_version 44280 (0.0010) +[2023-10-08 13:32:23,534][102898] Updated weights for policy 1, policy_version 44290 (0.0010) +[2023-10-08 13:32:23,902][102898] Updated weights for policy 1, policy_version 44300 (0.0007) +[2023-10-08 13:32:24,259][102898] Updated weights for policy 1, policy_version 44310 (0.0007) +[2023-10-08 13:32:24,622][102898] Updated weights for policy 1, policy_version 44320 (0.0008) +[2023-10-08 13:32:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.7, 300 sec: 14218.0). Total num frames: 90734592. Throughput: 0: 1775.1, 1: 1794.8. Samples: 22692850. Policy #0 lag: (min: 24.0, avg: 39.1, max: 40.0) +[2023-10-08 13:32:26,875][101941] Avg episode reward: [(0, '7.310'), (1, '8.350')] +[2023-10-08 13:32:27,090][102897] Updated weights for policy 0, policy_version 44290 (0.0007) +[2023-10-08 13:32:27,461][102897] Updated weights for policy 0, policy_version 44300 (0.0009) +[2023-10-08 13:32:27,828][102897] Updated weights for policy 0, policy_version 44310 (0.0009) +[2023-10-08 13:32:28,196][102897] Updated weights for policy 0, policy_version 44320 (0.0008) +[2023-10-08 13:32:28,486][102898] Updated weights for policy 1, policy_version 44330 (0.0007) +[2023-10-08 13:32:28,847][102898] Updated weights for policy 1, policy_version 44340 (0.0007) +[2023-10-08 13:32:29,210][102898] Updated weights for policy 1, policy_version 44350 (0.0009) +[2023-10-08 13:32:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 90800128. Throughput: 0: 1797.1, 1: 1789.9. Samples: 22714882. Policy #0 lag: (min: 24.0, avg: 39.1, max: 40.0) +[2023-10-08 13:32:31,876][101941] Avg episode reward: [(0, '6.920'), (1, '8.050')] +[2023-10-08 13:32:32,080][102897] Updated weights for policy 0, policy_version 44330 (0.0008) +[2023-10-08 13:32:32,460][102897] Updated weights for policy 0, policy_version 44340 (0.0009) +[2023-10-08 13:32:32,837][102897] Updated weights for policy 0, policy_version 44350 (0.0008) +[2023-10-08 13:32:32,937][102898] Updated weights for policy 1, policy_version 44360 (0.0008) +[2023-10-08 13:32:33,306][102898] Updated weights for policy 1, policy_version 44370 (0.0008) +[2023-10-08 13:32:33,675][102898] Updated weights for policy 1, policy_version 44380 (0.0007) +[2023-10-08 13:32:36,640][102897] Updated weights for policy 0, policy_version 44360 (0.0008) +[2023-10-08 13:32:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 90865664. Throughput: 0: 1770.2, 1: 1790.3. Samples: 22724560. Policy #0 lag: (min: 24.0, avg: 39.1, max: 40.0) +[2023-10-08 13:32:36,876][101941] Avg episode reward: [(0, '6.240'), (1, '8.250')] +[2023-10-08 13:32:37,014][102897] Updated weights for policy 0, policy_version 44370 (0.0008) +[2023-10-08 13:32:37,386][102897] Updated weights for policy 0, policy_version 44380 (0.0007) +[2023-10-08 13:32:37,437][102898] Updated weights for policy 1, policy_version 44390 (0.0008) +[2023-10-08 13:32:37,804][102898] Updated weights for policy 1, policy_version 44400 (0.0008) +[2023-10-08 13:32:38,173][102898] Updated weights for policy 1, policy_version 44410 (0.0008) +[2023-10-08 13:32:41,010][102897] Updated weights for policy 0, policy_version 44390 (0.0007) +[2023-10-08 13:32:41,384][102897] Updated weights for policy 0, policy_version 44400 (0.0009) +[2023-10-08 13:32:41,752][102897] Updated weights for policy 0, policy_version 44410 (0.0010) +[2023-10-08 13:32:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 90931200. Throughput: 0: 1791.7, 1: 1790.6. Samples: 22746966. Policy #0 lag: (min: 24.0, avg: 39.1, max: 40.0) +[2023-10-08 13:32:41,876][101941] Avg episode reward: [(0, '6.180'), (1, '8.390')] +[2023-10-08 13:32:42,073][102898] Updated weights for policy 1, policy_version 44420 (0.0009) +[2023-10-08 13:32:42,445][102898] Updated weights for policy 1, policy_version 44430 (0.0008) +[2023-10-08 13:32:42,819][102898] Updated weights for policy 1, policy_version 44440 (0.0007) +[2023-10-08 13:32:45,470][102897] Updated weights for policy 0, policy_version 44420 (0.0009) +[2023-10-08 13:32:45,839][102897] Updated weights for policy 0, policy_version 44430 (0.0009) +[2023-10-08 13:32:46,215][102897] Updated weights for policy 0, policy_version 44440 (0.0010) +[2023-10-08 13:32:46,698][102898] Updated weights for policy 1, policy_version 44450 (0.0008) +[2023-10-08 13:32:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 91029504. Throughput: 0: 1785.2, 1: 1799.7. Samples: 22768050. Policy #0 lag: (min: 24.0, avg: 39.1, max: 40.0) +[2023-10-08 13:32:46,875][101941] Avg episode reward: [(0, '7.230'), (1, '8.270')] +[2023-10-08 13:32:47,064][102898] Updated weights for policy 1, policy_version 44460 (0.0008) +[2023-10-08 13:32:47,432][102898] Updated weights for policy 1, policy_version 44470 (0.0009) +[2023-10-08 13:32:47,803][102898] Updated weights for policy 1, policy_version 44480 (0.0009) +[2023-10-08 13:32:50,053][102897] Updated weights for policy 0, policy_version 44450 (0.0008) +[2023-10-08 13:32:50,426][102897] Updated weights for policy 0, policy_version 44460 (0.0009) +[2023-10-08 13:32:50,804][102897] Updated weights for policy 0, policy_version 44470 (0.0007) +[2023-10-08 13:32:51,177][102897] Updated weights for policy 0, policy_version 44480 (0.0007) +[2023-10-08 13:32:51,640][102898] Updated weights for policy 1, policy_version 44490 (0.0007) +[2023-10-08 13:32:51,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 91095040. Throughput: 0: 1787.4, 1: 1780.7. Samples: 22778836. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:32:51,875][101941] Avg episode reward: [(0, '7.350'), (1, '8.140')] +[2023-10-08 13:32:52,007][102898] Updated weights for policy 1, policy_version 44500 (0.0007) +[2023-10-08 13:32:52,388][102898] Updated weights for policy 1, policy_version 44510 (0.0008) +[2023-10-08 13:32:54,999][102897] Updated weights for policy 0, policy_version 44490 (0.0008) +[2023-10-08 13:32:55,369][102897] Updated weights for policy 0, policy_version 44500 (0.0008) +[2023-10-08 13:32:55,751][102897] Updated weights for policy 0, policy_version 44510 (0.0009) +[2023-10-08 13:32:56,136][102898] Updated weights for policy 1, policy_version 44520 (0.0007) +[2023-10-08 13:32:56,510][102898] Updated weights for policy 1, policy_version 44530 (0.0008) +[2023-10-08 13:32:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 91160576. Throughput: 0: 1795.9, 1: 1788.9. Samples: 22800252. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:32:56,876][101941] Avg episode reward: [(0, '7.160'), (1, '8.810')] +[2023-10-08 13:32:56,880][102898] Updated weights for policy 1, policy_version 44540 (0.0008) +[2023-10-08 13:32:59,432][102897] Updated weights for policy 0, policy_version 44520 (0.0009) +[2023-10-08 13:32:59,806][102897] Updated weights for policy 0, policy_version 44530 (0.0011) +[2023-10-08 13:33:00,182][102897] Updated weights for policy 0, policy_version 44540 (0.0008) +[2023-10-08 13:33:00,777][102898] Updated weights for policy 1, policy_version 44550 (0.0009) +[2023-10-08 13:33:01,145][102898] Updated weights for policy 1, policy_version 44560 (0.0009) +[2023-10-08 13:33:01,516][102898] Updated weights for policy 1, policy_version 44570 (0.0009) +[2023-10-08 13:33:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 91258880. Throughput: 0: 1778.8, 1: 1781.4. Samples: 22820980. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:01,876][101941] Avg episode reward: [(0, '7.620'), (1, '8.680')] +[2023-10-08 13:33:03,941][102897] Updated weights for policy 0, policy_version 44550 (0.0010) +[2023-10-08 13:33:04,311][102897] Updated weights for policy 0, policy_version 44560 (0.0009) +[2023-10-08 13:33:04,678][102897] Updated weights for policy 0, policy_version 44570 (0.0010) +[2023-10-08 13:33:05,172][102898] Updated weights for policy 1, policy_version 44580 (0.0008) +[2023-10-08 13:33:05,545][102898] Updated weights for policy 1, policy_version 44590 (0.0008) +[2023-10-08 13:33:05,910][102898] Updated weights for policy 1, policy_version 44600 (0.0007) +[2023-10-08 13:33:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 91324416. Throughput: 0: 1793.6, 1: 1785.9. Samples: 22832572. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:06,876][101941] Avg episode reward: [(0, '8.470'), (1, '8.360')] +[2023-10-08 13:33:06,877][102634] Saving new best policy, reward=8.470! +[2023-10-08 13:33:08,507][102897] Updated weights for policy 0, policy_version 44580 (0.0008) +[2023-10-08 13:33:08,871][102897] Updated weights for policy 0, policy_version 44590 (0.0009) +[2023-10-08 13:33:09,246][102897] Updated weights for policy 0, policy_version 44600 (0.0008) +[2023-10-08 13:33:09,543][102898] Updated weights for policy 1, policy_version 44610 (0.0007) +[2023-10-08 13:33:09,904][102898] Updated weights for policy 1, policy_version 44620 (0.0007) +[2023-10-08 13:33:10,275][102898] Updated weights for policy 1, policy_version 44630 (0.0008) +[2023-10-08 13:33:10,642][102898] Updated weights for policy 1, policy_version 44640 (0.0010) +[2023-10-08 13:33:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 91389952. Throughput: 0: 1785.3, 1: 1783.1. Samples: 22853428. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:11,876][101941] Avg episode reward: [(0, '8.360'), (1, '8.160')] +[2023-10-08 13:33:13,183][102897] Updated weights for policy 0, policy_version 44610 (0.0007) +[2023-10-08 13:33:13,551][102897] Updated weights for policy 0, policy_version 44620 (0.0009) +[2023-10-08 13:33:13,926][102897] Updated weights for policy 0, policy_version 44630 (0.0008) +[2023-10-08 13:33:14,291][102897] Updated weights for policy 0, policy_version 44640 (0.0009) +[2023-10-08 13:33:14,401][102898] Updated weights for policy 1, policy_version 44650 (0.0007) +[2023-10-08 13:33:14,763][102898] Updated weights for policy 1, policy_version 44660 (0.0008) +[2023-10-08 13:33:15,136][102898] Updated weights for policy 1, policy_version 44670 (0.0008) +[2023-10-08 13:33:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 91455488. Throughput: 0: 1780.8, 1: 1779.2. Samples: 22875078. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:16,876][101941] Avg episode reward: [(0, '7.570'), (1, '7.950')] +[2023-10-08 13:33:17,821][102897] Updated weights for policy 0, policy_version 44650 (0.0007) +[2023-10-08 13:33:18,203][102897] Updated weights for policy 0, policy_version 44660 (0.0011) +[2023-10-08 13:33:18,571][102897] Updated weights for policy 0, policy_version 44670 (0.0009) +[2023-10-08 13:33:18,961][102898] Updated weights for policy 1, policy_version 44680 (0.0010) +[2023-10-08 13:33:19,323][102898] Updated weights for policy 1, policy_version 44690 (0.0009) +[2023-10-08 13:33:19,690][102898] Updated weights for policy 1, policy_version 44700 (0.0008) +[2023-10-08 13:33:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 91521024. Throughput: 0: 1782.8, 1: 1789.6. Samples: 22885318. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:21,876][101941] Avg episode reward: [(0, '6.950'), (1, '7.790')] +[2023-10-08 13:33:22,318][102897] Updated weights for policy 0, policy_version 44680 (0.0007) +[2023-10-08 13:33:22,691][102897] Updated weights for policy 0, policy_version 44690 (0.0007) +[2023-10-08 13:33:23,065][102897] Updated weights for policy 0, policy_version 44700 (0.0009) +[2023-10-08 13:33:23,485][102898] Updated weights for policy 1, policy_version 44710 (0.0008) +[2023-10-08 13:33:23,845][102898] Updated weights for policy 1, policy_version 44720 (0.0008) +[2023-10-08 13:33:24,216][102898] Updated weights for policy 1, policy_version 44730 (0.0009) +[2023-10-08 13:33:26,762][102897] Updated weights for policy 0, policy_version 44710 (0.0008) +[2023-10-08 13:33:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 91586560. Throughput: 0: 1786.5, 1: 1775.7. Samples: 22907264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:26,876][101941] Avg episode reward: [(0, '7.100'), (1, '8.380')] +[2023-10-08 13:33:27,128][102897] Updated weights for policy 0, policy_version 44720 (0.0008) +[2023-10-08 13:33:27,505][102897] Updated weights for policy 0, policy_version 44730 (0.0008) +[2023-10-08 13:33:28,031][102898] Updated weights for policy 1, policy_version 44740 (0.0010) +[2023-10-08 13:33:28,397][102898] Updated weights for policy 1, policy_version 44750 (0.0010) +[2023-10-08 13:33:28,758][102898] Updated weights for policy 1, policy_version 44760 (0.0007) +[2023-10-08 13:33:31,068][102897] Updated weights for policy 0, policy_version 44740 (0.0008) +[2023-10-08 13:33:31,444][102897] Updated weights for policy 0, policy_version 44750 (0.0008) +[2023-10-08 13:33:31,819][102897] Updated weights for policy 0, policy_version 44760 (0.0009) +[2023-10-08 13:33:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 91652096. Throughput: 0: 1803.8, 1: 1781.6. Samples: 22929392. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:31,876][101941] Avg episode reward: [(0, '6.790'), (1, '7.910')] +[2023-10-08 13:33:32,578][102898] Updated weights for policy 1, policy_version 44770 (0.0009) +[2023-10-08 13:33:32,950][102898] Updated weights for policy 1, policy_version 44780 (0.0011) +[2023-10-08 13:33:33,307][102898] Updated weights for policy 1, policy_version 44790 (0.0007) +[2023-10-08 13:33:33,680][102898] Updated weights for policy 1, policy_version 44800 (0.0010) +[2023-10-08 13:33:35,739][102897] Updated weights for policy 0, policy_version 44770 (0.0010) +[2023-10-08 13:33:36,155][102897] Updated weights for policy 0, policy_version 44780 (0.0008) +[2023-10-08 13:33:36,518][102897] Updated weights for policy 0, policy_version 44790 (0.0008) +[2023-10-08 13:33:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 91717632. Throughput: 0: 1788.4, 1: 1784.6. Samples: 22939622. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:36,876][101941] Avg episode reward: [(0, '7.480'), (1, '8.390')] +[2023-10-08 13:33:36,893][102897] Updated weights for policy 0, policy_version 44800 (0.0008) +[2023-10-08 13:33:37,506][102898] Updated weights for policy 1, policy_version 44810 (0.0009) +[2023-10-08 13:33:37,878][102898] Updated weights for policy 1, policy_version 44820 (0.0011) +[2023-10-08 13:33:38,254][102898] Updated weights for policy 1, policy_version 44830 (0.0010) +[2023-10-08 13:33:40,634][102897] Updated weights for policy 0, policy_version 44810 (0.0009) +[2023-10-08 13:33:41,004][102897] Updated weights for policy 0, policy_version 44820 (0.0007) +[2023-10-08 13:33:41,369][102897] Updated weights for policy 0, policy_version 44830 (0.0008) +[2023-10-08 13:33:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 91815936. Throughput: 0: 1800.4, 1: 1787.6. Samples: 22961710. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:41,876][101941] Avg episode reward: [(0, '7.360'), (1, '8.470')] +[2023-10-08 13:33:42,005][102898] Updated weights for policy 1, policy_version 44840 (0.0008) +[2023-10-08 13:33:42,370][102898] Updated weights for policy 1, policy_version 44850 (0.0008) +[2023-10-08 13:33:42,748][102898] Updated weights for policy 1, policy_version 44860 (0.0010) +[2023-10-08 13:33:45,158][102897] Updated weights for policy 0, policy_version 44840 (0.0009) +[2023-10-08 13:33:45,530][102897] Updated weights for policy 0, policy_version 44850 (0.0009) +[2023-10-08 13:33:45,902][102897] Updated weights for policy 0, policy_version 44860 (0.0009) +[2023-10-08 13:33:46,319][102898] Updated weights for policy 1, policy_version 44870 (0.0008) +[2023-10-08 13:33:46,695][102898] Updated weights for policy 1, policy_version 44880 (0.0009) +[2023-10-08 13:33:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 91881472. Throughput: 0: 1788.2, 1: 1803.8. Samples: 22982620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:46,876][101941] Avg episode reward: [(0, '6.800'), (1, '8.400')] +[2023-10-08 13:33:47,060][102898] Updated weights for policy 1, policy_version 44890 (0.0009) +[2023-10-08 13:33:49,699][102897] Updated weights for policy 0, policy_version 44870 (0.0010) +[2023-10-08 13:33:50,073][102897] Updated weights for policy 0, policy_version 44880 (0.0009) +[2023-10-08 13:33:50,450][102897] Updated weights for policy 0, policy_version 44890 (0.0007) +[2023-10-08 13:33:50,812][102898] Updated weights for policy 1, policy_version 44900 (0.0009) +[2023-10-08 13:33:51,190][102898] Updated weights for policy 1, policy_version 44910 (0.0008) +[2023-10-08 13:33:51,553][102898] Updated weights for policy 1, policy_version 44920 (0.0008) +[2023-10-08 13:33:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 91979776. Throughput: 0: 1804.0, 1: 1786.4. Samples: 22994138. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:51,876][101941] Avg episode reward: [(0, '6.700'), (1, '8.010')] +[2023-10-08 13:33:54,237][102897] Updated weights for policy 0, policy_version 44900 (0.0008) +[2023-10-08 13:33:54,608][102897] Updated weights for policy 0, policy_version 44910 (0.0007) +[2023-10-08 13:33:54,984][102897] Updated weights for policy 0, policy_version 44920 (0.0008) +[2023-10-08 13:33:55,482][102898] Updated weights for policy 1, policy_version 44930 (0.0010) +[2023-10-08 13:33:55,846][102898] Updated weights for policy 1, policy_version 44940 (0.0007) +[2023-10-08 13:33:56,208][102898] Updated weights for policy 1, policy_version 44950 (0.0009) +[2023-10-08 13:33:56,577][102898] Updated weights for policy 1, policy_version 44960 (0.0010) +[2023-10-08 13:33:56,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 92045312. Throughput: 0: 1778.0, 1: 1808.5. Samples: 23014820. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:33:56,875][101941] Avg episode reward: [(0, '6.190'), (1, '8.100')] +[2023-10-08 13:33:58,787][102897] Updated weights for policy 0, policy_version 44930 (0.0010) +[2023-10-08 13:33:59,162][102897] Updated weights for policy 0, policy_version 44940 (0.0011) +[2023-10-08 13:33:59,542][102897] Updated weights for policy 0, policy_version 44950 (0.0010) +[2023-10-08 13:33:59,912][102897] Updated weights for policy 0, policy_version 44960 (0.0008) +[2023-10-08 13:34:00,382][102898] Updated weights for policy 1, policy_version 44970 (0.0008) +[2023-10-08 13:34:00,736][102898] Updated weights for policy 1, policy_version 44980 (0.0008) +[2023-10-08 13:34:01,103][102898] Updated weights for policy 1, policy_version 44990 (0.0009) +[2023-10-08 13:34:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 92110848. Throughput: 0: 1781.6, 1: 1785.7. Samples: 23035604. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:01,876][101941] Avg episode reward: [(0, '6.870'), (1, '8.370')] +[2023-10-08 13:34:03,719][102897] Updated weights for policy 0, policy_version 44970 (0.0009) +[2023-10-08 13:34:04,086][102897] Updated weights for policy 0, policy_version 44980 (0.0009) +[2023-10-08 13:34:04,451][102897] Updated weights for policy 0, policy_version 44990 (0.0009) +[2023-10-08 13:34:04,928][102898] Updated weights for policy 1, policy_version 45000 (0.0007) +[2023-10-08 13:34:05,293][102898] Updated weights for policy 1, policy_version 45010 (0.0008) +[2023-10-08 13:34:05,655][102898] Updated weights for policy 1, policy_version 45020 (0.0007) +[2023-10-08 13:34:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 92176384. Throughput: 0: 1785.9, 1: 1806.2. Samples: 23046962. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:06,876][101941] Avg episode reward: [(0, '7.800'), (1, '8.580')] +[2023-10-08 13:34:08,145][102897] Updated weights for policy 0, policy_version 45000 (0.0007) +[2023-10-08 13:34:08,515][102897] Updated weights for policy 0, policy_version 45010 (0.0008) +[2023-10-08 13:34:08,885][102897] Updated weights for policy 0, policy_version 45020 (0.0007) +[2023-10-08 13:34:09,268][102898] Updated weights for policy 1, policy_version 45030 (0.0007) +[2023-10-08 13:34:09,623][102898] Updated weights for policy 1, policy_version 45040 (0.0008) +[2023-10-08 13:34:09,991][102898] Updated weights for policy 1, policy_version 45050 (0.0007) +[2023-10-08 13:34:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 92241920. Throughput: 0: 1780.1, 1: 1792.2. Samples: 23068018. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:11,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.790')] +[2023-10-08 13:34:12,617][102897] Updated weights for policy 0, policy_version 45030 (0.0008) +[2023-10-08 13:34:12,983][102897] Updated weights for policy 0, policy_version 45040 (0.0010) +[2023-10-08 13:34:13,350][102897] Updated weights for policy 0, policy_version 45050 (0.0008) +[2023-10-08 13:34:13,776][102898] Updated weights for policy 1, policy_version 45060 (0.0009) +[2023-10-08 13:34:14,139][102898] Updated weights for policy 1, policy_version 45070 (0.0007) +[2023-10-08 13:34:14,504][102898] Updated weights for policy 1, policy_version 45080 (0.0008) +[2023-10-08 13:34:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 92307456. Throughput: 0: 1788.9, 1: 1788.2. Samples: 23090360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:16,876][101941] Avg episode reward: [(0, '6.890'), (1, '7.390')] +[2023-10-08 13:34:16,888][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000045088_46170112.pth... +[2023-10-08 13:34:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000045056_46137344.pth... +[2023-10-08 13:34:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000043424_44466176.pth +[2023-10-08 13:34:16,928][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000043392_44433408.pth +[2023-10-08 13:34:17,167][102897] Updated weights for policy 0, policy_version 45060 (0.0007) +[2023-10-08 13:34:17,537][102897] Updated weights for policy 0, policy_version 45070 (0.0007) +[2023-10-08 13:34:17,905][102897] Updated weights for policy 0, policy_version 45080 (0.0007) +[2023-10-08 13:34:18,330][102898] Updated weights for policy 1, policy_version 45090 (0.0008) +[2023-10-08 13:34:18,691][102898] Updated weights for policy 1, policy_version 45100 (0.0007) +[2023-10-08 13:34:19,057][102898] Updated weights for policy 1, policy_version 45110 (0.0009) +[2023-10-08 13:34:19,421][102898] Updated weights for policy 1, policy_version 45120 (0.0008) +[2023-10-08 13:34:21,668][102897] Updated weights for policy 0, policy_version 45090 (0.0008) +[2023-10-08 13:34:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 92372992. Throughput: 0: 1777.5, 1: 1789.2. Samples: 23100124. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:21,876][101941] Avg episode reward: [(0, '7.450'), (1, '8.800')] +[2023-10-08 13:34:22,045][102897] Updated weights for policy 0, policy_version 45100 (0.0010) +[2023-10-08 13:34:22,419][102897] Updated weights for policy 0, policy_version 45110 (0.0008) +[2023-10-08 13:34:22,791][102897] Updated weights for policy 0, policy_version 45120 (0.0008) +[2023-10-08 13:34:23,184][102898] Updated weights for policy 1, policy_version 45130 (0.0009) +[2023-10-08 13:34:23,556][102898] Updated weights for policy 1, policy_version 45140 (0.0009) +[2023-10-08 13:34:23,929][102898] Updated weights for policy 1, policy_version 45150 (0.0010) +[2023-10-08 13:34:26,380][102897] Updated weights for policy 0, policy_version 45130 (0.0010) +[2023-10-08 13:34:26,752][102897] Updated weights for policy 0, policy_version 45140 (0.0008) +[2023-10-08 13:34:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 92438528. Throughput: 0: 1782.7, 1: 1787.3. Samples: 23122356. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:26,876][101941] Avg episode reward: [(0, '7.340'), (1, '9.000')] +[2023-10-08 13:34:26,876][102760] Saving new best policy, reward=9.000! +[2023-10-08 13:34:27,119][102897] Updated weights for policy 0, policy_version 45150 (0.0007) +[2023-10-08 13:34:27,810][102898] Updated weights for policy 1, policy_version 45160 (0.0010) +[2023-10-08 13:34:28,189][102898] Updated weights for policy 1, policy_version 45170 (0.0010) +[2023-10-08 13:34:28,550][102898] Updated weights for policy 1, policy_version 45180 (0.0008) +[2023-10-08 13:34:30,924][102897] Updated weights for policy 0, policy_version 45160 (0.0007) +[2023-10-08 13:34:31,309][102897] Updated weights for policy 0, policy_version 45170 (0.0008) +[2023-10-08 13:34:31,681][102897] Updated weights for policy 0, policy_version 45180 (0.0010) +[2023-10-08 13:34:31,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 92536832. Throughput: 0: 1787.6, 1: 1793.1. Samples: 23143750. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:31,876][101941] Avg episode reward: [(0, '7.590'), (1, '8.610')] +[2023-10-08 13:34:32,352][102898] Updated weights for policy 1, policy_version 45190 (0.0009) +[2023-10-08 13:34:32,727][102898] Updated weights for policy 1, policy_version 45200 (0.0010) +[2023-10-08 13:34:33,092][102898] Updated weights for policy 1, policy_version 45210 (0.0009) +[2023-10-08 13:34:35,590][102897] Updated weights for policy 0, policy_version 45190 (0.0008) +[2023-10-08 13:34:35,957][102897] Updated weights for policy 0, policy_version 45200 (0.0009) +[2023-10-08 13:34:36,324][102897] Updated weights for policy 0, policy_version 45210 (0.0010) +[2023-10-08 13:34:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 92602368. Throughput: 0: 1774.0, 1: 1782.4. Samples: 23154176. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:36,876][101941] Avg episode reward: [(0, '6.380'), (1, '8.660')] +[2023-10-08 13:34:36,907][102898] Updated weights for policy 1, policy_version 45220 (0.0009) +[2023-10-08 13:34:37,270][102898] Updated weights for policy 1, policy_version 45230 (0.0008) +[2023-10-08 13:34:37,635][102898] Updated weights for policy 1, policy_version 45240 (0.0008) +[2023-10-08 13:34:40,032][102897] Updated weights for policy 0, policy_version 45220 (0.0011) +[2023-10-08 13:34:40,393][102897] Updated weights for policy 0, policy_version 45230 (0.0008) +[2023-10-08 13:34:40,771][102897] Updated weights for policy 0, policy_version 45240 (0.0009) +[2023-10-08 13:34:41,390][102898] Updated weights for policy 1, policy_version 45250 (0.0009) +[2023-10-08 13:34:41,746][102898] Updated weights for policy 1, policy_version 45260 (0.0008) +[2023-10-08 13:34:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 92667904. Throughput: 0: 1798.5, 1: 1778.3. Samples: 23175776. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:41,876][101941] Avg episode reward: [(0, '6.580'), (1, '8.260')] +[2023-10-08 13:34:42,108][102898] Updated weights for policy 1, policy_version 45270 (0.0008) +[2023-10-08 13:34:42,473][102898] Updated weights for policy 1, policy_version 45280 (0.0009) +[2023-10-08 13:34:44,466][102897] Updated weights for policy 0, policy_version 45250 (0.0008) +[2023-10-08 13:34:44,837][102897] Updated weights for policy 0, policy_version 45260 (0.0008) +[2023-10-08 13:34:45,222][102897] Updated weights for policy 0, policy_version 45270 (0.0010) +[2023-10-08 13:34:45,581][102897] Updated weights for policy 0, policy_version 45280 (0.0010) +[2023-10-08 13:34:46,119][102898] Updated weights for policy 1, policy_version 45290 (0.0008) +[2023-10-08 13:34:46,495][102898] Updated weights for policy 1, policy_version 45300 (0.0009) +[2023-10-08 13:34:46,856][102898] Updated weights for policy 1, policy_version 45310 (0.0009) +[2023-10-08 13:34:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 92733440. Throughput: 0: 1782.4, 1: 1793.5. Samples: 23196522. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:46,876][101941] Avg episode reward: [(0, '7.050'), (1, '8.820')] +[2023-10-08 13:34:49,371][102897] Updated weights for policy 0, policy_version 45290 (0.0007) +[2023-10-08 13:34:49,739][102897] Updated weights for policy 0, policy_version 45300 (0.0009) +[2023-10-08 13:34:50,107][102897] Updated weights for policy 0, policy_version 45310 (0.0007) +[2023-10-08 13:34:50,625][102898] Updated weights for policy 1, policy_version 45320 (0.0009) +[2023-10-08 13:34:50,990][102898] Updated weights for policy 1, policy_version 45330 (0.0008) +[2023-10-08 13:34:51,363][102898] Updated weights for policy 1, policy_version 45340 (0.0008) +[2023-10-08 13:34:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 92831744. Throughput: 0: 1799.6, 1: 1778.8. Samples: 23207988. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:51,876][101941] Avg episode reward: [(0, '6.650'), (1, '8.210')] +[2023-10-08 13:34:53,949][102897] Updated weights for policy 0, policy_version 45320 (0.0008) +[2023-10-08 13:34:54,318][102897] Updated weights for policy 0, policy_version 45330 (0.0009) +[2023-10-08 13:34:54,702][102897] Updated weights for policy 0, policy_version 45340 (0.0010) +[2023-10-08 13:34:55,174][102898] Updated weights for policy 1, policy_version 45350 (0.0008) +[2023-10-08 13:34:55,542][102898] Updated weights for policy 1, policy_version 45360 (0.0007) +[2023-10-08 13:34:55,910][102898] Updated weights for policy 1, policy_version 45370 (0.0007) +[2023-10-08 13:34:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 92897280. Throughput: 0: 1779.9, 1: 1794.0. Samples: 23228846. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:34:56,876][101941] Avg episode reward: [(0, '6.750'), (1, '7.520')] +[2023-10-08 13:34:58,503][102897] Updated weights for policy 0, policy_version 45350 (0.0008) +[2023-10-08 13:34:58,883][102897] Updated weights for policy 0, policy_version 45360 (0.0008) +[2023-10-08 13:34:59,265][102897] Updated weights for policy 0, policy_version 45370 (0.0010) +[2023-10-08 13:34:59,706][102898] Updated weights for policy 1, policy_version 45380 (0.0009) +[2023-10-08 13:35:00,081][102898] Updated weights for policy 1, policy_version 45390 (0.0008) +[2023-10-08 13:35:00,439][102898] Updated weights for policy 1, policy_version 45400 (0.0008) +[2023-10-08 13:35:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 92962816. Throughput: 0: 1780.1, 1: 1777.5. Samples: 23250448. Policy #0 lag: (min: 16.0, avg: 35.0, max: 48.0) +[2023-10-08 13:35:01,875][101941] Avg episode reward: [(0, '7.230'), (1, '7.970')] +[2023-10-08 13:35:03,146][102897] Updated weights for policy 0, policy_version 45380 (0.0008) +[2023-10-08 13:35:03,516][102897] Updated weights for policy 0, policy_version 45390 (0.0008) +[2023-10-08 13:35:03,893][102897] Updated weights for policy 0, policy_version 45400 (0.0007) +[2023-10-08 13:35:04,216][102898] Updated weights for policy 1, policy_version 45410 (0.0007) +[2023-10-08 13:35:04,586][102898] Updated weights for policy 1, policy_version 45420 (0.0007) +[2023-10-08 13:35:04,952][102898] Updated weights for policy 1, policy_version 45430 (0.0008) +[2023-10-08 13:35:05,320][102898] Updated weights for policy 1, policy_version 45440 (0.0008) +[2023-10-08 13:35:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93028352. Throughput: 0: 1778.8, 1: 1802.2. Samples: 23261270. Policy #0 lag: (min: 16.0, avg: 35.0, max: 48.0) +[2023-10-08 13:35:06,875][101941] Avg episode reward: [(0, '7.450'), (1, '7.710')] +[2023-10-08 13:35:07,585][102897] Updated weights for policy 0, policy_version 45410 (0.0007) +[2023-10-08 13:35:07,965][102897] Updated weights for policy 0, policy_version 45420 (0.0007) +[2023-10-08 13:35:08,336][102897] Updated weights for policy 0, policy_version 45430 (0.0007) +[2023-10-08 13:35:08,705][102897] Updated weights for policy 0, policy_version 45440 (0.0008) +[2023-10-08 13:35:09,001][102898] Updated weights for policy 1, policy_version 45450 (0.0008) +[2023-10-08 13:35:09,363][102898] Updated weights for policy 1, policy_version 45460 (0.0009) +[2023-10-08 13:35:09,740][102898] Updated weights for policy 1, policy_version 45470 (0.0009) +[2023-10-08 13:35:11,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 93093888. Throughput: 0: 1784.1, 1: 1779.3. Samples: 23282708. Policy #0 lag: (min: 16.0, avg: 35.0, max: 48.0) +[2023-10-08 13:35:11,877][101941] Avg episode reward: [(0, '7.650'), (1, '8.090')] +[2023-10-08 13:35:12,433][102897] Updated weights for policy 0, policy_version 45450 (0.0007) +[2023-10-08 13:35:12,796][102897] Updated weights for policy 0, policy_version 45460 (0.0008) +[2023-10-08 13:35:13,169][102897] Updated weights for policy 0, policy_version 45470 (0.0007) +[2023-10-08 13:35:13,727][102898] Updated weights for policy 1, policy_version 45480 (0.0008) +[2023-10-08 13:35:14,095][102898] Updated weights for policy 1, policy_version 45490 (0.0010) +[2023-10-08 13:35:14,460][102898] Updated weights for policy 1, policy_version 45500 (0.0010) +[2023-10-08 13:35:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 93159424. Throughput: 0: 1801.3, 1: 1773.8. Samples: 23304632. Policy #0 lag: (min: 16.0, avg: 35.0, max: 48.0) +[2023-10-08 13:35:16,876][101941] Avg episode reward: [(0, '8.110'), (1, '8.550')] +[2023-10-08 13:35:16,944][102897] Updated weights for policy 0, policy_version 45480 (0.0008) +[2023-10-08 13:35:17,312][102897] Updated weights for policy 0, policy_version 45490 (0.0007) +[2023-10-08 13:35:17,691][102897] Updated weights for policy 0, policy_version 45500 (0.0009) +[2023-10-08 13:35:18,144][102898] Updated weights for policy 1, policy_version 45510 (0.0008) +[2023-10-08 13:35:18,504][102898] Updated weights for policy 1, policy_version 45520 (0.0009) +[2023-10-08 13:35:18,872][102898] Updated weights for policy 1, policy_version 45530 (0.0008) +[2023-10-08 13:35:21,454][102897] Updated weights for policy 0, policy_version 45510 (0.0008) +[2023-10-08 13:35:21,827][102897] Updated weights for policy 0, policy_version 45520 (0.0008) +[2023-10-08 13:35:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 93224960. Throughput: 0: 1784.5, 1: 1778.9. Samples: 23314530. Policy #0 lag: (min: 16.0, avg: 35.0, max: 48.0) +[2023-10-08 13:35:21,876][101941] Avg episode reward: [(0, '8.080'), (1, '8.780')] +[2023-10-08 13:35:22,201][102897] Updated weights for policy 0, policy_version 45530 (0.0009) +[2023-10-08 13:35:22,615][102898] Updated weights for policy 1, policy_version 45540 (0.0007) +[2023-10-08 13:35:22,985][102898] Updated weights for policy 1, policy_version 45550 (0.0007) +[2023-10-08 13:35:23,357][102898] Updated weights for policy 1, policy_version 45560 (0.0010) +[2023-10-08 13:35:25,924][102897] Updated weights for policy 0, policy_version 45540 (0.0009) +[2023-10-08 13:35:26,282][102897] Updated weights for policy 0, policy_version 45550 (0.0009) +[2023-10-08 13:35:26,651][102897] Updated weights for policy 0, policy_version 45560 (0.0007) +[2023-10-08 13:35:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 93290496. Throughput: 0: 1798.4, 1: 1778.7. Samples: 23336750. Policy #0 lag: (min: 16.0, avg: 35.0, max: 48.0) +[2023-10-08 13:35:26,876][101941] Avg episode reward: [(0, '7.830'), (1, '8.170')] +[2023-10-08 13:35:27,200][102898] Updated weights for policy 1, policy_version 45570 (0.0011) +[2023-10-08 13:35:27,576][102898] Updated weights for policy 1, policy_version 45580 (0.0009) +[2023-10-08 13:35:27,946][102898] Updated weights for policy 1, policy_version 45590 (0.0008) +[2023-10-08 13:35:28,304][102898] Updated weights for policy 1, policy_version 45600 (0.0008) +[2023-10-08 13:35:30,254][102897] Updated weights for policy 0, policy_version 45570 (0.0007) +[2023-10-08 13:35:30,636][102897] Updated weights for policy 0, policy_version 45580 (0.0008) +[2023-10-08 13:35:30,995][102897] Updated weights for policy 0, policy_version 45590 (0.0011) +[2023-10-08 13:35:31,365][102897] Updated weights for policy 0, policy_version 45600 (0.0009) +[2023-10-08 13:35:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93388800. Throughput: 0: 1787.5, 1: 1795.5. Samples: 23357754. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:35:31,876][101941] Avg episode reward: [(0, '7.870'), (1, '8.800')] +[2023-10-08 13:35:32,177][102898] Updated weights for policy 1, policy_version 45610 (0.0008) +[2023-10-08 13:35:32,547][102898] Updated weights for policy 1, policy_version 45620 (0.0008) +[2023-10-08 13:35:32,915][102898] Updated weights for policy 1, policy_version 45630 (0.0007) +[2023-10-08 13:35:35,243][102897] Updated weights for policy 0, policy_version 45610 (0.0007) +[2023-10-08 13:35:35,614][102897] Updated weights for policy 0, policy_version 45620 (0.0009) +[2023-10-08 13:35:35,991][102897] Updated weights for policy 0, policy_version 45630 (0.0007) +[2023-10-08 13:35:36,592][102898] Updated weights for policy 1, policy_version 45640 (0.0007) +[2023-10-08 13:35:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93454336. Throughput: 0: 1797.2, 1: 1777.4. Samples: 23368842. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:35:36,876][101941] Avg episode reward: [(0, '7.380'), (1, '7.700')] +[2023-10-08 13:35:36,956][102898] Updated weights for policy 1, policy_version 45650 (0.0008) +[2023-10-08 13:35:37,335][102898] Updated weights for policy 1, policy_version 45660 (0.0008) +[2023-10-08 13:35:39,665][102897] Updated weights for policy 0, policy_version 45640 (0.0009) +[2023-10-08 13:35:40,039][102897] Updated weights for policy 0, policy_version 45650 (0.0008) +[2023-10-08 13:35:40,413][102897] Updated weights for policy 0, policy_version 45660 (0.0007) +[2023-10-08 13:35:41,011][102898] Updated weights for policy 1, policy_version 45670 (0.0010) +[2023-10-08 13:35:41,384][102898] Updated weights for policy 1, policy_version 45680 (0.0009) +[2023-10-08 13:35:41,742][102898] Updated weights for policy 1, policy_version 45690 (0.0008) +[2023-10-08 13:35:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93519872. Throughput: 0: 1790.8, 1: 1795.1. Samples: 23390210. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:35:41,876][101941] Avg episode reward: [(0, '7.730'), (1, '7.400')] +[2023-10-08 13:35:44,124][102897] Updated weights for policy 0, policy_version 45670 (0.0008) +[2023-10-08 13:35:44,489][102897] Updated weights for policy 0, policy_version 45680 (0.0007) +[2023-10-08 13:35:44,870][102897] Updated weights for policy 0, policy_version 45690 (0.0007) +[2023-10-08 13:35:45,572][102898] Updated weights for policy 1, policy_version 45700 (0.0008) +[2023-10-08 13:35:45,947][102898] Updated weights for policy 1, policy_version 45710 (0.0008) +[2023-10-08 13:35:46,307][102898] Updated weights for policy 1, policy_version 45720 (0.0011) +[2023-10-08 13:35:46,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 93618176. Throughput: 0: 1787.3, 1: 1781.8. Samples: 23411056. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:35:46,875][101941] Avg episode reward: [(0, '7.400'), (1, '7.940')] +[2023-10-08 13:35:48,694][102897] Updated weights for policy 0, policy_version 45700 (0.0007) +[2023-10-08 13:35:49,063][102897] Updated weights for policy 0, policy_version 45710 (0.0007) +[2023-10-08 13:35:49,439][102897] Updated weights for policy 0, policy_version 45720 (0.0008) +[2023-10-08 13:35:50,066][102898] Updated weights for policy 1, policy_version 45730 (0.0009) +[2023-10-08 13:35:50,425][102898] Updated weights for policy 1, policy_version 45740 (0.0009) +[2023-10-08 13:35:50,785][102898] Updated weights for policy 1, policy_version 45750 (0.0011) +[2023-10-08 13:35:51,146][102898] Updated weights for policy 1, policy_version 45760 (0.0008) +[2023-10-08 13:35:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93683712. Throughput: 0: 1801.9, 1: 1783.9. Samples: 23422630. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:35:51,876][101941] Avg episode reward: [(0, '7.280'), (1, '7.860')] +[2023-10-08 13:35:53,192][102897] Updated weights for policy 0, policy_version 45730 (0.0007) +[2023-10-08 13:35:53,561][102897] Updated weights for policy 0, policy_version 45740 (0.0009) +[2023-10-08 13:35:53,924][102897] Updated weights for policy 0, policy_version 45750 (0.0008) +[2023-10-08 13:35:54,300][102897] Updated weights for policy 0, policy_version 45760 (0.0009) +[2023-10-08 13:35:54,772][102898] Updated weights for policy 1, policy_version 45770 (0.0009) +[2023-10-08 13:35:55,142][102898] Updated weights for policy 1, policy_version 45780 (0.0009) +[2023-10-08 13:35:55,505][102898] Updated weights for policy 1, policy_version 45790 (0.0009) +[2023-10-08 13:35:56,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93749248. Throughput: 0: 1787.4, 1: 1789.1. Samples: 23443652. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:35:56,876][101941] Avg episode reward: [(0, '7.230'), (1, '8.120')] +[2023-10-08 13:35:58,134][102897] Updated weights for policy 0, policy_version 45770 (0.0008) +[2023-10-08 13:35:58,509][102897] Updated weights for policy 0, policy_version 45780 (0.0009) +[2023-10-08 13:35:58,887][102897] Updated weights for policy 0, policy_version 45790 (0.0010) +[2023-10-08 13:35:59,245][102898] Updated weights for policy 1, policy_version 45800 (0.0009) +[2023-10-08 13:35:59,615][102898] Updated weights for policy 1, policy_version 45810 (0.0009) +[2023-10-08 13:35:59,993][102898] Updated weights for policy 1, policy_version 45820 (0.0008) +[2023-10-08 13:36:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 93814784. Throughput: 0: 1790.6, 1: 1791.1. Samples: 23465806. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:36:01,876][101941] Avg episode reward: [(0, '6.680'), (1, '8.410')] +[2023-10-08 13:36:02,429][102897] Updated weights for policy 0, policy_version 45800 (0.0008) +[2023-10-08 13:36:02,803][102897] Updated weights for policy 0, policy_version 45810 (0.0007) +[2023-10-08 13:36:03,175][102897] Updated weights for policy 0, policy_version 45820 (0.0008) +[2023-10-08 13:36:03,730][102898] Updated weights for policy 1, policy_version 45830 (0.0007) +[2023-10-08 13:36:04,097][102898] Updated weights for policy 1, policy_version 45840 (0.0009) +[2023-10-08 13:36:04,460][102898] Updated weights for policy 1, policy_version 45850 (0.0007) +[2023-10-08 13:36:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 93880320. Throughput: 0: 1790.0, 1: 1796.8. Samples: 23475936. Policy #0 lag: (min: 23.0, avg: 24.7, max: 52.0) +[2023-10-08 13:36:06,876][101941] Avg episode reward: [(0, '6.310'), (1, '8.430')] +[2023-10-08 13:36:07,045][102897] Updated weights for policy 0, policy_version 45830 (0.0011) +[2023-10-08 13:36:07,414][102897] Updated weights for policy 0, policy_version 45840 (0.0009) +[2023-10-08 13:36:07,794][102897] Updated weights for policy 0, policy_version 45850 (0.0009) +[2023-10-08 13:36:08,043][102898] Updated weights for policy 1, policy_version 45860 (0.0007) +[2023-10-08 13:36:08,414][102898] Updated weights for policy 1, policy_version 45870 (0.0008) +[2023-10-08 13:36:08,786][102898] Updated weights for policy 1, policy_version 45880 (0.0008) +[2023-10-08 13:36:11,568][102897] Updated weights for policy 0, policy_version 45860 (0.0009) +[2023-10-08 13:36:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 93945856. Throughput: 0: 1788.9, 1: 1800.9. Samples: 23498290. Policy #0 lag: (min: 23.0, avg: 24.7, max: 52.0) +[2023-10-08 13:36:11,876][101941] Avg episode reward: [(0, '6.960'), (1, '8.100')] +[2023-10-08 13:36:11,934][102897] Updated weights for policy 0, policy_version 45870 (0.0010) +[2023-10-08 13:36:12,302][102897] Updated weights for policy 0, policy_version 45880 (0.0007) +[2023-10-08 13:36:12,525][102898] Updated weights for policy 1, policy_version 45890 (0.0008) +[2023-10-08 13:36:12,896][102898] Updated weights for policy 1, policy_version 45900 (0.0009) +[2023-10-08 13:36:13,265][102898] Updated weights for policy 1, policy_version 45910 (0.0009) +[2023-10-08 13:36:13,635][102898] Updated weights for policy 1, policy_version 45920 (0.0010) +[2023-10-08 13:36:15,949][102897] Updated weights for policy 0, policy_version 45890 (0.0008) +[2023-10-08 13:36:16,326][102897] Updated weights for policy 0, policy_version 45900 (0.0008) +[2023-10-08 13:36:16,690][102897] Updated weights for policy 0, policy_version 45910 (0.0008) +[2023-10-08 13:36:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 94011392. Throughput: 0: 1803.9, 1: 1806.0. Samples: 23520202. Policy #0 lag: (min: 23.0, avg: 24.7, max: 52.0) +[2023-10-08 13:36:16,875][101941] Avg episode reward: [(0, '7.640'), (1, '8.140')] +[2023-10-08 13:36:17,055][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000045920_47022080.pth... +[2023-10-08 13:36:17,059][102897] Updated weights for policy 0, policy_version 45920 (0.0008) +[2023-10-08 13:36:17,089][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000044224_45285376.pth +[2023-10-08 13:36:17,324][102898] Updated weights for policy 1, policy_version 45930 (0.0007) +[2023-10-08 13:36:17,696][102898] Updated weights for policy 1, policy_version 45940 (0.0008) +[2023-10-08 13:36:18,067][102898] Updated weights for policy 1, policy_version 45950 (0.0008) +[2023-10-08 13:36:18,139][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000045952_47054848.pth... +[2023-10-08 13:36:18,178][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000044256_45318144.pth +[2023-10-08 13:36:20,982][102897] Updated weights for policy 0, policy_version 45930 (0.0008) +[2023-10-08 13:36:21,350][102897] Updated weights for policy 0, policy_version 45940 (0.0009) +[2023-10-08 13:36:21,726][102897] Updated weights for policy 0, policy_version 45950 (0.0008) +[2023-10-08 13:36:21,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 94109696. Throughput: 0: 1784.9, 1: 1805.0. Samples: 23530388. Policy #0 lag: (min: 23.0, avg: 24.7, max: 52.0) +[2023-10-08 13:36:21,875][101941] Avg episode reward: [(0, '7.520'), (1, '8.440')] +[2023-10-08 13:36:22,000][102898] Updated weights for policy 1, policy_version 45960 (0.0009) +[2023-10-08 13:36:22,363][102898] Updated weights for policy 1, policy_version 45970 (0.0009) +[2023-10-08 13:36:22,736][102898] Updated weights for policy 1, policy_version 45980 (0.0008) +[2023-10-08 13:36:25,524][102897] Updated weights for policy 0, policy_version 45960 (0.0008) +[2023-10-08 13:36:25,896][102897] Updated weights for policy 0, policy_version 45970 (0.0009) +[2023-10-08 13:36:26,266][102897] Updated weights for policy 0, policy_version 45980 (0.0007) +[2023-10-08 13:36:26,418][102898] Updated weights for policy 1, policy_version 45990 (0.0007) +[2023-10-08 13:36:26,786][102898] Updated weights for policy 1, policy_version 46000 (0.0007) +[2023-10-08 13:36:26,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 94175232. Throughput: 0: 1807.7, 1: 1793.9. Samples: 23552282. Policy #0 lag: (min: 23.0, avg: 24.7, max: 52.0) +[2023-10-08 13:36:26,876][101941] Avg episode reward: [(0, '7.250'), (1, '8.590')] +[2023-10-08 13:36:27,152][102898] Updated weights for policy 1, policy_version 46010 (0.0010) +[2023-10-08 13:36:30,152][102897] Updated weights for policy 0, policy_version 45990 (0.0007) +[2023-10-08 13:36:30,528][102897] Updated weights for policy 0, policy_version 46000 (0.0009) +[2023-10-08 13:36:30,898][102897] Updated weights for policy 0, policy_version 46010 (0.0008) +[2023-10-08 13:36:30,922][102898] Updated weights for policy 1, policy_version 46020 (0.0009) +[2023-10-08 13:36:31,286][102898] Updated weights for policy 1, policy_version 46030 (0.0008) +[2023-10-08 13:36:31,660][102898] Updated weights for policy 1, policy_version 46040 (0.0008) +[2023-10-08 13:36:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 94240768. Throughput: 0: 1778.0, 1: 1809.6. Samples: 23572502. Policy #0 lag: (min: 23.0, avg: 24.7, max: 52.0) +[2023-10-08 13:36:31,875][101941] Avg episode reward: [(0, '6.290'), (1, '9.080')] +[2023-10-08 13:36:31,943][102760] Saving new best policy, reward=9.080! +[2023-10-08 13:36:34,770][102897] Updated weights for policy 0, policy_version 46020 (0.0008) +[2023-10-08 13:36:35,148][102897] Updated weights for policy 0, policy_version 46030 (0.0007) +[2023-10-08 13:36:35,511][102897] Updated weights for policy 0, policy_version 46040 (0.0008) +[2023-10-08 13:36:35,556][102898] Updated weights for policy 1, policy_version 46050 (0.0008) +[2023-10-08 13:36:35,911][102898] Updated weights for policy 1, policy_version 46060 (0.0007) +[2023-10-08 13:36:36,281][102898] Updated weights for policy 1, policy_version 46070 (0.0008) +[2023-10-08 13:36:36,650][102898] Updated weights for policy 1, policy_version 46080 (0.0009) +[2023-10-08 13:36:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 94339072. Throughput: 0: 1794.8, 1: 1795.8. Samples: 23584204. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:36:36,876][101941] Avg episode reward: [(0, '5.950'), (1, '7.990')] +[2023-10-08 13:36:39,485][102897] Updated weights for policy 0, policy_version 46050 (0.0007) +[2023-10-08 13:36:39,850][102897] Updated weights for policy 0, policy_version 46060 (0.0009) +[2023-10-08 13:36:40,221][102897] Updated weights for policy 0, policy_version 46070 (0.0009) +[2023-10-08 13:36:40,506][102898] Updated weights for policy 1, policy_version 46090 (0.0008) +[2023-10-08 13:36:40,583][102897] Updated weights for policy 0, policy_version 46080 (0.0007) +[2023-10-08 13:36:40,872][102898] Updated weights for policy 1, policy_version 46100 (0.0008) +[2023-10-08 13:36:41,244][102898] Updated weights for policy 1, policy_version 46110 (0.0009) +[2023-10-08 13:36:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 94404608. Throughput: 0: 1773.3, 1: 1804.3. Samples: 23604640. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:36:41,875][101941] Avg episode reward: [(0, '6.310'), (1, '7.550')] +[2023-10-08 13:36:44,457][102897] Updated weights for policy 0, policy_version 46090 (0.0010) +[2023-10-08 13:36:44,834][102897] Updated weights for policy 0, policy_version 46100 (0.0009) +[2023-10-08 13:36:45,099][102898] Updated weights for policy 1, policy_version 46120 (0.0007) +[2023-10-08 13:36:45,211][102897] Updated weights for policy 0, policy_version 46110 (0.0007) +[2023-10-08 13:36:45,473][102898] Updated weights for policy 1, policy_version 46130 (0.0008) +[2023-10-08 13:36:45,837][102898] Updated weights for policy 1, policy_version 46140 (0.0010) +[2023-10-08 13:36:46,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 94470144. Throughput: 0: 1759.8, 1: 1779.8. Samples: 23625088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:36:46,875][101941] Avg episode reward: [(0, '6.720'), (1, '8.470')] +[2023-10-08 13:36:49,090][102897] Updated weights for policy 0, policy_version 46120 (0.0009) +[2023-10-08 13:36:49,464][102897] Updated weights for policy 0, policy_version 46130 (0.0007) +[2023-10-08 13:36:49,666][102898] Updated weights for policy 1, policy_version 46150 (0.0009) +[2023-10-08 13:36:49,830][102897] Updated weights for policy 0, policy_version 46140 (0.0007) +[2023-10-08 13:36:50,036][102898] Updated weights for policy 1, policy_version 46160 (0.0007) +[2023-10-08 13:36:50,398][102898] Updated weights for policy 1, policy_version 46170 (0.0008) +[2023-10-08 13:36:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 94535680. Throughput: 0: 1773.1, 1: 1804.0. Samples: 23636904. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:36:51,876][101941] Avg episode reward: [(0, '6.560'), (1, '8.510')] +[2023-10-08 13:36:53,546][102897] Updated weights for policy 0, policy_version 46150 (0.0008) +[2023-10-08 13:36:53,910][102897] Updated weights for policy 0, policy_version 46160 (0.0010) +[2023-10-08 13:36:54,147][102898] Updated weights for policy 1, policy_version 46180 (0.0008) +[2023-10-08 13:36:54,289][102897] Updated weights for policy 0, policy_version 46170 (0.0010) +[2023-10-08 13:36:54,506][102898] Updated weights for policy 1, policy_version 46190 (0.0008) +[2023-10-08 13:36:54,883][102898] Updated weights for policy 1, policy_version 46200 (0.0010) +[2023-10-08 13:36:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 94601216. Throughput: 0: 1752.3, 1: 1772.6. Samples: 23656910. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:36:56,876][101941] Avg episode reward: [(0, '7.000'), (1, '8.620')] +[2023-10-08 13:36:58,184][102897] Updated weights for policy 0, policy_version 46180 (0.0009) +[2023-10-08 13:36:58,558][102897] Updated weights for policy 0, policy_version 46190 (0.0010) +[2023-10-08 13:36:58,641][102898] Updated weights for policy 1, policy_version 46210 (0.0009) +[2023-10-08 13:36:58,933][102897] Updated weights for policy 0, policy_version 46200 (0.0008) +[2023-10-08 13:36:59,005][102898] Updated weights for policy 1, policy_version 46220 (0.0008) +[2023-10-08 13:36:59,368][102898] Updated weights for policy 1, policy_version 46230 (0.0009) +[2023-10-08 13:36:59,739][102898] Updated weights for policy 1, policy_version 46240 (0.0010) +[2023-10-08 13:37:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 94666752. Throughput: 0: 1763.7, 1: 1765.9. Samples: 23679036. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:37:01,876][101941] Avg episode reward: [(0, '7.060'), (1, '8.670')] +[2023-10-08 13:37:02,616][102897] Updated weights for policy 0, policy_version 46210 (0.0008) +[2023-10-08 13:37:02,993][102897] Updated weights for policy 0, policy_version 46220 (0.0008) +[2023-10-08 13:37:03,371][102897] Updated weights for policy 0, policy_version 46230 (0.0009) +[2023-10-08 13:37:03,656][102898] Updated weights for policy 1, policy_version 46250 (0.0007) +[2023-10-08 13:37:03,734][102897] Updated weights for policy 0, policy_version 46240 (0.0008) +[2023-10-08 13:37:04,018][102898] Updated weights for policy 1, policy_version 46260 (0.0008) +[2023-10-08 13:37:04,386][102898] Updated weights for policy 1, policy_version 46270 (0.0010) +[2023-10-08 13:37:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 94732288. Throughput: 0: 1748.8, 1: 1766.0. Samples: 23688552. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:37:06,876][101941] Avg episode reward: [(0, '6.800'), (1, '8.200')] +[2023-10-08 13:37:07,422][102897] Updated weights for policy 0, policy_version 46250 (0.0009) +[2023-10-08 13:37:07,798][102897] Updated weights for policy 0, policy_version 46260 (0.0009) +[2023-10-08 13:37:08,166][102897] Updated weights for policy 0, policy_version 46270 (0.0008) +[2023-10-08 13:37:08,230][102898] Updated weights for policy 1, policy_version 46280 (0.0007) +[2023-10-08 13:37:08,600][102898] Updated weights for policy 1, policy_version 46290 (0.0008) +[2023-10-08 13:37:08,958][102898] Updated weights for policy 1, policy_version 46300 (0.0008) +[2023-10-08 13:37:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 94797824. Throughput: 0: 1751.5, 1: 1769.0. Samples: 23710704. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:37:11,876][101941] Avg episode reward: [(0, '6.920'), (1, '8.540')] +[2023-10-08 13:37:11,905][102897] Updated weights for policy 0, policy_version 46280 (0.0009) +[2023-10-08 13:37:12,272][102897] Updated weights for policy 0, policy_version 46290 (0.0009) +[2023-10-08 13:37:12,653][102897] Updated weights for policy 0, policy_version 46300 (0.0007) +[2023-10-08 13:37:12,791][102898] Updated weights for policy 1, policy_version 46310 (0.0009) +[2023-10-08 13:37:13,155][102898] Updated weights for policy 1, policy_version 46320 (0.0011) +[2023-10-08 13:37:13,525][102898] Updated weights for policy 1, policy_version 46330 (0.0007) +[2023-10-08 13:37:16,433][102897] Updated weights for policy 0, policy_version 46310 (0.0010) +[2023-10-08 13:37:16,808][102897] Updated weights for policy 0, policy_version 46320 (0.0010) +[2023-10-08 13:37:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 94863360. Throughput: 0: 1785.2, 1: 1777.5. Samples: 23732820. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:37:16,875][101941] Avg episode reward: [(0, '6.840'), (1, '8.640')] +[2023-10-08 13:37:17,185][102897] Updated weights for policy 0, policy_version 46330 (0.0011) +[2023-10-08 13:37:17,384][102898] Updated weights for policy 1, policy_version 46340 (0.0008) +[2023-10-08 13:37:17,754][102898] Updated weights for policy 1, policy_version 46350 (0.0007) +[2023-10-08 13:37:18,118][102898] Updated weights for policy 1, policy_version 46360 (0.0007) +[2023-10-08 13:37:20,954][102897] Updated weights for policy 0, policy_version 46340 (0.0008) +[2023-10-08 13:37:21,332][102897] Updated weights for policy 0, policy_version 46350 (0.0007) +[2023-10-08 13:37:21,699][102897] Updated weights for policy 0, policy_version 46360 (0.0010) +[2023-10-08 13:37:21,858][102898] Updated weights for policy 1, policy_version 46370 (0.0007) +[2023-10-08 13:37:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 94928896. Throughput: 0: 1759.6, 1: 1764.0. Samples: 23742764. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:37:21,876][101941] Avg episode reward: [(0, '7.590'), (1, '8.330')] +[2023-10-08 13:37:22,224][102898] Updated weights for policy 1, policy_version 46380 (0.0008) +[2023-10-08 13:37:22,601][102898] Updated weights for policy 1, policy_version 46390 (0.0008) +[2023-10-08 13:37:22,971][102898] Updated weights for policy 1, policy_version 46400 (0.0010) +[2023-10-08 13:37:25,368][102897] Updated weights for policy 0, policy_version 46370 (0.0007) +[2023-10-08 13:37:25,739][102897] Updated weights for policy 0, policy_version 46380 (0.0010) +[2023-10-08 13:37:26,105][102897] Updated weights for policy 0, policy_version 46390 (0.0009) +[2023-10-08 13:37:26,477][102897] Updated weights for policy 0, policy_version 46400 (0.0007) +[2023-10-08 13:37:26,788][102898] Updated weights for policy 1, policy_version 46410 (0.0009) +[2023-10-08 13:37:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 95027200. Throughput: 0: 1789.4, 1: 1774.9. Samples: 23765032. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:37:26,875][101941] Avg episode reward: [(0, '7.750'), (1, '8.160')] +[2023-10-08 13:37:27,151][102898] Updated weights for policy 1, policy_version 46420 (0.0011) +[2023-10-08 13:37:27,519][102898] Updated weights for policy 1, policy_version 46430 (0.0010) +[2023-10-08 13:37:30,241][102897] Updated weights for policy 0, policy_version 46410 (0.0008) +[2023-10-08 13:37:30,620][102897] Updated weights for policy 0, policy_version 46420 (0.0007) +[2023-10-08 13:37:30,988][102897] Updated weights for policy 0, policy_version 46430 (0.0010) +[2023-10-08 13:37:31,474][102898] Updated weights for policy 1, policy_version 46440 (0.0008) +[2023-10-08 13:37:31,840][102898] Updated weights for policy 1, policy_version 46450 (0.0009) +[2023-10-08 13:37:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 95092736. Throughput: 0: 1772.6, 1: 1787.1. Samples: 23785274. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:37:31,876][101941] Avg episode reward: [(0, '7.910'), (1, '7.810')] +[2023-10-08 13:37:32,199][102898] Updated weights for policy 1, policy_version 46460 (0.0011) +[2023-10-08 13:37:34,821][102897] Updated weights for policy 0, policy_version 46440 (0.0008) +[2023-10-08 13:37:35,189][102897] Updated weights for policy 0, policy_version 46450 (0.0007) +[2023-10-08 13:37:35,569][102897] Updated weights for policy 0, policy_version 46460 (0.0009) +[2023-10-08 13:37:36,044][102898] Updated weights for policy 1, policy_version 46470 (0.0007) +[2023-10-08 13:37:36,413][102898] Updated weights for policy 1, policy_version 46480 (0.0007) +[2023-10-08 13:37:36,777][102898] Updated weights for policy 1, policy_version 46490 (0.0007) +[2023-10-08 13:37:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 13653.4, 300 sec: 14329.1). Total num frames: 95158272. Throughput: 0: 1792.0, 1: 1759.1. Samples: 23796700. Policy #0 lag: (min: 14.0, avg: 14.0, max: 14.0) +[2023-10-08 13:37:36,876][101941] Avg episode reward: [(0, '7.500'), (1, '8.370')] +[2023-10-08 13:37:39,451][102897] Updated weights for policy 0, policy_version 46470 (0.0010) +[2023-10-08 13:37:39,830][102897] Updated weights for policy 0, policy_version 46480 (0.0009) +[2023-10-08 13:37:40,197][102897] Updated weights for policy 0, policy_version 46490 (0.0009) +[2023-10-08 13:37:40,661][102898] Updated weights for policy 1, policy_version 46500 (0.0007) +[2023-10-08 13:37:41,027][102898] Updated weights for policy 1, policy_version 46510 (0.0008) +[2023-10-08 13:37:41,393][102898] Updated weights for policy 1, policy_version 46520 (0.0008) +[2023-10-08 13:37:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 95256576. Throughput: 0: 1779.8, 1: 1796.0. Samples: 23817822. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:37:41,876][101941] Avg episode reward: [(0, '6.650'), (1, '8.340')] +[2023-10-08 13:37:43,949][102897] Updated weights for policy 0, policy_version 46500 (0.0009) +[2023-10-08 13:37:44,319][102897] Updated weights for policy 0, policy_version 46510 (0.0009) +[2023-10-08 13:37:44,689][102897] Updated weights for policy 0, policy_version 46520 (0.0009) +[2023-10-08 13:37:44,934][102898] Updated weights for policy 1, policy_version 46530 (0.0008) +[2023-10-08 13:37:45,302][102898] Updated weights for policy 1, policy_version 46540 (0.0009) +[2023-10-08 13:37:45,666][102898] Updated weights for policy 1, policy_version 46550 (0.0007) +[2023-10-08 13:37:46,028][102898] Updated weights for policy 1, policy_version 46560 (0.0008) +[2023-10-08 13:37:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 95322112. Throughput: 0: 1782.3, 1: 1770.8. Samples: 23838926. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:37:46,876][101941] Avg episode reward: [(0, '7.070'), (1, '7.940')] +[2023-10-08 13:37:48,383][102897] Updated weights for policy 0, policy_version 46530 (0.0008) +[2023-10-08 13:37:48,755][102897] Updated weights for policy 0, policy_version 46540 (0.0008) +[2023-10-08 13:37:49,132][102897] Updated weights for policy 0, policy_version 46550 (0.0008) +[2023-10-08 13:37:49,503][102897] Updated weights for policy 0, policy_version 46560 (0.0008) +[2023-10-08 13:37:49,807][102898] Updated weights for policy 1, policy_version 46570 (0.0009) +[2023-10-08 13:37:50,172][102898] Updated weights for policy 1, policy_version 46580 (0.0007) +[2023-10-08 13:37:50,539][102898] Updated weights for policy 1, policy_version 46590 (0.0009) +[2023-10-08 13:37:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 95387648. Throughput: 0: 1787.6, 1: 1804.7. Samples: 23850202. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:37:51,876][101941] Avg episode reward: [(0, '7.200'), (1, '8.080')] +[2023-10-08 13:37:53,219][102897] Updated weights for policy 0, policy_version 46570 (0.0008) +[2023-10-08 13:37:53,594][102897] Updated weights for policy 0, policy_version 46580 (0.0009) +[2023-10-08 13:37:53,975][102897] Updated weights for policy 0, policy_version 46590 (0.0008) +[2023-10-08 13:37:54,176][102898] Updated weights for policy 1, policy_version 46600 (0.0007) +[2023-10-08 13:37:54,548][102898] Updated weights for policy 1, policy_version 46610 (0.0007) +[2023-10-08 13:37:54,906][102898] Updated weights for policy 1, policy_version 46620 (0.0009) +[2023-10-08 13:37:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 95453184. Throughput: 0: 1790.8, 1: 1775.1. Samples: 23871166. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:37:56,876][101941] Avg episode reward: [(0, '7.040'), (1, '8.900')] +[2023-10-08 13:37:57,837][102897] Updated weights for policy 0, policy_version 46600 (0.0009) +[2023-10-08 13:37:58,199][102897] Updated weights for policy 0, policy_version 46610 (0.0009) +[2023-10-08 13:37:58,576][102897] Updated weights for policy 0, policy_version 46620 (0.0010) +[2023-10-08 13:37:58,596][102898] Updated weights for policy 1, policy_version 46630 (0.0008) +[2023-10-08 13:37:58,952][102898] Updated weights for policy 1, policy_version 46640 (0.0011) +[2023-10-08 13:37:59,322][102898] Updated weights for policy 1, policy_version 46650 (0.0009) +[2023-10-08 13:38:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 95518720. Throughput: 0: 1784.0, 1: 1787.5. Samples: 23893538. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:38:01,876][101941] Avg episode reward: [(0, '7.310'), (1, '8.650')] +[2023-10-08 13:38:02,307][102897] Updated weights for policy 0, policy_version 46630 (0.0010) +[2023-10-08 13:38:02,671][102897] Updated weights for policy 0, policy_version 46640 (0.0010) +[2023-10-08 13:38:03,050][102897] Updated weights for policy 0, policy_version 46650 (0.0009) +[2023-10-08 13:38:03,155][102898] Updated weights for policy 1, policy_version 46660 (0.0007) +[2023-10-08 13:38:03,525][102898] Updated weights for policy 1, policy_version 46670 (0.0007) +[2023-10-08 13:38:03,881][102898] Updated weights for policy 1, policy_version 46680 (0.0007) +[2023-10-08 13:38:06,794][102897] Updated weights for policy 0, policy_version 46660 (0.0009) +[2023-10-08 13:38:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 95584256. Throughput: 0: 1782.2, 1: 1785.6. Samples: 23903316. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:38:06,876][101941] Avg episode reward: [(0, '7.170'), (1, '8.660')] +[2023-10-08 13:38:07,164][102897] Updated weights for policy 0, policy_version 46670 (0.0010) +[2023-10-08 13:38:07,545][102897] Updated weights for policy 0, policy_version 46680 (0.0008) +[2023-10-08 13:38:07,581][102898] Updated weights for policy 1, policy_version 46690 (0.0008) +[2023-10-08 13:38:07,946][102898] Updated weights for policy 1, policy_version 46700 (0.0007) +[2023-10-08 13:38:08,319][102898] Updated weights for policy 1, policy_version 46710 (0.0010) +[2023-10-08 13:38:08,674][102898] Updated weights for policy 1, policy_version 46720 (0.0010) +[2023-10-08 13:38:11,297][102897] Updated weights for policy 0, policy_version 46690 (0.0008) +[2023-10-08 13:38:11,665][102897] Updated weights for policy 0, policy_version 46700 (0.0010) +[2023-10-08 13:38:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 95649792. Throughput: 0: 1785.4, 1: 1785.0. Samples: 23925700. Policy #0 lag: (min: 21.0, avg: 26.3, max: 53.0) +[2023-10-08 13:38:11,876][101941] Avg episode reward: [(0, '6.310'), (1, '8.560')] +[2023-10-08 13:38:12,029][102897] Updated weights for policy 0, policy_version 46710 (0.0010) +[2023-10-08 13:38:12,402][102897] Updated weights for policy 0, policy_version 46720 (0.0010) +[2023-10-08 13:38:12,534][102898] Updated weights for policy 1, policy_version 46730 (0.0008) +[2023-10-08 13:38:12,895][102898] Updated weights for policy 1, policy_version 46740 (0.0010) +[2023-10-08 13:38:13,264][102898] Updated weights for policy 1, policy_version 46750 (0.0010) +[2023-10-08 13:38:16,210][102897] Updated weights for policy 0, policy_version 46730 (0.0008) +[2023-10-08 13:38:16,582][102897] Updated weights for policy 0, policy_version 46740 (0.0007) +[2023-10-08 13:38:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 95715328. Throughput: 0: 1799.0, 1: 1801.8. Samples: 23947310. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 13:38:16,876][101941] Avg episode reward: [(0, '6.770'), (1, '8.580')] +[2023-10-08 13:38:16,944][102897] Updated weights for policy 0, policy_version 46750 (0.0008) +[2023-10-08 13:38:17,016][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000046752_47874048.pth... +[2023-10-08 13:38:17,054][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000045056_46137344.pth +[2023-10-08 13:38:17,183][102898] Updated weights for policy 1, policy_version 46760 (0.0009) +[2023-10-08 13:38:17,549][102898] Updated weights for policy 1, policy_version 46770 (0.0008) +[2023-10-08 13:38:17,925][102898] Updated weights for policy 1, policy_version 46780 (0.0009) +[2023-10-08 13:38:18,072][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000046784_47906816.pth... +[2023-10-08 13:38:18,110][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000045088_46170112.pth +[2023-10-08 13:38:20,605][102897] Updated weights for policy 0, policy_version 46760 (0.0009) +[2023-10-08 13:38:20,981][102897] Updated weights for policy 0, policy_version 46770 (0.0009) +[2023-10-08 13:38:21,349][102897] Updated weights for policy 0, policy_version 46780 (0.0009) +[2023-10-08 13:38:21,746][102898] Updated weights for policy 1, policy_version 46790 (0.0008) +[2023-10-08 13:38:21,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 95813632. Throughput: 0: 1781.7, 1: 1795.4. Samples: 23957670. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 13:38:21,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.500')] +[2023-10-08 13:38:22,114][102898] Updated weights for policy 1, policy_version 46800 (0.0007) +[2023-10-08 13:38:22,482][102898] Updated weights for policy 1, policy_version 46810 (0.0007) +[2023-10-08 13:38:25,214][102897] Updated weights for policy 0, policy_version 46790 (0.0007) +[2023-10-08 13:38:25,589][102897] Updated weights for policy 0, policy_version 46800 (0.0009) +[2023-10-08 13:38:25,960][102897] Updated weights for policy 0, policy_version 46810 (0.0009) +[2023-10-08 13:38:26,169][102898] Updated weights for policy 1, policy_version 46820 (0.0008) +[2023-10-08 13:38:26,550][102898] Updated weights for policy 1, policy_version 46830 (0.0010) +[2023-10-08 13:38:26,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 95879168. Throughput: 0: 1800.1, 1: 1786.9. Samples: 23979238. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 13:38:26,876][101941] Avg episode reward: [(0, '7.770'), (1, '8.590')] +[2023-10-08 13:38:26,905][102898] Updated weights for policy 1, policy_version 46840 (0.0011) +[2023-10-08 13:38:29,798][102897] Updated weights for policy 0, policy_version 46820 (0.0009) +[2023-10-08 13:38:30,178][102897] Updated weights for policy 0, policy_version 46830 (0.0009) +[2023-10-08 13:38:30,540][102897] Updated weights for policy 0, policy_version 46840 (0.0008) +[2023-10-08 13:38:30,794][102898] Updated weights for policy 1, policy_version 46850 (0.0010) +[2023-10-08 13:38:31,161][102898] Updated weights for policy 1, policy_version 46860 (0.0011) +[2023-10-08 13:38:31,531][102898] Updated weights for policy 1, policy_version 46870 (0.0010) +[2023-10-08 13:38:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 95944704. Throughput: 0: 1777.5, 1: 1792.6. Samples: 23999578. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 13:38:31,876][101941] Avg episode reward: [(0, '7.610'), (1, '8.520')] +[2023-10-08 13:38:31,894][102898] Updated weights for policy 1, policy_version 46880 (0.0009) +[2023-10-08 13:38:34,195][102897] Updated weights for policy 0, policy_version 46850 (0.0007) +[2023-10-08 13:38:34,580][102897] Updated weights for policy 0, policy_version 46860 (0.0008) +[2023-10-08 13:38:34,943][102897] Updated weights for policy 0, policy_version 46870 (0.0010) +[2023-10-08 13:38:35,317][102897] Updated weights for policy 0, policy_version 46880 (0.0009) +[2023-10-08 13:38:35,795][102898] Updated weights for policy 1, policy_version 46890 (0.0008) +[2023-10-08 13:38:36,161][102898] Updated weights for policy 1, policy_version 46900 (0.0008) +[2023-10-08 13:38:36,531][102898] Updated weights for policy 1, policy_version 46910 (0.0008) +[2023-10-08 13:38:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 96043008. Throughput: 0: 1806.8, 1: 1776.3. Samples: 24011440. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 13:38:36,876][101941] Avg episode reward: [(0, '7.190'), (1, '7.760')] +[2023-10-08 13:38:39,054][102897] Updated weights for policy 0, policy_version 46890 (0.0007) +[2023-10-08 13:38:39,421][102897] Updated weights for policy 0, policy_version 46900 (0.0007) +[2023-10-08 13:38:39,790][102897] Updated weights for policy 0, policy_version 46910 (0.0008) +[2023-10-08 13:38:40,236][102898] Updated weights for policy 1, policy_version 46920 (0.0009) +[2023-10-08 13:38:40,603][102898] Updated weights for policy 1, policy_version 46930 (0.0010) +[2023-10-08 13:38:40,964][102898] Updated weights for policy 1, policy_version 46940 (0.0009) +[2023-10-08 13:38:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 96108544. Throughput: 0: 1780.6, 1: 1794.4. Samples: 24032038. Policy #0 lag: (min: 31.0, avg: 34.2, max: 63.0) +[2023-10-08 13:38:41,876][101941] Avg episode reward: [(0, '6.920'), (1, '8.450')] +[2023-10-08 13:38:43,570][102897] Updated weights for policy 0, policy_version 46920 (0.0010) +[2023-10-08 13:38:43,943][102897] Updated weights for policy 0, policy_version 46930 (0.0010) +[2023-10-08 13:38:44,308][102897] Updated weights for policy 0, policy_version 46940 (0.0008) +[2023-10-08 13:38:44,669][102898] Updated weights for policy 1, policy_version 46950 (0.0008) +[2023-10-08 13:38:45,033][102898] Updated weights for policy 1, policy_version 46960 (0.0007) +[2023-10-08 13:38:45,407][102898] Updated weights for policy 1, policy_version 46970 (0.0011) +[2023-10-08 13:38:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 96174080. Throughput: 0: 1785.6, 1: 1772.0. Samples: 24053632. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:38:46,876][101941] Avg episode reward: [(0, '6.820'), (1, '9.340')] +[2023-10-08 13:38:46,884][102760] Saving new best policy, reward=9.340! +[2023-10-08 13:38:48,259][102897] Updated weights for policy 0, policy_version 46950 (0.0009) +[2023-10-08 13:38:48,648][102897] Updated weights for policy 0, policy_version 46960 (0.0007) +[2023-10-08 13:38:49,012][102897] Updated weights for policy 0, policy_version 46970 (0.0008) +[2023-10-08 13:38:49,163][102898] Updated weights for policy 1, policy_version 46980 (0.0009) +[2023-10-08 13:38:49,533][102898] Updated weights for policy 1, policy_version 46990 (0.0008) +[2023-10-08 13:38:49,897][102898] Updated weights for policy 1, policy_version 47000 (0.0007) +[2023-10-08 13:38:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 96239616. Throughput: 0: 1781.5, 1: 1794.6. Samples: 24064240. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:38:51,876][101941] Avg episode reward: [(0, '7.090'), (1, '9.020')] +[2023-10-08 13:38:52,688][102897] Updated weights for policy 0, policy_version 46980 (0.0007) +[2023-10-08 13:38:53,064][102897] Updated weights for policy 0, policy_version 46990 (0.0008) +[2023-10-08 13:38:53,433][102897] Updated weights for policy 0, policy_version 47000 (0.0008) +[2023-10-08 13:38:53,676][102898] Updated weights for policy 1, policy_version 47010 (0.0008) +[2023-10-08 13:38:54,039][102898] Updated weights for policy 1, policy_version 47020 (0.0008) +[2023-10-08 13:38:54,403][102898] Updated weights for policy 1, policy_version 47030 (0.0009) +[2023-10-08 13:38:54,773][102898] Updated weights for policy 1, policy_version 47040 (0.0010) +[2023-10-08 13:38:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 96305152. Throughput: 0: 1780.8, 1: 1775.7. Samples: 24085744. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:38:56,876][101941] Avg episode reward: [(0, '6.910'), (1, '8.520')] +[2023-10-08 13:38:57,164][102897] Updated weights for policy 0, policy_version 47010 (0.0008) +[2023-10-08 13:38:57,539][102897] Updated weights for policy 0, policy_version 47020 (0.0008) +[2023-10-08 13:38:57,913][102897] Updated weights for policy 0, policy_version 47030 (0.0008) +[2023-10-08 13:38:58,276][102897] Updated weights for policy 0, policy_version 47040 (0.0008) +[2023-10-08 13:38:58,429][102898] Updated weights for policy 1, policy_version 47050 (0.0009) +[2023-10-08 13:38:58,788][102898] Updated weights for policy 1, policy_version 47060 (0.0007) +[2023-10-08 13:38:59,159][102898] Updated weights for policy 1, policy_version 47070 (0.0007) +[2023-10-08 13:39:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 96370688. Throughput: 0: 1791.6, 1: 1779.6. Samples: 24108012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:39:01,876][101941] Avg episode reward: [(0, '7.070'), (1, '8.390')] +[2023-10-08 13:39:02,174][102897] Updated weights for policy 0, policy_version 47050 (0.0007) +[2023-10-08 13:39:02,553][102897] Updated weights for policy 0, policy_version 47060 (0.0008) +[2023-10-08 13:39:02,923][102897] Updated weights for policy 0, policy_version 47070 (0.0008) +[2023-10-08 13:39:03,050][102898] Updated weights for policy 1, policy_version 47080 (0.0007) +[2023-10-08 13:39:03,424][102898] Updated weights for policy 1, policy_version 47090 (0.0007) +[2023-10-08 13:39:03,799][102898] Updated weights for policy 1, policy_version 47100 (0.0007) +[2023-10-08 13:39:06,604][102897] Updated weights for policy 0, policy_version 47080 (0.0007) +[2023-10-08 13:39:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 96436224. Throughput: 0: 1775.2, 1: 1779.6. Samples: 24117636. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:39:06,876][101941] Avg episode reward: [(0, '7.240'), (1, '8.790')] +[2023-10-08 13:39:06,978][102897] Updated weights for policy 0, policy_version 47090 (0.0007) +[2023-10-08 13:39:07,345][102897] Updated weights for policy 0, policy_version 47100 (0.0008) +[2023-10-08 13:39:07,418][102898] Updated weights for policy 1, policy_version 47110 (0.0009) +[2023-10-08 13:39:07,785][102898] Updated weights for policy 1, policy_version 47120 (0.0007) +[2023-10-08 13:39:08,149][102898] Updated weights for policy 1, policy_version 47130 (0.0008) +[2023-10-08 13:39:11,058][102897] Updated weights for policy 0, policy_version 47110 (0.0008) +[2023-10-08 13:39:11,430][102897] Updated weights for policy 0, policy_version 47120 (0.0008) +[2023-10-08 13:39:11,800][102897] Updated weights for policy 0, policy_version 47130 (0.0007) +[2023-10-08 13:39:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 96501760. Throughput: 0: 1790.0, 1: 1789.5. Samples: 24140316. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:39:11,875][101941] Avg episode reward: [(0, '7.170'), (1, '9.030')] +[2023-10-08 13:39:11,906][102898] Updated weights for policy 1, policy_version 47140 (0.0009) +[2023-10-08 13:39:12,275][102898] Updated weights for policy 1, policy_version 47150 (0.0007) +[2023-10-08 13:39:12,640][102898] Updated weights for policy 1, policy_version 47160 (0.0007) +[2023-10-08 13:39:15,468][102897] Updated weights for policy 0, policy_version 47140 (0.0007) +[2023-10-08 13:39:15,836][102897] Updated weights for policy 0, policy_version 47150 (0.0010) +[2023-10-08 13:39:16,209][102897] Updated weights for policy 0, policy_version 47160 (0.0010) +[2023-10-08 13:39:16,326][102898] Updated weights for policy 1, policy_version 47170 (0.0009) +[2023-10-08 13:39:16,696][102898] Updated weights for policy 1, policy_version 47180 (0.0009) +[2023-10-08 13:39:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 96600064. Throughput: 0: 1786.5, 1: 1803.8. Samples: 24161144. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:16,876][101941] Avg episode reward: [(0, '6.790'), (1, '7.930')] +[2023-10-08 13:39:17,051][102898] Updated weights for policy 1, policy_version 47190 (0.0009) +[2023-10-08 13:39:17,418][102898] Updated weights for policy 1, policy_version 47200 (0.0007) +[2023-10-08 13:39:19,979][102897] Updated weights for policy 0, policy_version 47170 (0.0008) +[2023-10-08 13:39:20,353][102897] Updated weights for policy 0, policy_version 47180 (0.0008) +[2023-10-08 13:39:20,715][102897] Updated weights for policy 0, policy_version 47190 (0.0008) +[2023-10-08 13:39:21,090][102897] Updated weights for policy 0, policy_version 47200 (0.0007) +[2023-10-08 13:39:21,094][102898] Updated weights for policy 1, policy_version 47210 (0.0008) +[2023-10-08 13:39:21,464][102898] Updated weights for policy 1, policy_version 47220 (0.0009) +[2023-10-08 13:39:21,836][102898] Updated weights for policy 1, policy_version 47230 (0.0008) +[2023-10-08 13:39:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 96665600. Throughput: 0: 1786.5, 1: 1791.8. Samples: 24172466. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:21,875][101941] Avg episode reward: [(0, '6.860'), (1, '7.900')] +[2023-10-08 13:39:24,855][102897] Updated weights for policy 0, policy_version 47210 (0.0007) +[2023-10-08 13:39:25,219][102897] Updated weights for policy 0, policy_version 47220 (0.0008) +[2023-10-08 13:39:25,508][102898] Updated weights for policy 1, policy_version 47240 (0.0007) +[2023-10-08 13:39:25,594][102897] Updated weights for policy 0, policy_version 47230 (0.0008) +[2023-10-08 13:39:25,873][102898] Updated weights for policy 1, policy_version 47250 (0.0008) +[2023-10-08 13:39:26,234][102898] Updated weights for policy 1, policy_version 47260 (0.0008) +[2023-10-08 13:39:26,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 96763904. Throughput: 0: 1788.9, 1: 1806.8. Samples: 24193844. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:26,875][101941] Avg episode reward: [(0, '6.920'), (1, '8.740')] +[2023-10-08 13:39:29,490][102897] Updated weights for policy 0, policy_version 47240 (0.0009) +[2023-10-08 13:39:29,867][102897] Updated weights for policy 0, policy_version 47250 (0.0007) +[2023-10-08 13:39:30,060][102898] Updated weights for policy 1, policy_version 47270 (0.0007) +[2023-10-08 13:39:30,242][102897] Updated weights for policy 0, policy_version 47260 (0.0007) +[2023-10-08 13:39:30,421][102898] Updated weights for policy 1, policy_version 47280 (0.0007) +[2023-10-08 13:39:30,798][102898] Updated weights for policy 1, policy_version 47290 (0.0008) +[2023-10-08 13:39:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 96829440. Throughput: 0: 1778.7, 1: 1799.1. Samples: 24214634. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:31,876][101941] Avg episode reward: [(0, '6.740'), (1, '8.490')] +[2023-10-08 13:39:33,929][102897] Updated weights for policy 0, policy_version 47270 (0.0007) +[2023-10-08 13:39:34,301][102897] Updated weights for policy 0, policy_version 47280 (0.0008) +[2023-10-08 13:39:34,565][102898] Updated weights for policy 1, policy_version 47300 (0.0008) +[2023-10-08 13:39:34,661][102897] Updated weights for policy 0, policy_version 47290 (0.0008) +[2023-10-08 13:39:34,927][102898] Updated weights for policy 1, policy_version 47310 (0.0008) +[2023-10-08 13:39:35,298][102898] Updated weights for policy 1, policy_version 47320 (0.0009) +[2023-10-08 13:39:36,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 96894976. Throughput: 0: 1793.7, 1: 1811.2. Samples: 24226462. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:36,876][101941] Avg episode reward: [(0, '6.630'), (1, '8.230')] +[2023-10-08 13:39:38,655][102897] Updated weights for policy 0, policy_version 47300 (0.0007) +[2023-10-08 13:39:39,020][102897] Updated weights for policy 0, policy_version 47310 (0.0007) +[2023-10-08 13:39:39,090][102898] Updated weights for policy 1, policy_version 47330 (0.0008) +[2023-10-08 13:39:39,386][102897] Updated weights for policy 0, policy_version 47320 (0.0008) +[2023-10-08 13:39:39,467][102898] Updated weights for policy 1, policy_version 47340 (0.0009) +[2023-10-08 13:39:39,830][102898] Updated weights for policy 1, policy_version 47350 (0.0007) +[2023-10-08 13:39:40,203][102898] Updated weights for policy 1, policy_version 47360 (0.0010) +[2023-10-08 13:39:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 96960512. Throughput: 0: 1776.5, 1: 1798.7. Samples: 24246628. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:41,876][101941] Avg episode reward: [(0, '6.430'), (1, '8.180')] +[2023-10-08 13:39:43,108][102897] Updated weights for policy 0, policy_version 47330 (0.0007) +[2023-10-08 13:39:43,472][102897] Updated weights for policy 0, policy_version 47340 (0.0008) +[2023-10-08 13:39:43,840][102897] Updated weights for policy 0, policy_version 47350 (0.0007) +[2023-10-08 13:39:43,878][102898] Updated weights for policy 1, policy_version 47370 (0.0010) +[2023-10-08 13:39:44,219][102897] Updated weights for policy 0, policy_version 47360 (0.0008) +[2023-10-08 13:39:44,250][102898] Updated weights for policy 1, policy_version 47380 (0.0007) +[2023-10-08 13:39:44,625][102898] Updated weights for policy 1, policy_version 47390 (0.0007) +[2023-10-08 13:39:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 97026048. Throughput: 0: 1783.6, 1: 1795.2. Samples: 24269058. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 13:39:46,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.640')] +[2023-10-08 13:39:48,045][102897] Updated weights for policy 0, policy_version 47370 (0.0009) +[2023-10-08 13:39:48,418][102897] Updated weights for policy 0, policy_version 47380 (0.0008) +[2023-10-08 13:39:48,559][102898] Updated weights for policy 1, policy_version 47400 (0.0008) +[2023-10-08 13:39:48,786][102897] Updated weights for policy 0, policy_version 47390 (0.0008) +[2023-10-08 13:39:48,933][102898] Updated weights for policy 1, policy_version 47410 (0.0010) +[2023-10-08 13:39:49,301][102898] Updated weights for policy 1, policy_version 47420 (0.0010) +[2023-10-08 13:39:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 97091584. Throughput: 0: 1781.2, 1: 1794.1. Samples: 24278524. Policy #0 lag: (min: 20.0, avg: 25.9, max: 52.0) +[2023-10-08 13:39:51,876][101941] Avg episode reward: [(0, '7.950'), (1, '9.450')] +[2023-10-08 13:39:51,878][102760] Saving new best policy, reward=9.450! +[2023-10-08 13:39:52,562][102897] Updated weights for policy 0, policy_version 47400 (0.0009) +[2023-10-08 13:39:52,922][102897] Updated weights for policy 0, policy_version 47410 (0.0008) +[2023-10-08 13:39:53,032][102898] Updated weights for policy 1, policy_version 47430 (0.0008) +[2023-10-08 13:39:53,294][102897] Updated weights for policy 0, policy_version 47420 (0.0007) +[2023-10-08 13:39:53,397][102898] Updated weights for policy 1, policy_version 47440 (0.0007) +[2023-10-08 13:39:53,765][102898] Updated weights for policy 1, policy_version 47450 (0.0009) +[2023-10-08 13:39:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 97157120. Throughput: 0: 1778.4, 1: 1783.0. Samples: 24300580. Policy #0 lag: (min: 20.0, avg: 25.9, max: 52.0) +[2023-10-08 13:39:56,875][101941] Avg episode reward: [(0, '7.090'), (1, '9.260')] +[2023-10-08 13:39:57,066][102897] Updated weights for policy 0, policy_version 47430 (0.0007) +[2023-10-08 13:39:57,440][102897] Updated weights for policy 0, policy_version 47440 (0.0008) +[2023-10-08 13:39:57,647][102898] Updated weights for policy 1, policy_version 47460 (0.0008) +[2023-10-08 13:39:57,806][102897] Updated weights for policy 0, policy_version 47450 (0.0009) +[2023-10-08 13:39:58,009][102898] Updated weights for policy 1, policy_version 47470 (0.0007) +[2023-10-08 13:39:58,379][102898] Updated weights for policy 1, policy_version 47480 (0.0009) +[2023-10-08 13:40:01,482][102897] Updated weights for policy 0, policy_version 47460 (0.0007) +[2023-10-08 13:40:01,858][102897] Updated weights for policy 0, policy_version 47470 (0.0009) +[2023-10-08 13:40:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 97222656. Throughput: 0: 1800.9, 1: 1795.2. Samples: 24322968. Policy #0 lag: (min: 20.0, avg: 25.9, max: 52.0) +[2023-10-08 13:40:01,876][101941] Avg episode reward: [(0, '6.760'), (1, '8.230')] +[2023-10-08 13:40:02,087][102898] Updated weights for policy 1, policy_version 47490 (0.0008) +[2023-10-08 13:40:02,227][102897] Updated weights for policy 0, policy_version 47480 (0.0007) +[2023-10-08 13:40:02,445][102898] Updated weights for policy 1, policy_version 47500 (0.0008) +[2023-10-08 13:40:02,812][102898] Updated weights for policy 1, policy_version 47510 (0.0009) +[2023-10-08 13:40:03,179][102898] Updated weights for policy 1, policy_version 47520 (0.0011) +[2023-10-08 13:40:06,109][102897] Updated weights for policy 0, policy_version 47490 (0.0007) +[2023-10-08 13:40:06,481][102897] Updated weights for policy 0, policy_version 47500 (0.0007) +[2023-10-08 13:40:06,854][102897] Updated weights for policy 0, policy_version 47510 (0.0010) +[2023-10-08 13:40:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 97288192. Throughput: 0: 1773.8, 1: 1793.9. Samples: 24333014. Policy #0 lag: (min: 20.0, avg: 25.9, max: 52.0) +[2023-10-08 13:40:06,876][101941] Avg episode reward: [(0, '6.430'), (1, '8.460')] +[2023-10-08 13:40:06,943][102898] Updated weights for policy 1, policy_version 47530 (0.0008) +[2023-10-08 13:40:07,212][102897] Updated weights for policy 0, policy_version 47520 (0.0007) +[2023-10-08 13:40:07,309][102898] Updated weights for policy 1, policy_version 47540 (0.0007) +[2023-10-08 13:40:07,687][102898] Updated weights for policy 1, policy_version 47550 (0.0009) +[2023-10-08 13:40:11,001][102897] Updated weights for policy 0, policy_version 47530 (0.0007) +[2023-10-08 13:40:11,372][102897] Updated weights for policy 0, policy_version 47540 (0.0007) +[2023-10-08 13:40:11,462][102898] Updated weights for policy 1, policy_version 47560 (0.0009) +[2023-10-08 13:40:11,753][102897] Updated weights for policy 0, policy_version 47550 (0.0007) +[2023-10-08 13:40:11,831][102898] Updated weights for policy 1, policy_version 47570 (0.0009) +[2023-10-08 13:40:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 97386496. Throughput: 0: 1789.5, 1: 1791.5. Samples: 24354988. Policy #0 lag: (min: 20.0, avg: 25.9, max: 52.0) +[2023-10-08 13:40:11,876][101941] Avg episode reward: [(0, '6.610'), (1, '7.960')] +[2023-10-08 13:40:12,198][102898] Updated weights for policy 1, policy_version 47580 (0.0007) +[2023-10-08 13:40:15,698][102897] Updated weights for policy 0, policy_version 47560 (0.0008) +[2023-10-08 13:40:15,953][102898] Updated weights for policy 1, policy_version 47590 (0.0009) +[2023-10-08 13:40:16,069][102897] Updated weights for policy 0, policy_version 47570 (0.0007) +[2023-10-08 13:40:16,322][102898] Updated weights for policy 1, policy_version 47600 (0.0009) +[2023-10-08 13:40:16,431][102897] Updated weights for policy 0, policy_version 47580 (0.0007) +[2023-10-08 13:40:16,692][102898] Updated weights for policy 1, policy_version 47610 (0.0007) +[2023-10-08 13:40:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 97452032. Throughput: 0: 1769.7, 1: 1796.6. Samples: 24375120. Policy #0 lag: (min: 20.0, avg: 25.9, max: 52.0) +[2023-10-08 13:40:16,876][101941] Avg episode reward: [(0, '6.740'), (1, '7.860')] +[2023-10-08 13:40:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000047584_48726016.pth... +[2023-10-08 13:40:16,907][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000047616_48758784.pth... +[2023-10-08 13:40:16,924][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000045920_47022080.pth +[2023-10-08 13:40:16,936][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000045952_47054848.pth +[2023-10-08 13:40:19,975][102897] Updated weights for policy 0, policy_version 47590 (0.0010) +[2023-10-08 13:40:20,342][102897] Updated weights for policy 0, policy_version 47600 (0.0009) +[2023-10-08 13:40:20,418][102898] Updated weights for policy 1, policy_version 47620 (0.0008) +[2023-10-08 13:40:20,722][102897] Updated weights for policy 0, policy_version 47610 (0.0009) +[2023-10-08 13:40:20,790][102898] Updated weights for policy 1, policy_version 47630 (0.0008) +[2023-10-08 13:40:21,159][102898] Updated weights for policy 1, policy_version 47640 (0.0008) +[2023-10-08 13:40:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 97550336. Throughput: 0: 1784.6, 1: 1783.4. Samples: 24387020. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:21,876][101941] Avg episode reward: [(0, '6.620'), (1, '8.100')] +[2023-10-08 13:40:24,483][102897] Updated weights for policy 0, policy_version 47620 (0.0009) +[2023-10-08 13:40:24,840][102898] Updated weights for policy 1, policy_version 47650 (0.0009) +[2023-10-08 13:40:24,852][102897] Updated weights for policy 0, policy_version 47630 (0.0007) +[2023-10-08 13:40:25,208][102898] Updated weights for policy 1, policy_version 47660 (0.0008) +[2023-10-08 13:40:25,234][102897] Updated weights for policy 0, policy_version 47640 (0.0008) +[2023-10-08 13:40:25,568][102898] Updated weights for policy 1, policy_version 47670 (0.0008) +[2023-10-08 13:40:25,937][102898] Updated weights for policy 1, policy_version 47680 (0.0008) +[2023-10-08 13:40:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 97615872. Throughput: 0: 1774.4, 1: 1800.4. Samples: 24407494. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:26,876][101941] Avg episode reward: [(0, '7.090'), (1, '8.270')] +[2023-10-08 13:40:29,057][102897] Updated weights for policy 0, policy_version 47650 (0.0007) +[2023-10-08 13:40:29,425][102897] Updated weights for policy 0, policy_version 47660 (0.0007) +[2023-10-08 13:40:29,788][102897] Updated weights for policy 0, policy_version 47670 (0.0010) +[2023-10-08 13:40:29,811][102898] Updated weights for policy 1, policy_version 47690 (0.0009) +[2023-10-08 13:40:30,168][102897] Updated weights for policy 0, policy_version 47680 (0.0008) +[2023-10-08 13:40:30,176][102898] Updated weights for policy 1, policy_version 47700 (0.0008) +[2023-10-08 13:40:30,539][102898] Updated weights for policy 1, policy_version 47710 (0.0011) +[2023-10-08 13:40:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 97681408. Throughput: 0: 1766.2, 1: 1785.8. Samples: 24428898. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:31,876][101941] Avg episode reward: [(0, '6.520'), (1, '8.070')] +[2023-10-08 13:40:34,082][102897] Updated weights for policy 0, policy_version 47690 (0.0007) +[2023-10-08 13:40:34,448][102897] Updated weights for policy 0, policy_version 47700 (0.0007) +[2023-10-08 13:40:34,480][102898] Updated weights for policy 1, policy_version 47720 (0.0009) +[2023-10-08 13:40:34,821][102897] Updated weights for policy 0, policy_version 47710 (0.0007) +[2023-10-08 13:40:34,853][102898] Updated weights for policy 1, policy_version 47730 (0.0008) +[2023-10-08 13:40:35,219][102898] Updated weights for policy 1, policy_version 47740 (0.0008) +[2023-10-08 13:40:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 97746944. Throughput: 0: 1784.6, 1: 1806.4. Samples: 24440118. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:36,876][101941] Avg episode reward: [(0, '6.550'), (1, '8.350')] +[2023-10-08 13:40:38,562][102897] Updated weights for policy 0, policy_version 47720 (0.0009) +[2023-10-08 13:40:38,909][102898] Updated weights for policy 1, policy_version 47750 (0.0008) +[2023-10-08 13:40:38,944][102897] Updated weights for policy 0, policy_version 47730 (0.0008) +[2023-10-08 13:40:39,272][102898] Updated weights for policy 1, policy_version 47760 (0.0007) +[2023-10-08 13:40:39,310][102897] Updated weights for policy 0, policy_version 47740 (0.0007) +[2023-10-08 13:40:39,649][102898] Updated weights for policy 1, policy_version 47770 (0.0008) +[2023-10-08 13:40:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 97812480. Throughput: 0: 1778.1, 1: 1786.8. Samples: 24461002. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:41,876][101941] Avg episode reward: [(0, '6.970'), (1, '8.620')] +[2023-10-08 13:40:43,081][102897] Updated weights for policy 0, policy_version 47750 (0.0009) +[2023-10-08 13:40:43,436][102898] Updated weights for policy 1, policy_version 47780 (0.0008) +[2023-10-08 13:40:43,448][102897] Updated weights for policy 0, policy_version 47760 (0.0010) +[2023-10-08 13:40:43,809][102898] Updated weights for policy 1, policy_version 47790 (0.0008) +[2023-10-08 13:40:43,821][102897] Updated weights for policy 0, policy_version 47770 (0.0009) +[2023-10-08 13:40:44,164][102898] Updated weights for policy 1, policy_version 47800 (0.0008) +[2023-10-08 13:40:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 97878016. Throughput: 0: 1777.5, 1: 1779.6. Samples: 24483034. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:46,876][101941] Avg episode reward: [(0, '7.160'), (1, '8.250')] +[2023-10-08 13:40:47,621][102897] Updated weights for policy 0, policy_version 47780 (0.0007) +[2023-10-08 13:40:47,811][102898] Updated weights for policy 1, policy_version 47810 (0.0007) +[2023-10-08 13:40:47,989][102897] Updated weights for policy 0, policy_version 47790 (0.0009) +[2023-10-08 13:40:48,176][102898] Updated weights for policy 1, policy_version 47820 (0.0007) +[2023-10-08 13:40:48,359][102897] Updated weights for policy 0, policy_version 47800 (0.0009) +[2023-10-08 13:40:48,533][102898] Updated weights for policy 1, policy_version 47830 (0.0007) +[2023-10-08 13:40:48,900][102898] Updated weights for policy 1, policy_version 47840 (0.0007) +[2023-10-08 13:40:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 97943552. Throughput: 0: 1771.8, 1: 1775.8. Samples: 24492654. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 13:40:51,875][101941] Avg episode reward: [(0, '7.590'), (1, '7.890')] +[2023-10-08 13:40:52,089][102897] Updated weights for policy 0, policy_version 47810 (0.0009) +[2023-10-08 13:40:52,462][102897] Updated weights for policy 0, policy_version 47820 (0.0009) +[2023-10-08 13:40:52,684][102898] Updated weights for policy 1, policy_version 47850 (0.0008) +[2023-10-08 13:40:52,835][102897] Updated weights for policy 0, policy_version 47830 (0.0008) +[2023-10-08 13:40:53,050][102898] Updated weights for policy 1, policy_version 47860 (0.0007) +[2023-10-08 13:40:53,209][102897] Updated weights for policy 0, policy_version 47840 (0.0008) +[2023-10-08 13:40:53,418][102898] Updated weights for policy 1, policy_version 47870 (0.0009) +[2023-10-08 13:40:56,769][102897] Updated weights for policy 0, policy_version 47850 (0.0011) +[2023-10-08 13:40:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 98009088. Throughput: 0: 1780.7, 1: 1776.6. Samples: 24515066. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 13:40:56,876][101941] Avg episode reward: [(0, '7.370'), (1, '8.340')] +[2023-10-08 13:40:57,143][102897] Updated weights for policy 0, policy_version 47860 (0.0007) +[2023-10-08 13:40:57,164][102898] Updated weights for policy 1, policy_version 47880 (0.0008) +[2023-10-08 13:40:57,517][102897] Updated weights for policy 0, policy_version 47870 (0.0009) +[2023-10-08 13:40:57,522][102898] Updated weights for policy 1, policy_version 47890 (0.0008) +[2023-10-08 13:40:57,886][102898] Updated weights for policy 1, policy_version 47900 (0.0010) +[2023-10-08 13:41:01,326][102897] Updated weights for policy 0, policy_version 47880 (0.0007) +[2023-10-08 13:41:01,604][102898] Updated weights for policy 1, policy_version 47910 (0.0008) +[2023-10-08 13:41:01,693][102897] Updated weights for policy 0, policy_version 47890 (0.0007) +[2023-10-08 13:41:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 98074624. Throughput: 0: 1798.7, 1: 1797.6. Samples: 24536952. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 13:41:01,876][101941] Avg episode reward: [(0, '7.760'), (1, '8.380')] +[2023-10-08 13:41:01,971][102898] Updated weights for policy 1, policy_version 47920 (0.0008) +[2023-10-08 13:41:02,063][102897] Updated weights for policy 0, policy_version 47900 (0.0009) +[2023-10-08 13:41:02,327][102898] Updated weights for policy 1, policy_version 47930 (0.0011) +[2023-10-08 13:41:05,811][102897] Updated weights for policy 0, policy_version 47910 (0.0008) +[2023-10-08 13:41:06,176][102898] Updated weights for policy 1, policy_version 47940 (0.0008) +[2023-10-08 13:41:06,180][102897] Updated weights for policy 0, policy_version 47920 (0.0008) +[2023-10-08 13:41:06,539][102897] Updated weights for policy 0, policy_version 47930 (0.0007) +[2023-10-08 13:41:06,543][102898] Updated weights for policy 1, policy_version 47950 (0.0007) +[2023-10-08 13:41:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 98172928. Throughput: 0: 1780.2, 1: 1777.3. Samples: 24547108. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 13:41:06,876][101941] Avg episode reward: [(0, '7.360'), (1, '8.250')] +[2023-10-08 13:41:06,906][102898] Updated weights for policy 1, policy_version 47960 (0.0010) +[2023-10-08 13:41:10,403][102897] Updated weights for policy 0, policy_version 47940 (0.0009) +[2023-10-08 13:41:10,768][102897] Updated weights for policy 0, policy_version 47950 (0.0008) +[2023-10-08 13:41:10,771][102898] Updated weights for policy 1, policy_version 47970 (0.0009) +[2023-10-08 13:41:11,132][102898] Updated weights for policy 1, policy_version 47980 (0.0008) +[2023-10-08 13:41:11,135][102897] Updated weights for policy 0, policy_version 47960 (0.0008) +[2023-10-08 13:41:11,497][102898] Updated weights for policy 1, policy_version 47990 (0.0009) +[2023-10-08 13:41:11,866][102898] Updated weights for policy 1, policy_version 48000 (0.0010) +[2023-10-08 13:41:11,875][101941] Fps is (10 sec: 19660.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 98271232. Throughput: 0: 1801.3, 1: 1789.5. Samples: 24569082. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 13:41:11,876][101941] Avg episode reward: [(0, '6.530'), (1, '7.900')] +[2023-10-08 13:41:14,955][102897] Updated weights for policy 0, policy_version 47970 (0.0007) +[2023-10-08 13:41:15,328][102897] Updated weights for policy 0, policy_version 47980 (0.0010) +[2023-10-08 13:41:15,692][102897] Updated weights for policy 0, policy_version 47990 (0.0007) +[2023-10-08 13:41:15,899][102898] Updated weights for policy 1, policy_version 48010 (0.0008) +[2023-10-08 13:41:16,062][102897] Updated weights for policy 0, policy_version 48000 (0.0007) +[2023-10-08 13:41:16,266][102898] Updated weights for policy 1, policy_version 48020 (0.0008) +[2023-10-08 13:41:16,633][102898] Updated weights for policy 1, policy_version 48030 (0.0007) +[2023-10-08 13:41:16,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 98336768. Throughput: 0: 1781.4, 1: 1776.4. Samples: 24588996. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 13:41:16,876][101941] Avg episode reward: [(0, '6.930'), (1, '7.850')] +[2023-10-08 13:41:20,045][102897] Updated weights for policy 0, policy_version 48010 (0.0009) +[2023-10-08 13:41:20,352][102898] Updated weights for policy 1, policy_version 48040 (0.0010) +[2023-10-08 13:41:20,421][102897] Updated weights for policy 0, policy_version 48020 (0.0009) +[2023-10-08 13:41:20,709][102898] Updated weights for policy 1, policy_version 48050 (0.0009) +[2023-10-08 13:41:20,784][102897] Updated weights for policy 0, policy_version 48030 (0.0008) +[2023-10-08 13:41:21,071][102898] Updated weights for policy 1, policy_version 48060 (0.0007) +[2023-10-08 13:41:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 98402304. Throughput: 0: 1795.2, 1: 1784.8. Samples: 24601220. Policy #0 lag: (min: 31.0, avg: 38.3, max: 63.0) +[2023-10-08 13:41:21,876][101941] Avg episode reward: [(0, '6.370'), (1, '8.210')] +[2023-10-08 13:41:24,427][102897] Updated weights for policy 0, policy_version 48040 (0.0008) +[2023-10-08 13:41:24,652][102898] Updated weights for policy 1, policy_version 48070 (0.0008) +[2023-10-08 13:41:24,795][102897] Updated weights for policy 0, policy_version 48050 (0.0007) +[2023-10-08 13:41:25,007][102898] Updated weights for policy 1, policy_version 48080 (0.0008) +[2023-10-08 13:41:25,179][102897] Updated weights for policy 0, policy_version 48060 (0.0007) +[2023-10-08 13:41:25,368][102898] Updated weights for policy 1, policy_version 48090 (0.0008) +[2023-10-08 13:41:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 98467840. Throughput: 0: 1771.2, 1: 1782.7. Samples: 24620924. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:26,876][101941] Avg episode reward: [(0, '6.700'), (1, '8.440')] +[2023-10-08 13:41:28,986][102897] Updated weights for policy 0, policy_version 48070 (0.0008) +[2023-10-08 13:41:29,225][102898] Updated weights for policy 1, policy_version 48100 (0.0009) +[2023-10-08 13:41:29,349][102897] Updated weights for policy 0, policy_version 48080 (0.0007) +[2023-10-08 13:41:29,593][102898] Updated weights for policy 1, policy_version 48110 (0.0008) +[2023-10-08 13:41:29,719][102897] Updated weights for policy 0, policy_version 48090 (0.0007) +[2023-10-08 13:41:29,955][102898] Updated weights for policy 1, policy_version 48120 (0.0008) +[2023-10-08 13:41:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 98533376. Throughput: 0: 1772.9, 1: 1777.7. Samples: 24642812. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:31,876][101941] Avg episode reward: [(0, '7.280'), (1, '8.860')] +[2023-10-08 13:41:33,626][102897] Updated weights for policy 0, policy_version 48100 (0.0007) +[2023-10-08 13:41:33,798][102898] Updated weights for policy 1, policy_version 48130 (0.0007) +[2023-10-08 13:41:33,998][102897] Updated weights for policy 0, policy_version 48110 (0.0007) +[2023-10-08 13:41:34,168][102898] Updated weights for policy 1, policy_version 48140 (0.0008) +[2023-10-08 13:41:34,359][102897] Updated weights for policy 0, policy_version 48120 (0.0007) +[2023-10-08 13:41:34,535][102898] Updated weights for policy 1, policy_version 48150 (0.0008) +[2023-10-08 13:41:34,896][102898] Updated weights for policy 1, policy_version 48160 (0.0007) +[2023-10-08 13:41:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 98598912. Throughput: 0: 1781.6, 1: 1795.0. Samples: 24653604. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:36,876][101941] Avg episode reward: [(0, '7.550'), (1, '8.720')] +[2023-10-08 13:41:37,925][102897] Updated weights for policy 0, policy_version 48130 (0.0008) +[2023-10-08 13:41:38,288][102897] Updated weights for policy 0, policy_version 48140 (0.0008) +[2023-10-08 13:41:38,653][102897] Updated weights for policy 0, policy_version 48150 (0.0007) +[2023-10-08 13:41:38,669][102898] Updated weights for policy 1, policy_version 48170 (0.0008) +[2023-10-08 13:41:39,021][102897] Updated weights for policy 0, policy_version 48160 (0.0008) +[2023-10-08 13:41:39,029][102898] Updated weights for policy 1, policy_version 48180 (0.0009) +[2023-10-08 13:41:39,395][102898] Updated weights for policy 1, policy_version 48190 (0.0009) +[2023-10-08 13:41:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 98664448. Throughput: 0: 1775.4, 1: 1778.0. Samples: 24674970. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:41,876][101941] Avg episode reward: [(0, '7.390'), (1, '8.380')] +[2023-10-08 13:41:42,920][102897] Updated weights for policy 0, policy_version 48170 (0.0009) +[2023-10-08 13:41:43,196][102898] Updated weights for policy 1, policy_version 48200 (0.0008) +[2023-10-08 13:41:43,286][102897] Updated weights for policy 0, policy_version 48180 (0.0007) +[2023-10-08 13:41:43,563][102898] Updated weights for policy 1, policy_version 48210 (0.0009) +[2023-10-08 13:41:43,660][102897] Updated weights for policy 0, policy_version 48190 (0.0007) +[2023-10-08 13:41:43,928][102898] Updated weights for policy 1, policy_version 48220 (0.0010) +[2023-10-08 13:41:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 98729984. Throughput: 0: 1782.4, 1: 1773.7. Samples: 24696976. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:46,875][101941] Avg episode reward: [(0, '7.190'), (1, '8.370')] +[2023-10-08 13:41:47,280][102897] Updated weights for policy 0, policy_version 48200 (0.0009) +[2023-10-08 13:41:47,648][102897] Updated weights for policy 0, policy_version 48210 (0.0007) +[2023-10-08 13:41:47,707][102898] Updated weights for policy 1, policy_version 48230 (0.0009) +[2023-10-08 13:41:48,019][102897] Updated weights for policy 0, policy_version 48220 (0.0008) +[2023-10-08 13:41:48,072][102898] Updated weights for policy 1, policy_version 48240 (0.0009) +[2023-10-08 13:41:48,436][102898] Updated weights for policy 1, policy_version 48250 (0.0008) +[2023-10-08 13:41:51,778][102897] Updated weights for policy 0, policy_version 48230 (0.0009) +[2023-10-08 13:41:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 98795520. Throughput: 0: 1774.7, 1: 1773.8. Samples: 24706792. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:51,876][101941] Avg episode reward: [(0, '6.970'), (1, '8.390')] +[2023-10-08 13:41:52,146][102897] Updated weights for policy 0, policy_version 48240 (0.0008) +[2023-10-08 13:41:52,199][102898] Updated weights for policy 1, policy_version 48260 (0.0007) +[2023-10-08 13:41:52,518][102897] Updated weights for policy 0, policy_version 48250 (0.0007) +[2023-10-08 13:41:52,560][102898] Updated weights for policy 1, policy_version 48270 (0.0008) +[2023-10-08 13:41:52,928][102898] Updated weights for policy 1, policy_version 48280 (0.0007) +[2023-10-08 13:41:56,419][102897] Updated weights for policy 0, policy_version 48260 (0.0010) +[2023-10-08 13:41:56,753][102898] Updated weights for policy 1, policy_version 48290 (0.0007) +[2023-10-08 13:41:56,798][102897] Updated weights for policy 0, policy_version 48270 (0.0007) +[2023-10-08 13:41:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 98861056. Throughput: 0: 1776.8, 1: 1775.2. Samples: 24728920. Policy #0 lag: (min: 31.0, avg: 34.3, max: 63.0) +[2023-10-08 13:41:56,875][101941] Avg episode reward: [(0, '6.930'), (1, '8.590')] +[2023-10-08 13:41:57,122][102898] Updated weights for policy 1, policy_version 48300 (0.0008) +[2023-10-08 13:41:57,175][102897] Updated weights for policy 0, policy_version 48280 (0.0007) +[2023-10-08 13:41:57,488][102898] Updated weights for policy 1, policy_version 48310 (0.0008) +[2023-10-08 13:41:57,847][102898] Updated weights for policy 1, policy_version 48320 (0.0008) +[2023-10-08 13:42:00,876][102897] Updated weights for policy 0, policy_version 48290 (0.0008) +[2023-10-08 13:42:01,245][102897] Updated weights for policy 0, policy_version 48300 (0.0007) +[2023-10-08 13:42:01,552][102898] Updated weights for policy 1, policy_version 48330 (0.0008) +[2023-10-08 13:42:01,617][102897] Updated weights for policy 0, policy_version 48310 (0.0007) +[2023-10-08 13:42:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 98926592. Throughput: 0: 1783.5, 1: 1795.6. Samples: 24750058. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:42:01,876][101941] Avg episode reward: [(0, '6.900'), (1, '8.660')] +[2023-10-08 13:42:01,908][102898] Updated weights for policy 1, policy_version 48340 (0.0008) +[2023-10-08 13:42:01,989][102897] Updated weights for policy 0, policy_version 48320 (0.0008) +[2023-10-08 13:42:02,275][102898] Updated weights for policy 1, policy_version 48350 (0.0010) +[2023-10-08 13:42:05,930][102897] Updated weights for policy 0, policy_version 48330 (0.0008) +[2023-10-08 13:42:06,184][102898] Updated weights for policy 1, policy_version 48360 (0.0007) +[2023-10-08 13:42:06,306][102897] Updated weights for policy 0, policy_version 48340 (0.0008) +[2023-10-08 13:42:06,554][102898] Updated weights for policy 1, policy_version 48370 (0.0007) +[2023-10-08 13:42:06,669][102897] Updated weights for policy 0, policy_version 48350 (0.0008) +[2023-10-08 13:42:06,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 99024896. Throughput: 0: 1769.1, 1: 1773.4. Samples: 24760632. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:42:06,876][101941] Avg episode reward: [(0, '7.520'), (1, '9.010')] +[2023-10-08 13:42:06,931][102898] Updated weights for policy 1, policy_version 48380 (0.0010) +[2023-10-08 13:42:10,684][102897] Updated weights for policy 0, policy_version 48360 (0.0007) +[2023-10-08 13:42:10,726][102898] Updated weights for policy 1, policy_version 48390 (0.0008) +[2023-10-08 13:42:11,051][102897] Updated weights for policy 0, policy_version 48370 (0.0008) +[2023-10-08 13:42:11,100][102898] Updated weights for policy 1, policy_version 48400 (0.0008) +[2023-10-08 13:42:11,426][102897] Updated weights for policy 0, policy_version 48380 (0.0008) +[2023-10-08 13:42:11,459][102898] Updated weights for policy 1, policy_version 48410 (0.0008) +[2023-10-08 13:42:11,875][101941] Fps is (10 sec: 19661.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 99123200. Throughput: 0: 1791.4, 1: 1793.6. Samples: 24782250. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:42:11,875][101941] Avg episode reward: [(0, '8.050'), (1, '8.100')] +[2023-10-08 13:42:15,185][102898] Updated weights for policy 1, policy_version 48420 (0.0008) +[2023-10-08 13:42:15,288][102897] Updated weights for policy 0, policy_version 48390 (0.0007) +[2023-10-08 13:42:15,549][102898] Updated weights for policy 1, policy_version 48430 (0.0009) +[2023-10-08 13:42:15,660][102897] Updated weights for policy 0, policy_version 48400 (0.0007) +[2023-10-08 13:42:15,911][102898] Updated weights for policy 1, policy_version 48440 (0.0009) +[2023-10-08 13:42:16,035][102897] Updated weights for policy 0, policy_version 48410 (0.0009) +[2023-10-08 13:42:16,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 99188736. Throughput: 0: 1755.9, 1: 1768.3. Samples: 24801404. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:42:16,876][101941] Avg episode reward: [(0, '6.990'), (1, '8.010')] +[2023-10-08 13:42:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000048416_49577984.pth... +[2023-10-08 13:42:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000048448_49610752.pth... +[2023-10-08 13:42:16,920][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000046752_47874048.pth +[2023-10-08 13:42:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000046784_47906816.pth +[2023-10-08 13:42:19,664][102898] Updated weights for policy 1, policy_version 48450 (0.0008) +[2023-10-08 13:42:19,809][102897] Updated weights for policy 0, policy_version 48420 (0.0008) +[2023-10-08 13:42:20,036][102898] Updated weights for policy 1, policy_version 48460 (0.0008) +[2023-10-08 13:42:20,177][102897] Updated weights for policy 0, policy_version 48430 (0.0007) +[2023-10-08 13:42:20,392][102898] Updated weights for policy 1, policy_version 48470 (0.0008) +[2023-10-08 13:42:20,555][102897] Updated weights for policy 0, policy_version 48440 (0.0007) +[2023-10-08 13:42:20,758][102898] Updated weights for policy 1, policy_version 48480 (0.0008) +[2023-10-08 13:42:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 99254272. Throughput: 0: 1780.7, 1: 1786.4. Samples: 24814122. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:42:21,876][101941] Avg episode reward: [(0, '6.580'), (1, '8.110')] +[2023-10-08 13:42:24,407][102897] Updated weights for policy 0, policy_version 48450 (0.0007) +[2023-10-08 13:42:24,746][102898] Updated weights for policy 1, policy_version 48490 (0.0009) +[2023-10-08 13:42:24,783][102897] Updated weights for policy 0, policy_version 48460 (0.0008) +[2023-10-08 13:42:25,121][102898] Updated weights for policy 1, policy_version 48500 (0.0009) +[2023-10-08 13:42:25,156][102897] Updated weights for policy 0, policy_version 48470 (0.0008) +[2023-10-08 13:42:25,490][102898] Updated weights for policy 1, policy_version 48510 (0.0008) +[2023-10-08 13:42:25,517][102897] Updated weights for policy 0, policy_version 48480 (0.0008) +[2023-10-08 13:42:26,875][101941] Fps is (10 sec: 13108.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 99319808. Throughput: 0: 1757.9, 1: 1773.0. Samples: 24833862. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:42:26,875][101941] Avg episode reward: [(0, '7.390'), (1, '8.120')] +[2023-10-08 13:42:29,208][102897] Updated weights for policy 0, policy_version 48490 (0.0009) +[2023-10-08 13:42:29,398][102898] Updated weights for policy 1, policy_version 48520 (0.0007) +[2023-10-08 13:42:29,578][102897] Updated weights for policy 0, policy_version 48500 (0.0008) +[2023-10-08 13:42:29,760][102898] Updated weights for policy 1, policy_version 48530 (0.0007) +[2023-10-08 13:42:29,953][102897] Updated weights for policy 0, policy_version 48510 (0.0009) +[2023-10-08 13:42:30,123][102898] Updated weights for policy 1, policy_version 48540 (0.0007) +[2023-10-08 13:42:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 99385344. Throughput: 0: 1754.0, 1: 1774.1. Samples: 24855742. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:42:31,876][101941] Avg episode reward: [(0, '8.090'), (1, '8.310')] +[2023-10-08 13:42:33,829][102897] Updated weights for policy 0, policy_version 48520 (0.0007) +[2023-10-08 13:42:33,942][102898] Updated weights for policy 1, policy_version 48550 (0.0008) +[2023-10-08 13:42:34,202][102897] Updated weights for policy 0, policy_version 48530 (0.0008) +[2023-10-08 13:42:34,316][102898] Updated weights for policy 1, policy_version 48560 (0.0007) +[2023-10-08 13:42:34,574][102897] Updated weights for policy 0, policy_version 48540 (0.0008) +[2023-10-08 13:42:34,681][102898] Updated weights for policy 1, policy_version 48570 (0.0007) +[2023-10-08 13:42:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 99450880. Throughput: 0: 1764.2, 1: 1782.5. Samples: 24866396. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:42:36,876][101941] Avg episode reward: [(0, '7.360'), (1, '8.570')] +[2023-10-08 13:42:38,352][102898] Updated weights for policy 1, policy_version 48580 (0.0008) +[2023-10-08 13:42:38,374][102897] Updated weights for policy 0, policy_version 48550 (0.0008) +[2023-10-08 13:42:38,720][102898] Updated weights for policy 1, policy_version 48590 (0.0008) +[2023-10-08 13:42:38,748][102897] Updated weights for policy 0, policy_version 48560 (0.0008) +[2023-10-08 13:42:39,079][102898] Updated weights for policy 1, policy_version 48600 (0.0008) +[2023-10-08 13:42:39,113][102897] Updated weights for policy 0, policy_version 48570 (0.0010) +[2023-10-08 13:42:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 99516416. Throughput: 0: 1755.0, 1: 1773.6. Samples: 24887708. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:42:41,875][101941] Avg episode reward: [(0, '7.140'), (1, '8.960')] +[2023-10-08 13:42:42,860][102898] Updated weights for policy 1, policy_version 48610 (0.0009) +[2023-10-08 13:42:42,924][102897] Updated weights for policy 0, policy_version 48580 (0.0008) +[2023-10-08 13:42:43,223][102898] Updated weights for policy 1, policy_version 48620 (0.0008) +[2023-10-08 13:42:43,301][102897] Updated weights for policy 0, policy_version 48590 (0.0008) +[2023-10-08 13:42:43,590][102898] Updated weights for policy 1, policy_version 48630 (0.0007) +[2023-10-08 13:42:43,662][102897] Updated weights for policy 0, policy_version 48600 (0.0007) +[2023-10-08 13:42:43,954][102898] Updated weights for policy 1, policy_version 48640 (0.0007) +[2023-10-08 13:42:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 99581952. Throughput: 0: 1772.5, 1: 1777.8. Samples: 24909822. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:42:46,876][101941] Avg episode reward: [(0, '7.460'), (1, '9.250')] +[2023-10-08 13:42:47,311][102897] Updated weights for policy 0, policy_version 48610 (0.0009) +[2023-10-08 13:42:47,686][102897] Updated weights for policy 0, policy_version 48620 (0.0008) +[2023-10-08 13:42:47,833][102898] Updated weights for policy 1, policy_version 48650 (0.0008) +[2023-10-08 13:42:48,051][102897] Updated weights for policy 0, policy_version 48630 (0.0009) +[2023-10-08 13:42:48,201][102898] Updated weights for policy 1, policy_version 48660 (0.0008) +[2023-10-08 13:42:48,416][102897] Updated weights for policy 0, policy_version 48640 (0.0007) +[2023-10-08 13:42:48,564][102898] Updated weights for policy 1, policy_version 48670 (0.0009) +[2023-10-08 13:42:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 99647488. Throughput: 0: 1760.5, 1: 1773.2. Samples: 24919646. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:42:51,876][101941] Avg episode reward: [(0, '6.800'), (1, '8.820')] +[2023-10-08 13:42:52,284][102898] Updated weights for policy 1, policy_version 48680 (0.0009) +[2023-10-08 13:42:52,295][102897] Updated weights for policy 0, policy_version 48650 (0.0008) +[2023-10-08 13:42:52,652][102898] Updated weights for policy 1, policy_version 48690 (0.0008) +[2023-10-08 13:42:52,667][102897] Updated weights for policy 0, policy_version 48660 (0.0008) +[2023-10-08 13:42:53,009][102898] Updated weights for policy 1, policy_version 48700 (0.0008) +[2023-10-08 13:42:53,044][102897] Updated weights for policy 0, policy_version 48670 (0.0007) +[2023-10-08 13:42:56,838][102897] Updated weights for policy 0, policy_version 48680 (0.0009) +[2023-10-08 13:42:56,870][102898] Updated weights for policy 1, policy_version 48710 (0.0007) +[2023-10-08 13:42:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 99713024. Throughput: 0: 1767.7, 1: 1778.8. Samples: 24941842. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:42:56,876][101941] Avg episode reward: [(0, '7.050'), (1, '8.670')] +[2023-10-08 13:42:57,205][102897] Updated weights for policy 0, policy_version 48690 (0.0008) +[2023-10-08 13:42:57,256][102898] Updated weights for policy 1, policy_version 48720 (0.0010) +[2023-10-08 13:42:57,572][102897] Updated weights for policy 0, policy_version 48700 (0.0007) +[2023-10-08 13:42:57,617][102898] Updated weights for policy 1, policy_version 48730 (0.0007) +[2023-10-08 13:43:01,369][102898] Updated weights for policy 1, policy_version 48740 (0.0009) +[2023-10-08 13:43:01,386][102897] Updated weights for policy 0, policy_version 48710 (0.0007) +[2023-10-08 13:43:01,741][102898] Updated weights for policy 1, policy_version 48750 (0.0009) +[2023-10-08 13:43:01,759][102897] Updated weights for policy 0, policy_version 48720 (0.0008) +[2023-10-08 13:43:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 99778560. Throughput: 0: 1797.9, 1: 1798.3. Samples: 24963232. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 13:43:01,876][101941] Avg episode reward: [(0, '7.690'), (1, '8.450')] +[2023-10-08 13:43:02,106][102898] Updated weights for policy 1, policy_version 48760 (0.0007) +[2023-10-08 13:43:02,128][102897] Updated weights for policy 0, policy_version 48730 (0.0007) +[2023-10-08 13:43:05,796][102898] Updated weights for policy 1, policy_version 48770 (0.0008) +[2023-10-08 13:43:06,023][102897] Updated weights for policy 0, policy_version 48740 (0.0007) +[2023-10-08 13:43:06,165][102898] Updated weights for policy 1, policy_version 48780 (0.0008) +[2023-10-08 13:43:06,396][102897] Updated weights for policy 0, policy_version 48750 (0.0007) +[2023-10-08 13:43:06,531][102898] Updated weights for policy 1, policy_version 48790 (0.0008) +[2023-10-08 13:43:06,755][102897] Updated weights for policy 0, policy_version 48760 (0.0008) +[2023-10-08 13:43:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 13653.4, 300 sec: 14218.0). Total num frames: 99844096. Throughput: 0: 1772.5, 1: 1772.3. Samples: 24973640. Policy #0 lag: (min: 31.0, avg: 36.4, max: 63.0) +[2023-10-08 13:43:06,875][101941] Avg episode reward: [(0, '7.490'), (1, '8.330')] +[2023-10-08 13:43:06,892][102898] Updated weights for policy 1, policy_version 48800 (0.0007) +[2023-10-08 13:43:10,555][102897] Updated weights for policy 0, policy_version 48770 (0.0008) +[2023-10-08 13:43:10,567][102898] Updated weights for policy 1, policy_version 48810 (0.0007) +[2023-10-08 13:43:10,928][102897] Updated weights for policy 0, policy_version 48780 (0.0009) +[2023-10-08 13:43:10,931][102898] Updated weights for policy 1, policy_version 48820 (0.0007) +[2023-10-08 13:43:11,299][102897] Updated weights for policy 0, policy_version 48790 (0.0008) +[2023-10-08 13:43:11,307][102898] Updated weights for policy 1, policy_version 48830 (0.0009) +[2023-10-08 13:43:11,670][102897] Updated weights for policy 0, policy_version 48800 (0.0009) +[2023-10-08 13:43:11,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 99975168. Throughput: 0: 1798.8, 1: 1805.9. Samples: 24996072. Policy #0 lag: (min: 31.0, avg: 36.4, max: 63.0) +[2023-10-08 13:43:11,876][101941] Avg episode reward: [(0, '7.960'), (1, '7.940')] +[2023-10-08 13:43:15,032][102898] Updated weights for policy 1, policy_version 48840 (0.0009) +[2023-10-08 13:43:15,290][102897] Updated weights for policy 0, policy_version 48810 (0.0008) +[2023-10-08 13:43:15,395][102898] Updated weights for policy 1, policy_version 48850 (0.0007) +[2023-10-08 13:43:15,664][102897] Updated weights for policy 0, policy_version 48820 (0.0008) +[2023-10-08 13:43:15,760][102898] Updated weights for policy 1, policy_version 48860 (0.0007) +[2023-10-08 13:43:16,033][102897] Updated weights for policy 0, policy_version 48830 (0.0009) +[2023-10-08 13:43:16,875][101941] Fps is (10 sec: 19660.5, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 100040704. Throughput: 0: 1776.8, 1: 1782.2. Samples: 25015898. Policy #0 lag: (min: 31.0, avg: 36.4, max: 63.0) +[2023-10-08 13:43:16,876][101941] Avg episode reward: [(0, '7.890'), (1, '7.930')] +[2023-10-08 13:43:19,435][102898] Updated weights for policy 1, policy_version 48870 (0.0008) +[2023-10-08 13:43:19,796][102897] Updated weights for policy 0, policy_version 48840 (0.0008) +[2023-10-08 13:43:19,800][102898] Updated weights for policy 1, policy_version 48880 (0.0007) +[2023-10-08 13:43:20,167][102897] Updated weights for policy 0, policy_version 48850 (0.0007) +[2023-10-08 13:43:20,169][102898] Updated weights for policy 1, policy_version 48890 (0.0008) +[2023-10-08 13:43:20,541][102897] Updated weights for policy 0, policy_version 48860 (0.0008) +[2023-10-08 13:43:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 100106240. Throughput: 0: 1798.7, 1: 1797.9. Samples: 25028242. Policy #0 lag: (min: 31.0, avg: 36.4, max: 63.0) +[2023-10-08 13:43:21,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.370')] +[2023-10-08 13:43:24,006][102898] Updated weights for policy 1, policy_version 48900 (0.0009) +[2023-10-08 13:43:24,375][102898] Updated weights for policy 1, policy_version 48910 (0.0008) +[2023-10-08 13:43:24,434][102897] Updated weights for policy 0, policy_version 48870 (0.0008) +[2023-10-08 13:43:24,752][102898] Updated weights for policy 1, policy_version 48920 (0.0008) +[2023-10-08 13:43:24,804][102897] Updated weights for policy 0, policy_version 48880 (0.0008) +[2023-10-08 13:43:25,177][102897] Updated weights for policy 0, policy_version 48890 (0.0008) +[2023-10-08 13:43:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 100171776. Throughput: 0: 1778.2, 1: 1781.3. Samples: 25047888. Policy #0 lag: (min: 31.0, avg: 36.4, max: 63.0) +[2023-10-08 13:43:26,875][101941] Avg episode reward: [(0, '7.370'), (1, '7.700')] +[2023-10-08 13:43:28,618][102898] Updated weights for policy 1, policy_version 48930 (0.0008) +[2023-10-08 13:43:28,985][102898] Updated weights for policy 1, policy_version 48940 (0.0007) +[2023-10-08 13:43:29,016][102897] Updated weights for policy 0, policy_version 48900 (0.0008) +[2023-10-08 13:43:29,344][102898] Updated weights for policy 1, policy_version 48950 (0.0008) +[2023-10-08 13:43:29,393][102897] Updated weights for policy 0, policy_version 48910 (0.0009) +[2023-10-08 13:43:29,710][102898] Updated weights for policy 1, policy_version 48960 (0.0007) +[2023-10-08 13:43:29,764][102897] Updated weights for policy 0, policy_version 48920 (0.0008) +[2023-10-08 13:43:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 100237312. Throughput: 0: 1772.6, 1: 1783.5. Samples: 25069848. Policy #0 lag: (min: 31.0, avg: 36.4, max: 63.0) +[2023-10-08 13:43:31,876][101941] Avg episode reward: [(0, '7.670'), (1, '8.270')] +[2023-10-08 13:43:33,538][102897] Updated weights for policy 0, policy_version 48930 (0.0008) +[2023-10-08 13:43:33,620][102898] Updated weights for policy 1, policy_version 48970 (0.0009) +[2023-10-08 13:43:33,915][102897] Updated weights for policy 0, policy_version 48940 (0.0007) +[2023-10-08 13:43:33,978][102898] Updated weights for policy 1, policy_version 48980 (0.0010) +[2023-10-08 13:43:34,283][102897] Updated weights for policy 0, policy_version 48950 (0.0008) +[2023-10-08 13:43:34,348][102898] Updated weights for policy 1, policy_version 48990 (0.0007) +[2023-10-08 13:43:34,656][102897] Updated weights for policy 0, policy_version 48960 (0.0007) +[2023-10-08 13:43:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 100302848. Throughput: 0: 1778.0, 1: 1781.4. Samples: 25079820. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:43:36,876][101941] Avg episode reward: [(0, '7.110'), (1, '8.510')] +[2023-10-08 13:43:38,175][102898] Updated weights for policy 1, policy_version 49000 (0.0007) +[2023-10-08 13:43:38,534][102898] Updated weights for policy 1, policy_version 49010 (0.0009) +[2023-10-08 13:43:38,685][102897] Updated weights for policy 0, policy_version 48970 (0.0010) +[2023-10-08 13:43:38,906][102898] Updated weights for policy 1, policy_version 49020 (0.0008) +[2023-10-08 13:43:39,049][102897] Updated weights for policy 0, policy_version 48980 (0.0008) +[2023-10-08 13:43:39,417][102897] Updated weights for policy 0, policy_version 48990 (0.0008) +[2023-10-08 13:43:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 100368384. Throughput: 0: 1765.1, 1: 1783.2. Samples: 25101512. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:43:41,876][101941] Avg episode reward: [(0, '7.000'), (1, '8.610')] +[2023-10-08 13:43:42,687][102898] Updated weights for policy 1, policy_version 49030 (0.0010) +[2023-10-08 13:43:43,059][102898] Updated weights for policy 1, policy_version 49040 (0.0009) +[2023-10-08 13:43:43,225][102897] Updated weights for policy 0, policy_version 49000 (0.0007) +[2023-10-08 13:43:43,429][102898] Updated weights for policy 1, policy_version 49050 (0.0008) +[2023-10-08 13:43:43,599][102897] Updated weights for policy 0, policy_version 49010 (0.0008) +[2023-10-08 13:43:43,968][102897] Updated weights for policy 0, policy_version 49020 (0.0008) +[2023-10-08 13:43:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 100433920. Throughput: 0: 1771.3, 1: 1791.7. Samples: 25123564. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:43:46,875][101941] Avg episode reward: [(0, '7.440'), (1, '8.680')] +[2023-10-08 13:43:47,173][102898] Updated weights for policy 1, policy_version 49060 (0.0007) +[2023-10-08 13:43:47,543][102898] Updated weights for policy 1, policy_version 49070 (0.0007) +[2023-10-08 13:43:47,662][102897] Updated weights for policy 0, policy_version 49030 (0.0008) +[2023-10-08 13:43:47,911][102898] Updated weights for policy 1, policy_version 49080 (0.0008) +[2023-10-08 13:43:48,036][102897] Updated weights for policy 0, policy_version 49040 (0.0009) +[2023-10-08 13:43:48,401][102897] Updated weights for policy 0, policy_version 49050 (0.0009) +[2023-10-08 13:43:51,820][102898] Updated weights for policy 1, policy_version 49090 (0.0008) +[2023-10-08 13:43:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 100499456. Throughput: 0: 1766.5, 1: 1785.6. Samples: 25133486. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:43:51,876][101941] Avg episode reward: [(0, '7.430'), (1, '8.380')] +[2023-10-08 13:43:52,063][102897] Updated weights for policy 0, policy_version 49060 (0.0010) +[2023-10-08 13:43:52,182][102898] Updated weights for policy 1, policy_version 49100 (0.0007) +[2023-10-08 13:43:52,436][102897] Updated weights for policy 0, policy_version 49070 (0.0007) +[2023-10-08 13:43:52,553][102898] Updated weights for policy 1, policy_version 49110 (0.0008) +[2023-10-08 13:43:52,806][102897] Updated weights for policy 0, policy_version 49080 (0.0009) +[2023-10-08 13:43:52,912][102898] Updated weights for policy 1, policy_version 49120 (0.0009) +[2023-10-08 13:43:56,539][102897] Updated weights for policy 0, policy_version 49090 (0.0007) +[2023-10-08 13:43:56,651][102898] Updated weights for policy 1, policy_version 49130 (0.0008) +[2023-10-08 13:43:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 100564992. Throughput: 0: 1769.6, 1: 1777.6. Samples: 25155696. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:43:56,876][101941] Avg episode reward: [(0, '7.930'), (1, '8.940')] +[2023-10-08 13:43:56,909][102897] Updated weights for policy 0, policy_version 49100 (0.0008) +[2023-10-08 13:43:57,022][102898] Updated weights for policy 1, policy_version 49140 (0.0007) +[2023-10-08 13:43:57,283][102897] Updated weights for policy 0, policy_version 49110 (0.0007) +[2023-10-08 13:43:57,387][102898] Updated weights for policy 1, policy_version 49150 (0.0008) +[2023-10-08 13:43:57,644][102897] Updated weights for policy 0, policy_version 49120 (0.0008) +[2023-10-08 13:44:01,108][102898] Updated weights for policy 1, policy_version 49160 (0.0008) +[2023-10-08 13:44:01,440][102897] Updated weights for policy 0, policy_version 49130 (0.0008) +[2023-10-08 13:44:01,472][102898] Updated weights for policy 1, policy_version 49170 (0.0007) +[2023-10-08 13:44:01,805][102897] Updated weights for policy 0, policy_version 49140 (0.0008) +[2023-10-08 13:44:01,846][102898] Updated weights for policy 1, policy_version 49180 (0.0008) +[2023-10-08 13:44:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 100630528. Throughput: 0: 1791.6, 1: 1783.6. Samples: 25176782. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:44:01,876][101941] Avg episode reward: [(0, '8.810'), (1, '9.000')] +[2023-10-08 13:44:02,180][102897] Updated weights for policy 0, policy_version 49150 (0.0009) +[2023-10-08 13:44:02,250][102634] Saving new best policy, reward=8.810! +[2023-10-08 13:44:05,662][102898] Updated weights for policy 1, policy_version 49190 (0.0009) +[2023-10-08 13:44:06,026][102898] Updated weights for policy 1, policy_version 49200 (0.0008) +[2023-10-08 13:44:06,087][102897] Updated weights for policy 0, policy_version 49160 (0.0008) +[2023-10-08 13:44:06,393][102898] Updated weights for policy 1, policy_version 49210 (0.0007) +[2023-10-08 13:44:06,453][102897] Updated weights for policy 0, policy_version 49170 (0.0007) +[2023-10-08 13:44:06,815][102897] Updated weights for policy 0, policy_version 49180 (0.0007) +[2023-10-08 13:44:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 100728832. Throughput: 0: 1764.3, 1: 1776.1. Samples: 25187560. Policy #0 lag: (min: 21.0, avg: 26.9, max: 53.0) +[2023-10-08 13:44:06,876][101941] Avg episode reward: [(0, '8.170'), (1, '8.100')] +[2023-10-08 13:44:10,173][102898] Updated weights for policy 1, policy_version 49220 (0.0007) +[2023-10-08 13:44:10,445][102897] Updated weights for policy 0, policy_version 49190 (0.0009) +[2023-10-08 13:44:10,544][102898] Updated weights for policy 1, policy_version 49230 (0.0009) +[2023-10-08 13:44:10,823][102897] Updated weights for policy 0, policy_version 49200 (0.0008) +[2023-10-08 13:44:10,907][102898] Updated weights for policy 1, policy_version 49240 (0.0008) +[2023-10-08 13:44:11,190][102897] Updated weights for policy 0, policy_version 49210 (0.0008) +[2023-10-08 13:44:11,875][101941] Fps is (10 sec: 19661.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 100827136. Throughput: 0: 1793.6, 1: 1790.9. Samples: 25209192. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:44:11,875][101941] Avg episode reward: [(0, '7.240'), (1, '8.230')] +[2023-10-08 13:44:14,784][102898] Updated weights for policy 1, policy_version 49250 (0.0008) +[2023-10-08 13:44:14,977][102897] Updated weights for policy 0, policy_version 49220 (0.0007) +[2023-10-08 13:44:15,160][102898] Updated weights for policy 1, policy_version 49260 (0.0007) +[2023-10-08 13:44:15,348][102897] Updated weights for policy 0, policy_version 49230 (0.0007) +[2023-10-08 13:44:15,528][102898] Updated weights for policy 1, policy_version 49270 (0.0008) +[2023-10-08 13:44:15,713][102897] Updated weights for policy 0, policy_version 49240 (0.0008) +[2023-10-08 13:44:15,904][102898] Updated weights for policy 1, policy_version 49280 (0.0010) +[2023-10-08 13:44:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 100892672. Throughput: 0: 1772.2, 1: 1766.4. Samples: 25229088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:44:16,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.350')] +[2023-10-08 13:44:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000049280_50462720.pth... +[2023-10-08 13:44:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000049248_50429952.pth... +[2023-10-08 13:44:16,922][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000047616_48758784.pth +[2023-10-08 13:44:16,930][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000047584_48726016.pth +[2023-10-08 13:44:19,515][102897] Updated weights for policy 0, policy_version 49250 (0.0010) +[2023-10-08 13:44:19,791][102898] Updated weights for policy 1, policy_version 49290 (0.0008) +[2023-10-08 13:44:19,879][102897] Updated weights for policy 0, policy_version 49260 (0.0007) +[2023-10-08 13:44:20,152][102898] Updated weights for policy 1, policy_version 49300 (0.0008) +[2023-10-08 13:44:20,246][102897] Updated weights for policy 0, policy_version 49270 (0.0008) +[2023-10-08 13:44:20,513][102898] Updated weights for policy 1, policy_version 49310 (0.0010) +[2023-10-08 13:44:20,618][102897] Updated weights for policy 0, policy_version 49280 (0.0009) +[2023-10-08 13:44:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 100958208. Throughput: 0: 1800.9, 1: 1798.1. Samples: 25241774. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:44:21,876][101941] Avg episode reward: [(0, '7.940'), (1, '8.630')] +[2023-10-08 13:44:24,319][102897] Updated weights for policy 0, policy_version 49290 (0.0008) +[2023-10-08 13:44:24,321][102898] Updated weights for policy 1, policy_version 49320 (0.0008) +[2023-10-08 13:44:24,693][102898] Updated weights for policy 1, policy_version 49330 (0.0008) +[2023-10-08 13:44:24,697][102897] Updated weights for policy 0, policy_version 49300 (0.0009) +[2023-10-08 13:44:25,064][102897] Updated weights for policy 0, policy_version 49310 (0.0008) +[2023-10-08 13:44:25,067][102898] Updated weights for policy 1, policy_version 49340 (0.0007) +[2023-10-08 13:44:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 101023744. Throughput: 0: 1780.8, 1: 1761.1. Samples: 25260898. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:44:26,876][101941] Avg episode reward: [(0, '8.200'), (1, '8.200')] +[2023-10-08 13:44:28,891][102897] Updated weights for policy 0, policy_version 49320 (0.0008) +[2023-10-08 13:44:28,935][102898] Updated weights for policy 1, policy_version 49350 (0.0008) +[2023-10-08 13:44:29,263][102897] Updated weights for policy 0, policy_version 49330 (0.0007) +[2023-10-08 13:44:29,316][102898] Updated weights for policy 1, policy_version 49360 (0.0008) +[2023-10-08 13:44:29,635][102897] Updated weights for policy 0, policy_version 49340 (0.0007) +[2023-10-08 13:44:29,685][102898] Updated weights for policy 1, policy_version 49370 (0.0007) +[2023-10-08 13:44:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101089280. Throughput: 0: 1778.4, 1: 1757.2. Samples: 25282670. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:44:31,876][101941] Avg episode reward: [(0, '7.480'), (1, '8.330')] +[2023-10-08 13:44:33,417][102897] Updated weights for policy 0, policy_version 49350 (0.0007) +[2023-10-08 13:44:33,476][102898] Updated weights for policy 1, policy_version 49380 (0.0008) +[2023-10-08 13:44:33,787][102897] Updated weights for policy 0, policy_version 49360 (0.0008) +[2023-10-08 13:44:33,848][102898] Updated weights for policy 1, policy_version 49390 (0.0007) +[2023-10-08 13:44:34,162][102897] Updated weights for policy 0, policy_version 49370 (0.0008) +[2023-10-08 13:44:34,213][102898] Updated weights for policy 1, policy_version 49400 (0.0008) +[2023-10-08 13:44:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101154816. Throughput: 0: 1780.0, 1: 1762.0. Samples: 25292876. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:44:36,875][101941] Avg episode reward: [(0, '7.080'), (1, '8.370')] +[2023-10-08 13:44:37,884][102897] Updated weights for policy 0, policy_version 49380 (0.0008) +[2023-10-08 13:44:37,996][102898] Updated weights for policy 1, policy_version 49410 (0.0008) +[2023-10-08 13:44:38,252][102897] Updated weights for policy 0, policy_version 49390 (0.0010) +[2023-10-08 13:44:38,364][102898] Updated weights for policy 1, policy_version 49420 (0.0008) +[2023-10-08 13:44:38,627][102897] Updated weights for policy 0, policy_version 49400 (0.0008) +[2023-10-08 13:44:38,727][102898] Updated weights for policy 1, policy_version 49430 (0.0007) +[2023-10-08 13:44:39,101][102898] Updated weights for policy 1, policy_version 49440 (0.0010) +[2023-10-08 13:44:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101220352. Throughput: 0: 1773.5, 1: 1762.0. Samples: 25314790. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 13:44:41,876][101941] Avg episode reward: [(0, '7.650'), (1, '9.270')] +[2023-10-08 13:44:42,497][102897] Updated weights for policy 0, policy_version 49410 (0.0008) +[2023-10-08 13:44:42,759][102898] Updated weights for policy 1, policy_version 49450 (0.0008) +[2023-10-08 13:44:42,862][102897] Updated weights for policy 0, policy_version 49420 (0.0008) +[2023-10-08 13:44:43,126][102898] Updated weights for policy 1, policy_version 49460 (0.0007) +[2023-10-08 13:44:43,240][102897] Updated weights for policy 0, policy_version 49430 (0.0009) +[2023-10-08 13:44:43,501][102898] Updated weights for policy 1, policy_version 49470 (0.0008) +[2023-10-08 13:44:43,612][102897] Updated weights for policy 0, policy_version 49440 (0.0009) +[2023-10-08 13:44:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 101285888. Throughput: 0: 1779.3, 1: 1779.9. Samples: 25336944. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 13:44:46,876][101941] Avg episode reward: [(0, '7.200'), (1, '8.530')] +[2023-10-08 13:44:47,298][102897] Updated weights for policy 0, policy_version 49450 (0.0008) +[2023-10-08 13:44:47,375][102898] Updated weights for policy 1, policy_version 49480 (0.0008) +[2023-10-08 13:44:47,666][102897] Updated weights for policy 0, policy_version 49460 (0.0008) +[2023-10-08 13:44:47,742][102898] Updated weights for policy 1, policy_version 49490 (0.0008) +[2023-10-08 13:44:48,039][102897] Updated weights for policy 0, policy_version 49470 (0.0008) +[2023-10-08 13:44:48,106][102898] Updated weights for policy 1, policy_version 49500 (0.0009) +[2023-10-08 13:44:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101351424. Throughput: 0: 1771.7, 1: 1758.4. Samples: 25346418. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 13:44:51,876][101941] Avg episode reward: [(0, '7.130'), (1, '8.050')] +[2023-10-08 13:44:51,959][102898] Updated weights for policy 1, policy_version 49510 (0.0007) +[2023-10-08 13:44:52,063][102897] Updated weights for policy 0, policy_version 49480 (0.0010) +[2023-10-08 13:44:52,321][102898] Updated weights for policy 1, policy_version 49520 (0.0007) +[2023-10-08 13:44:52,428][102897] Updated weights for policy 0, policy_version 49490 (0.0007) +[2023-10-08 13:44:52,682][102898] Updated weights for policy 1, policy_version 49530 (0.0007) +[2023-10-08 13:44:52,803][102897] Updated weights for policy 0, policy_version 49500 (0.0008) +[2023-10-08 13:44:56,515][102898] Updated weights for policy 1, policy_version 49540 (0.0008) +[2023-10-08 13:44:56,756][102897] Updated weights for policy 0, policy_version 49510 (0.0008) +[2023-10-08 13:44:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101416960. Throughput: 0: 1769.8, 1: 1769.6. Samples: 25368466. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 13:44:56,877][101941] Avg episode reward: [(0, '7.010'), (1, '9.100')] +[2023-10-08 13:44:56,881][102898] Updated weights for policy 1, policy_version 49550 (0.0008) +[2023-10-08 13:44:57,123][102897] Updated weights for policy 0, policy_version 49520 (0.0008) +[2023-10-08 13:44:57,240][102898] Updated weights for policy 1, policy_version 49560 (0.0007) +[2023-10-08 13:44:57,487][102897] Updated weights for policy 0, policy_version 49530 (0.0007) +[2023-10-08 13:45:01,057][102898] Updated weights for policy 1, policy_version 49570 (0.0008) +[2023-10-08 13:45:01,333][102897] Updated weights for policy 0, policy_version 49540 (0.0007) +[2023-10-08 13:45:01,421][102898] Updated weights for policy 1, policy_version 49580 (0.0008) +[2023-10-08 13:45:01,700][102897] Updated weights for policy 0, policy_version 49550 (0.0008) +[2023-10-08 13:45:01,790][102898] Updated weights for policy 1, policy_version 49590 (0.0008) +[2023-10-08 13:45:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101482496. Throughput: 0: 1788.7, 1: 1780.5. Samples: 25389702. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 13:45:01,876][101941] Avg episode reward: [(0, '7.190'), (1, '9.660')] +[2023-10-08 13:45:02,077][102897] Updated weights for policy 0, policy_version 49560 (0.0008) +[2023-10-08 13:45:02,146][102760] Saving new best policy, reward=9.660! +[2023-10-08 13:45:02,150][102898] Updated weights for policy 1, policy_version 49600 (0.0008) +[2023-10-08 13:45:05,775][102898] Updated weights for policy 1, policy_version 49610 (0.0007) +[2023-10-08 13:45:05,883][102897] Updated weights for policy 0, policy_version 49570 (0.0008) +[2023-10-08 13:45:06,148][102898] Updated weights for policy 1, policy_version 49620 (0.0007) +[2023-10-08 13:45:06,249][102897] Updated weights for policy 0, policy_version 49580 (0.0007) +[2023-10-08 13:45:06,516][102898] Updated weights for policy 1, policy_version 49630 (0.0009) +[2023-10-08 13:45:06,624][102897] Updated weights for policy 0, policy_version 49590 (0.0007) +[2023-10-08 13:45:06,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101580800. Throughput: 0: 1759.3, 1: 1763.7. Samples: 25400308. Policy #0 lag: (min: 31.0, avg: 37.8, max: 63.0) +[2023-10-08 13:45:06,876][101941] Avg episode reward: [(0, '7.810'), (1, '8.320')] +[2023-10-08 13:45:06,994][102897] Updated weights for policy 0, policy_version 49600 (0.0007) +[2023-10-08 13:45:10,466][102898] Updated weights for policy 1, policy_version 49640 (0.0008) +[2023-10-08 13:45:10,732][102897] Updated weights for policy 0, policy_version 49610 (0.0007) +[2023-10-08 13:45:10,831][102898] Updated weights for policy 1, policy_version 49650 (0.0007) +[2023-10-08 13:45:11,098][102897] Updated weights for policy 0, policy_version 49620 (0.0010) +[2023-10-08 13:45:11,199][102898] Updated weights for policy 1, policy_version 49660 (0.0007) +[2023-10-08 13:45:11,473][102897] Updated weights for policy 0, policy_version 49630 (0.0008) +[2023-10-08 13:45:11,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 101679104. Throughput: 0: 1789.1, 1: 1791.1. Samples: 25422004. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:11,876][101941] Avg episode reward: [(0, '7.510'), (1, '7.410')] +[2023-10-08 13:45:15,010][102898] Updated weights for policy 1, policy_version 49670 (0.0007) +[2023-10-08 13:45:15,367][102897] Updated weights for policy 0, policy_version 49640 (0.0008) +[2023-10-08 13:45:15,394][102898] Updated weights for policy 1, policy_version 49680 (0.0009) +[2023-10-08 13:45:15,739][102897] Updated weights for policy 0, policy_version 49650 (0.0009) +[2023-10-08 13:45:15,762][102898] Updated weights for policy 1, policy_version 49690 (0.0008) +[2023-10-08 13:45:16,100][102897] Updated weights for policy 0, policy_version 49660 (0.0009) +[2023-10-08 13:45:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 101744640. Throughput: 0: 1756.6, 1: 1774.8. Samples: 25441586. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:16,876][101941] Avg episode reward: [(0, '7.330'), (1, '7.670')] +[2023-10-08 13:45:19,507][102898] Updated weights for policy 1, policy_version 49700 (0.0007) +[2023-10-08 13:45:19,822][102897] Updated weights for policy 0, policy_version 49670 (0.0008) +[2023-10-08 13:45:19,874][102898] Updated weights for policy 1, policy_version 49710 (0.0007) +[2023-10-08 13:45:20,198][102897] Updated weights for policy 0, policy_version 49680 (0.0008) +[2023-10-08 13:45:20,224][102898] Updated weights for policy 1, policy_version 49720 (0.0009) +[2023-10-08 13:45:20,568][102897] Updated weights for policy 0, policy_version 49690 (0.0008) +[2023-10-08 13:45:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 101810176. Throughput: 0: 1786.7, 1: 1793.1. Samples: 25453966. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:21,876][101941] Avg episode reward: [(0, '7.580'), (1, '8.810')] +[2023-10-08 13:45:24,022][102898] Updated weights for policy 1, policy_version 49730 (0.0011) +[2023-10-08 13:45:24,391][102898] Updated weights for policy 1, policy_version 49740 (0.0009) +[2023-10-08 13:45:24,541][102897] Updated weights for policy 0, policy_version 49700 (0.0008) +[2023-10-08 13:45:24,760][102898] Updated weights for policy 1, policy_version 49750 (0.0007) +[2023-10-08 13:45:24,919][102897] Updated weights for policy 0, policy_version 49710 (0.0009) +[2023-10-08 13:45:25,128][102898] Updated weights for policy 1, policy_version 49760 (0.0007) +[2023-10-08 13:45:25,287][102897] Updated weights for policy 0, policy_version 49720 (0.0009) +[2023-10-08 13:45:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 101875712. Throughput: 0: 1759.7, 1: 1766.3. Samples: 25473460. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:26,876][101941] Avg episode reward: [(0, '8.060'), (1, '9.430')] +[2023-10-08 13:45:28,788][102897] Updated weights for policy 0, policy_version 49730 (0.0009) +[2023-10-08 13:45:29,012][102898] Updated weights for policy 1, policy_version 49770 (0.0009) +[2023-10-08 13:45:29,152][102897] Updated weights for policy 0, policy_version 49740 (0.0008) +[2023-10-08 13:45:29,376][102898] Updated weights for policy 1, policy_version 49780 (0.0008) +[2023-10-08 13:45:29,526][102897] Updated weights for policy 0, policy_version 49750 (0.0008) +[2023-10-08 13:45:29,744][102898] Updated weights for policy 1, policy_version 49790 (0.0009) +[2023-10-08 13:45:29,894][102897] Updated weights for policy 0, policy_version 49760 (0.0007) +[2023-10-08 13:45:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 101941248. Throughput: 0: 1760.1, 1: 1765.2. Samples: 25495584. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:31,876][101941] Avg episode reward: [(0, '7.840'), (1, '9.120')] +[2023-10-08 13:45:33,461][102898] Updated weights for policy 1, policy_version 49800 (0.0008) +[2023-10-08 13:45:33,704][102897] Updated weights for policy 0, policy_version 49770 (0.0008) +[2023-10-08 13:45:33,827][102898] Updated weights for policy 1, policy_version 49810 (0.0009) +[2023-10-08 13:45:34,081][102897] Updated weights for policy 0, policy_version 49780 (0.0008) +[2023-10-08 13:45:34,186][102898] Updated weights for policy 1, policy_version 49820 (0.0008) +[2023-10-08 13:45:34,445][102897] Updated weights for policy 0, policy_version 49790 (0.0008) +[2023-10-08 13:45:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 102006784. Throughput: 0: 1767.8, 1: 1768.5. Samples: 25505552. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:36,876][101941] Avg episode reward: [(0, '7.390'), (1, '8.930')] +[2023-10-08 13:45:38,057][102898] Updated weights for policy 1, policy_version 49830 (0.0007) +[2023-10-08 13:45:38,089][102897] Updated weights for policy 0, policy_version 49800 (0.0008) +[2023-10-08 13:45:38,418][102898] Updated weights for policy 1, policy_version 49840 (0.0007) +[2023-10-08 13:45:38,460][102897] Updated weights for policy 0, policy_version 49810 (0.0007) +[2023-10-08 13:45:38,786][102898] Updated weights for policy 1, policy_version 49850 (0.0009) +[2023-10-08 13:45:38,834][102897] Updated weights for policy 0, policy_version 49820 (0.0008) +[2023-10-08 13:45:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 102072320. Throughput: 0: 1771.1, 1: 1768.2. Samples: 25527734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:45:41,876][101941] Avg episode reward: [(0, '7.520'), (1, '9.180')] +[2023-10-08 13:45:42,400][102898] Updated weights for policy 1, policy_version 49860 (0.0009) +[2023-10-08 13:45:42,688][102897] Updated weights for policy 0, policy_version 49830 (0.0008) +[2023-10-08 13:45:42,767][102898] Updated weights for policy 1, policy_version 49870 (0.0007) +[2023-10-08 13:45:43,059][102897] Updated weights for policy 0, policy_version 49840 (0.0009) +[2023-10-08 13:45:43,140][102898] Updated weights for policy 1, policy_version 49880 (0.0008) +[2023-10-08 13:45:43,434][102897] Updated weights for policy 0, policy_version 49850 (0.0008) +[2023-10-08 13:45:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 102137856. Throughput: 0: 1774.3, 1: 1783.6. Samples: 25549808. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 13:45:46,876][101941] Avg episode reward: [(0, '7.570'), (1, '8.850')] +[2023-10-08 13:45:47,009][102898] Updated weights for policy 1, policy_version 49890 (0.0008) +[2023-10-08 13:45:47,384][102898] Updated weights for policy 1, policy_version 49900 (0.0008) +[2023-10-08 13:45:47,404][102897] Updated weights for policy 0, policy_version 49860 (0.0008) +[2023-10-08 13:45:47,747][102898] Updated weights for policy 1, policy_version 49910 (0.0010) +[2023-10-08 13:45:47,775][102897] Updated weights for policy 0, policy_version 49870 (0.0007) +[2023-10-08 13:45:48,107][102898] Updated weights for policy 1, policy_version 49920 (0.0009) +[2023-10-08 13:45:48,142][102897] Updated weights for policy 0, policy_version 49880 (0.0009) +[2023-10-08 13:45:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102203392. Throughput: 0: 1766.0, 1: 1773.7. Samples: 25559592. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 13:45:51,876][101941] Avg episode reward: [(0, '7.830'), (1, '8.580')] +[2023-10-08 13:45:51,907][102898] Updated weights for policy 1, policy_version 49930 (0.0007) +[2023-10-08 13:45:51,925][102897] Updated weights for policy 0, policy_version 49890 (0.0007) +[2023-10-08 13:45:52,278][102898] Updated weights for policy 1, policy_version 49940 (0.0008) +[2023-10-08 13:45:52,292][102897] Updated weights for policy 0, policy_version 49900 (0.0009) +[2023-10-08 13:45:52,646][102898] Updated weights for policy 1, policy_version 49950 (0.0009) +[2023-10-08 13:45:52,671][102897] Updated weights for policy 0, policy_version 49910 (0.0008) +[2023-10-08 13:45:53,040][102897] Updated weights for policy 0, policy_version 49920 (0.0008) +[2023-10-08 13:45:56,506][102898] Updated weights for policy 1, policy_version 49960 (0.0010) +[2023-10-08 13:45:56,873][102898] Updated weights for policy 1, policy_version 49970 (0.0009) +[2023-10-08 13:45:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102268928. Throughput: 0: 1768.2, 1: 1782.0. Samples: 25581760. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 13:45:56,876][101941] Avg episode reward: [(0, '7.700'), (1, '8.690')] +[2023-10-08 13:45:56,882][102897] Updated weights for policy 0, policy_version 49930 (0.0007) +[2023-10-08 13:45:57,244][102898] Updated weights for policy 1, policy_version 49980 (0.0007) +[2023-10-08 13:45:57,247][102897] Updated weights for policy 0, policy_version 49940 (0.0008) +[2023-10-08 13:45:57,622][102897] Updated weights for policy 0, policy_version 49950 (0.0010) +[2023-10-08 13:46:01,137][102898] Updated weights for policy 1, policy_version 49990 (0.0008) +[2023-10-08 13:46:01,523][102898] Updated weights for policy 1, policy_version 50000 (0.0008) +[2023-10-08 13:46:01,647][102897] Updated weights for policy 0, policy_version 49960 (0.0008) +[2023-10-08 13:46:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 102334464. Throughput: 0: 1799.2, 1: 1788.1. Samples: 25603012. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 13:46:01,876][101941] Avg episode reward: [(0, '7.830'), (1, '9.040')] +[2023-10-08 13:46:01,886][102898] Updated weights for policy 1, policy_version 50010 (0.0008) +[2023-10-08 13:46:02,027][102897] Updated weights for policy 0, policy_version 49970 (0.0009) +[2023-10-08 13:46:02,399][102897] Updated weights for policy 0, policy_version 49980 (0.0007) +[2023-10-08 13:46:05,504][102898] Updated weights for policy 1, policy_version 50020 (0.0009) +[2023-10-08 13:46:05,874][102898] Updated weights for policy 1, policy_version 50030 (0.0009) +[2023-10-08 13:46:06,188][102897] Updated weights for policy 0, policy_version 49990 (0.0008) +[2023-10-08 13:46:06,247][102898] Updated weights for policy 1, policy_version 50040 (0.0010) +[2023-10-08 13:46:06,557][102897] Updated weights for policy 0, policy_version 50000 (0.0008) +[2023-10-08 13:46:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 102432768. Throughput: 0: 1763.7, 1: 1777.9. Samples: 25613338. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 13:46:06,875][101941] Avg episode reward: [(0, '6.800'), (1, '8.520')] +[2023-10-08 13:46:06,929][102897] Updated weights for policy 0, policy_version 50010 (0.0007) +[2023-10-08 13:46:09,995][102898] Updated weights for policy 1, policy_version 50050 (0.0008) +[2023-10-08 13:46:10,366][102898] Updated weights for policy 1, policy_version 50060 (0.0007) +[2023-10-08 13:46:10,615][102897] Updated weights for policy 0, policy_version 50020 (0.0008) +[2023-10-08 13:46:10,727][102898] Updated weights for policy 1, policy_version 50070 (0.0007) +[2023-10-08 13:46:10,976][102897] Updated weights for policy 0, policy_version 50030 (0.0009) +[2023-10-08 13:46:11,089][102898] Updated weights for policy 1, policy_version 50080 (0.0009) +[2023-10-08 13:46:11,347][102897] Updated weights for policy 0, policy_version 50040 (0.0011) +[2023-10-08 13:46:11,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102531072. Throughput: 0: 1800.6, 1: 1796.0. Samples: 25635304. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 13:46:11,875][101941] Avg episode reward: [(0, '7.420'), (1, '8.050')] +[2023-10-08 13:46:14,960][102898] Updated weights for policy 1, policy_version 50090 (0.0010) +[2023-10-08 13:46:15,067][102897] Updated weights for policy 0, policy_version 50050 (0.0010) +[2023-10-08 13:46:15,322][102898] Updated weights for policy 1, policy_version 50100 (0.0007) +[2023-10-08 13:46:15,430][102897] Updated weights for policy 0, policy_version 50060 (0.0009) +[2023-10-08 13:46:15,699][102898] Updated weights for policy 1, policy_version 50110 (0.0007) +[2023-10-08 13:46:15,808][102897] Updated weights for policy 0, policy_version 50070 (0.0008) +[2023-10-08 13:46:16,172][102897] Updated weights for policy 0, policy_version 50080 (0.0007) +[2023-10-08 13:46:16,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102596608. Throughput: 0: 1769.2, 1: 1783.0. Samples: 25655432. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:16,876][101941] Avg episode reward: [(0, '7.320'), (1, '8.250')] +[2023-10-08 13:46:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000050080_51281920.pth... +[2023-10-08 13:46:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000050112_51314688.pth... +[2023-10-08 13:46:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000048448_49610752.pth +[2023-10-08 13:46:16,929][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000050112_51314688.pth +[2023-10-08 13:46:16,933][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000048416_49577984.pth +[2023-10-08 13:46:16,939][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000050080_51281920.pth +[2023-10-08 13:46:19,457][102898] Updated weights for policy 1, policy_version 50120 (0.0009) +[2023-10-08 13:46:19,801][102897] Updated weights for policy 0, policy_version 50090 (0.0008) +[2023-10-08 13:46:19,826][102898] Updated weights for policy 1, policy_version 50130 (0.0008) +[2023-10-08 13:46:20,176][102897] Updated weights for policy 0, policy_version 50100 (0.0009) +[2023-10-08 13:46:20,185][102898] Updated weights for policy 1, policy_version 50140 (0.0009) +[2023-10-08 13:46:20,540][102897] Updated weights for policy 0, policy_version 50110 (0.0009) +[2023-10-08 13:46:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102662144. Throughput: 0: 1796.9, 1: 1806.3. Samples: 25667694. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:21,875][101941] Avg episode reward: [(0, '7.030'), (1, '9.150')] +[2023-10-08 13:46:24,049][102898] Updated weights for policy 1, policy_version 50150 (0.0009) +[2023-10-08 13:46:24,413][102898] Updated weights for policy 1, policy_version 50160 (0.0009) +[2023-10-08 13:46:24,418][102897] Updated weights for policy 0, policy_version 50120 (0.0009) +[2023-10-08 13:46:24,783][102898] Updated weights for policy 1, policy_version 50170 (0.0007) +[2023-10-08 13:46:24,788][102897] Updated weights for policy 0, policy_version 50130 (0.0008) +[2023-10-08 13:46:25,164][102897] Updated weights for policy 0, policy_version 50140 (0.0010) +[2023-10-08 13:46:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102727680. Throughput: 0: 1759.3, 1: 1774.9. Samples: 25686768. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:26,875][101941] Avg episode reward: [(0, '7.470'), (1, '9.620')] +[2023-10-08 13:46:28,621][102898] Updated weights for policy 1, policy_version 50180 (0.0007) +[2023-10-08 13:46:28,943][102897] Updated weights for policy 0, policy_version 50150 (0.0008) +[2023-10-08 13:46:28,994][102898] Updated weights for policy 1, policy_version 50190 (0.0008) +[2023-10-08 13:46:29,311][102897] Updated weights for policy 0, policy_version 50160 (0.0008) +[2023-10-08 13:46:29,348][102898] Updated weights for policy 1, policy_version 50200 (0.0008) +[2023-10-08 13:46:29,673][102897] Updated weights for policy 0, policy_version 50170 (0.0008) +[2023-10-08 13:46:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102793216. Throughput: 0: 1763.2, 1: 1774.4. Samples: 25708998. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:31,876][101941] Avg episode reward: [(0, '7.290'), (1, '8.910')] +[2023-10-08 13:46:33,126][102898] Updated weights for policy 1, policy_version 50210 (0.0007) +[2023-10-08 13:46:33,493][102898] Updated weights for policy 1, policy_version 50220 (0.0009) +[2023-10-08 13:46:33,613][102897] Updated weights for policy 0, policy_version 50180 (0.0010) +[2023-10-08 13:46:33,858][102898] Updated weights for policy 1, policy_version 50230 (0.0008) +[2023-10-08 13:46:33,972][102897] Updated weights for policy 0, policy_version 50190 (0.0010) +[2023-10-08 13:46:34,222][102898] Updated weights for policy 1, policy_version 50240 (0.0008) +[2023-10-08 13:46:34,342][102897] Updated weights for policy 0, policy_version 50200 (0.0008) +[2023-10-08 13:46:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102858752. Throughput: 0: 1771.2, 1: 1771.7. Samples: 25719022. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:36,876][101941] Avg episode reward: [(0, '7.830'), (1, '7.830')] +[2023-10-08 13:46:37,914][102898] Updated weights for policy 1, policy_version 50250 (0.0007) +[2023-10-08 13:46:38,132][102897] Updated weights for policy 0, policy_version 50210 (0.0008) +[2023-10-08 13:46:38,280][102898] Updated weights for policy 1, policy_version 50260 (0.0009) +[2023-10-08 13:46:38,497][102897] Updated weights for policy 0, policy_version 50220 (0.0008) +[2023-10-08 13:46:38,643][102898] Updated weights for policy 1, policy_version 50270 (0.0008) +[2023-10-08 13:46:38,872][102897] Updated weights for policy 0, policy_version 50230 (0.0008) +[2023-10-08 13:46:39,251][102897] Updated weights for policy 0, policy_version 50240 (0.0007) +[2023-10-08 13:46:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102924288. Throughput: 0: 1767.5, 1: 1777.5. Samples: 25741286. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:41,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.340')] +[2023-10-08 13:46:42,375][102898] Updated weights for policy 1, policy_version 50280 (0.0008) +[2023-10-08 13:46:42,738][102898] Updated weights for policy 1, policy_version 50290 (0.0009) +[2023-10-08 13:46:43,058][102897] Updated weights for policy 0, policy_version 50250 (0.0007) +[2023-10-08 13:46:43,101][102898] Updated weights for policy 1, policy_version 50300 (0.0008) +[2023-10-08 13:46:43,424][102897] Updated weights for policy 0, policy_version 50260 (0.0007) +[2023-10-08 13:46:43,801][102897] Updated weights for policy 0, policy_version 50270 (0.0008) +[2023-10-08 13:46:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 102989824. Throughput: 0: 1770.3, 1: 1802.9. Samples: 25763804. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:46:46,876][101941] Avg episode reward: [(0, '7.750'), (1, '9.370')] +[2023-10-08 13:46:46,925][102898] Updated weights for policy 1, policy_version 50310 (0.0008) +[2023-10-08 13:46:47,295][102898] Updated weights for policy 1, policy_version 50320 (0.0007) +[2023-10-08 13:46:47,658][102898] Updated weights for policy 1, policy_version 50330 (0.0007) +[2023-10-08 13:46:47,699][102897] Updated weights for policy 0, policy_version 50280 (0.0008) +[2023-10-08 13:46:48,077][102897] Updated weights for policy 0, policy_version 50290 (0.0008) +[2023-10-08 13:46:48,457][102897] Updated weights for policy 0, policy_version 50300 (0.0008) +[2023-10-08 13:46:51,265][102898] Updated weights for policy 1, policy_version 50340 (0.0007) +[2023-10-08 13:46:51,635][102898] Updated weights for policy 1, policy_version 50350 (0.0008) +[2023-10-08 13:46:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 103055360. Throughput: 0: 1770.2, 1: 1785.1. Samples: 25773326. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:46:51,876][101941] Avg episode reward: [(0, '7.790'), (1, '9.350')] +[2023-10-08 13:46:51,999][102898] Updated weights for policy 1, policy_version 50360 (0.0009) +[2023-10-08 13:46:52,384][102897] Updated weights for policy 0, policy_version 50310 (0.0008) +[2023-10-08 13:46:52,758][102897] Updated weights for policy 0, policy_version 50320 (0.0010) +[2023-10-08 13:46:53,127][102897] Updated weights for policy 0, policy_version 50330 (0.0010) +[2023-10-08 13:46:55,828][102898] Updated weights for policy 1, policy_version 50370 (0.0009) +[2023-10-08 13:46:56,199][102898] Updated weights for policy 1, policy_version 50380 (0.0009) +[2023-10-08 13:46:56,578][102898] Updated weights for policy 1, policy_version 50390 (0.0010) +[2023-10-08 13:46:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 103120896. Throughput: 0: 1754.3, 1: 1798.7. Samples: 25795188. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:46:56,875][101941] Avg episode reward: [(0, '8.140'), (1, '8.840')] +[2023-10-08 13:46:56,925][102897] Updated weights for policy 0, policy_version 50340 (0.0009) +[2023-10-08 13:46:56,933][102898] Updated weights for policy 1, policy_version 50400 (0.0009) +[2023-10-08 13:46:57,303][102897] Updated weights for policy 0, policy_version 50350 (0.0007) +[2023-10-08 13:46:57,666][102897] Updated weights for policy 0, policy_version 50360 (0.0008) +[2023-10-08 13:47:00,814][102898] Updated weights for policy 1, policy_version 50410 (0.0008) +[2023-10-08 13:47:01,193][102898] Updated weights for policy 1, policy_version 50420 (0.0009) +[2023-10-08 13:47:01,477][102897] Updated weights for policy 0, policy_version 50370 (0.0007) +[2023-10-08 13:47:01,559][102898] Updated weights for policy 1, policy_version 50430 (0.0007) +[2023-10-08 13:47:01,848][102897] Updated weights for policy 0, policy_version 50380 (0.0008) +[2023-10-08 13:47:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 103219200. Throughput: 0: 1789.2, 1: 1786.6. Samples: 25816342. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:47:01,876][101941] Avg episode reward: [(0, '7.150'), (1, '8.500')] +[2023-10-08 13:47:02,217][102897] Updated weights for policy 0, policy_version 50390 (0.0007) +[2023-10-08 13:47:02,589][102897] Updated weights for policy 0, policy_version 50400 (0.0009) +[2023-10-08 13:47:05,237][102898] Updated weights for policy 1, policy_version 50440 (0.0009) +[2023-10-08 13:47:05,605][102898] Updated weights for policy 1, policy_version 50450 (0.0008) +[2023-10-08 13:47:05,962][102898] Updated weights for policy 1, policy_version 50460 (0.0007) +[2023-10-08 13:47:06,227][102897] Updated weights for policy 0, policy_version 50410 (0.0008) +[2023-10-08 13:47:06,592][102897] Updated weights for policy 0, policy_version 50420 (0.0009) +[2023-10-08 13:47:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 103284736. Throughput: 0: 1755.7, 1: 1793.5. Samples: 25827408. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:47:06,876][101941] Avg episode reward: [(0, '6.820'), (1, '8.900')] +[2023-10-08 13:47:06,967][102897] Updated weights for policy 0, policy_version 50430 (0.0007) +[2023-10-08 13:47:09,641][102898] Updated weights for policy 1, policy_version 50470 (0.0007) +[2023-10-08 13:47:10,000][102898] Updated weights for policy 1, policy_version 50480 (0.0009) +[2023-10-08 13:47:10,374][102898] Updated weights for policy 1, policy_version 50490 (0.0010) +[2023-10-08 13:47:10,705][102897] Updated weights for policy 0, policy_version 50440 (0.0010) +[2023-10-08 13:47:11,067][102897] Updated weights for policy 0, policy_version 50450 (0.0011) +[2023-10-08 13:47:11,442][102897] Updated weights for policy 0, policy_version 50460 (0.0011) +[2023-10-08 13:47:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 103383040. Throughput: 0: 1800.5, 1: 1795.5. Samples: 25848590. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:47:11,876][101941] Avg episode reward: [(0, '7.230'), (1, '8.550')] +[2023-10-08 13:47:14,171][102898] Updated weights for policy 1, policy_version 50500 (0.0007) +[2023-10-08 13:47:14,534][102898] Updated weights for policy 1, policy_version 50510 (0.0008) +[2023-10-08 13:47:14,906][102898] Updated weights for policy 1, policy_version 50520 (0.0008) +[2023-10-08 13:47:15,299][102897] Updated weights for policy 0, policy_version 50470 (0.0010) +[2023-10-08 13:47:15,677][102897] Updated weights for policy 0, policy_version 50480 (0.0009) +[2023-10-08 13:47:16,040][102897] Updated weights for policy 0, policy_version 50490 (0.0008) +[2023-10-08 13:47:16,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 103448576. Throughput: 0: 1769.1, 1: 1793.9. Samples: 25869332. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:47:16,876][101941] Avg episode reward: [(0, '7.480'), (1, '8.500')] +[2023-10-08 13:47:18,774][102898] Updated weights for policy 1, policy_version 50530 (0.0008) +[2023-10-08 13:47:19,131][102898] Updated weights for policy 1, policy_version 50540 (0.0008) +[2023-10-08 13:47:19,501][102898] Updated weights for policy 1, policy_version 50550 (0.0007) +[2023-10-08 13:47:19,604][102897] Updated weights for policy 0, policy_version 50500 (0.0007) +[2023-10-08 13:47:19,873][102898] Updated weights for policy 1, policy_version 50560 (0.0007) +[2023-10-08 13:47:19,972][102897] Updated weights for policy 0, policy_version 50510 (0.0008) +[2023-10-08 13:47:20,353][102897] Updated weights for policy 0, policy_version 50520 (0.0012) +[2023-10-08 13:47:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 103514112. Throughput: 0: 1797.2, 1: 1804.8. Samples: 25881112. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 13:47:21,876][101941] Avg episode reward: [(0, '7.740'), (1, '9.320')] +[2023-10-08 13:47:23,750][102898] Updated weights for policy 1, policy_version 50570 (0.0007) +[2023-10-08 13:47:24,122][102898] Updated weights for policy 1, policy_version 50580 (0.0007) +[2023-10-08 13:47:24,188][102897] Updated weights for policy 0, policy_version 50530 (0.0008) +[2023-10-08 13:47:24,483][102898] Updated weights for policy 1, policy_version 50590 (0.0007) +[2023-10-08 13:47:24,561][102897] Updated weights for policy 0, policy_version 50540 (0.0008) +[2023-10-08 13:47:24,933][102897] Updated weights for policy 0, policy_version 50550 (0.0008) +[2023-10-08 13:47:25,310][102897] Updated weights for policy 0, policy_version 50560 (0.0009) +[2023-10-08 13:47:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 103579648. Throughput: 0: 1769.1, 1: 1786.9. Samples: 25901304. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:26,876][101941] Avg episode reward: [(0, '7.150'), (1, '9.540')] +[2023-10-08 13:47:28,123][102898] Updated weights for policy 1, policy_version 50600 (0.0008) +[2023-10-08 13:47:28,481][102898] Updated weights for policy 1, policy_version 50610 (0.0008) +[2023-10-08 13:47:28,855][102898] Updated weights for policy 1, policy_version 50620 (0.0007) +[2023-10-08 13:47:29,043][102897] Updated weights for policy 0, policy_version 50570 (0.0008) +[2023-10-08 13:47:29,427][102897] Updated weights for policy 0, policy_version 50580 (0.0007) +[2023-10-08 13:47:29,795][102897] Updated weights for policy 0, policy_version 50590 (0.0007) +[2023-10-08 13:47:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 103645184. Throughput: 0: 1772.3, 1: 1781.3. Samples: 25923718. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:31,876][101941] Avg episode reward: [(0, '6.890'), (1, '9.110')] +[2023-10-08 13:47:32,727][102898] Updated weights for policy 1, policy_version 50630 (0.0008) +[2023-10-08 13:47:33,109][102898] Updated weights for policy 1, policy_version 50640 (0.0007) +[2023-10-08 13:47:33,485][102898] Updated weights for policy 1, policy_version 50650 (0.0007) +[2023-10-08 13:47:33,699][102897] Updated weights for policy 0, policy_version 50600 (0.0007) +[2023-10-08 13:47:34,076][102897] Updated weights for policy 0, policy_version 50610 (0.0008) +[2023-10-08 13:47:34,449][102897] Updated weights for policy 0, policy_version 50620 (0.0007) +[2023-10-08 13:47:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 103710720. Throughput: 0: 1778.0, 1: 1784.0. Samples: 25933618. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:36,876][101941] Avg episode reward: [(0, '7.340'), (1, '8.690')] +[2023-10-08 13:47:37,160][102898] Updated weights for policy 1, policy_version 50660 (0.0008) +[2023-10-08 13:47:37,536][102898] Updated weights for policy 1, policy_version 50670 (0.0010) +[2023-10-08 13:47:37,904][102898] Updated weights for policy 1, policy_version 50680 (0.0008) +[2023-10-08 13:47:38,124][102897] Updated weights for policy 0, policy_version 50630 (0.0007) +[2023-10-08 13:47:38,494][102897] Updated weights for policy 0, policy_version 50640 (0.0010) +[2023-10-08 13:47:38,874][102897] Updated weights for policy 0, policy_version 50650 (0.0009) +[2023-10-08 13:47:41,605][102898] Updated weights for policy 1, policy_version 50690 (0.0009) +[2023-10-08 13:47:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 103776256. Throughput: 0: 1782.8, 1: 1784.9. Samples: 25955736. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:41,875][101941] Avg episode reward: [(0, '6.720'), (1, '7.990')] +[2023-10-08 13:47:41,975][102898] Updated weights for policy 1, policy_version 50700 (0.0011) +[2023-10-08 13:47:42,336][102898] Updated weights for policy 1, policy_version 50710 (0.0011) +[2023-10-08 13:47:42,698][102898] Updated weights for policy 1, policy_version 50720 (0.0008) +[2023-10-08 13:47:42,746][102897] Updated weights for policy 0, policy_version 50660 (0.0010) +[2023-10-08 13:47:43,110][102897] Updated weights for policy 0, policy_version 50670 (0.0010) +[2023-10-08 13:47:43,475][102897] Updated weights for policy 0, policy_version 50680 (0.0007) +[2023-10-08 13:47:46,455][102898] Updated weights for policy 1, policy_version 50730 (0.0007) +[2023-10-08 13:47:46,822][102898] Updated weights for policy 1, policy_version 50740 (0.0008) +[2023-10-08 13:47:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 103841792. Throughput: 0: 1776.4, 1: 1802.4. Samples: 25977386. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:46,875][101941] Avg episode reward: [(0, '6.960'), (1, '8.660')] +[2023-10-08 13:47:47,183][102898] Updated weights for policy 1, policy_version 50750 (0.0009) +[2023-10-08 13:47:47,195][102897] Updated weights for policy 0, policy_version 50690 (0.0009) +[2023-10-08 13:47:47,568][102897] Updated weights for policy 0, policy_version 50700 (0.0009) +[2023-10-08 13:47:47,944][102897] Updated weights for policy 0, policy_version 50710 (0.0009) +[2023-10-08 13:47:48,311][102897] Updated weights for policy 0, policy_version 50720 (0.0007) +[2023-10-08 13:47:51,033][102898] Updated weights for policy 1, policy_version 50760 (0.0008) +[2023-10-08 13:47:51,405][102898] Updated weights for policy 1, policy_version 50770 (0.0008) +[2023-10-08 13:47:51,762][102898] Updated weights for policy 1, policy_version 50780 (0.0007) +[2023-10-08 13:47:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 103907328. Throughput: 0: 1777.3, 1: 1782.7. Samples: 25987606. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:51,876][101941] Avg episode reward: [(0, '7.510'), (1, '8.730')] +[2023-10-08 13:47:52,148][102897] Updated weights for policy 0, policy_version 50730 (0.0008) +[2023-10-08 13:47:52,520][102897] Updated weights for policy 0, policy_version 50740 (0.0010) +[2023-10-08 13:47:52,890][102897] Updated weights for policy 0, policy_version 50750 (0.0010) +[2023-10-08 13:47:55,511][102898] Updated weights for policy 1, policy_version 50790 (0.0008) +[2023-10-08 13:47:55,886][102898] Updated weights for policy 1, policy_version 50800 (0.0007) +[2023-10-08 13:47:56,255][102898] Updated weights for policy 1, policy_version 50810 (0.0007) +[2023-10-08 13:47:56,668][102897] Updated weights for policy 0, policy_version 50760 (0.0008) +[2023-10-08 13:47:56,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 104005632. Throughput: 0: 1769.9, 1: 1805.8. Samples: 26009494. Policy #0 lag: (min: 10.0, avg: 11.9, max: 40.0) +[2023-10-08 13:47:56,876][101941] Avg episode reward: [(0, '7.700'), (1, '7.980')] +[2023-10-08 13:47:57,039][102897] Updated weights for policy 0, policy_version 50770 (0.0007) +[2023-10-08 13:47:57,426][102897] Updated weights for policy 0, policy_version 50780 (0.0007) +[2023-10-08 13:48:00,020][102898] Updated weights for policy 1, policy_version 50820 (0.0007) +[2023-10-08 13:48:00,380][102898] Updated weights for policy 1, policy_version 50830 (0.0007) +[2023-10-08 13:48:00,754][102898] Updated weights for policy 1, policy_version 50840 (0.0007) +[2023-10-08 13:48:01,086][102897] Updated weights for policy 0, policy_version 50790 (0.0009) +[2023-10-08 13:48:01,457][102897] Updated weights for policy 0, policy_version 50800 (0.0008) +[2023-10-08 13:48:01,824][102897] Updated weights for policy 0, policy_version 50810 (0.0010) +[2023-10-08 13:48:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 104071168. Throughput: 0: 1789.5, 1: 1780.6. Samples: 26029986. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:01,876][101941] Avg episode reward: [(0, '8.210'), (1, '8.790')] +[2023-10-08 13:48:04,521][102898] Updated weights for policy 1, policy_version 50850 (0.0007) +[2023-10-08 13:48:04,884][102898] Updated weights for policy 1, policy_version 50860 (0.0009) +[2023-10-08 13:48:05,257][102898] Updated weights for policy 1, policy_version 50870 (0.0007) +[2023-10-08 13:48:05,614][102898] Updated weights for policy 1, policy_version 50880 (0.0007) +[2023-10-08 13:48:05,729][102897] Updated weights for policy 0, policy_version 50820 (0.0009) +[2023-10-08 13:48:06,096][102897] Updated weights for policy 0, policy_version 50830 (0.0007) +[2023-10-08 13:48:06,463][102897] Updated weights for policy 0, policy_version 50840 (0.0007) +[2023-10-08 13:48:06,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 104169472. Throughput: 0: 1764.7, 1: 1801.0. Samples: 26041570. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:06,875][101941] Avg episode reward: [(0, '7.700'), (1, '9.440')] +[2023-10-08 13:48:09,542][102898] Updated weights for policy 1, policy_version 50890 (0.0007) +[2023-10-08 13:48:09,921][102898] Updated weights for policy 1, policy_version 50900 (0.0009) +[2023-10-08 13:48:10,247][102897] Updated weights for policy 0, policy_version 50850 (0.0007) +[2023-10-08 13:48:10,286][102898] Updated weights for policy 1, policy_version 50910 (0.0008) +[2023-10-08 13:48:10,610][102897] Updated weights for policy 0, policy_version 50860 (0.0009) +[2023-10-08 13:48:10,978][102897] Updated weights for policy 0, policy_version 50870 (0.0008) +[2023-10-08 13:48:11,356][102897] Updated weights for policy 0, policy_version 50880 (0.0009) +[2023-10-08 13:48:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104235008. Throughput: 0: 1800.0, 1: 1777.6. Samples: 26062298. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:11,876][101941] Avg episode reward: [(0, '7.430'), (1, '9.230')] +[2023-10-08 13:48:13,979][102898] Updated weights for policy 1, policy_version 50920 (0.0008) +[2023-10-08 13:48:14,341][102898] Updated weights for policy 1, policy_version 50930 (0.0010) +[2023-10-08 13:48:14,711][102898] Updated weights for policy 1, policy_version 50940 (0.0010) +[2023-10-08 13:48:15,081][102897] Updated weights for policy 0, policy_version 50890 (0.0009) +[2023-10-08 13:48:15,449][102897] Updated weights for policy 0, policy_version 50900 (0.0008) +[2023-10-08 13:48:15,810][102897] Updated weights for policy 0, policy_version 50910 (0.0008) +[2023-10-08 13:48:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104300544. Throughput: 0: 1775.0, 1: 1779.4. Samples: 26083666. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:16,876][101941] Avg episode reward: [(0, '7.220'), (1, '8.600')] +[2023-10-08 13:48:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000050944_52166656.pth... +[2023-10-08 13:48:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000050912_52133888.pth... +[2023-10-08 13:48:16,928][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000049248_50429952.pth +[2023-10-08 13:48:16,928][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000049280_50462720.pth +[2023-10-08 13:48:18,659][102898] Updated weights for policy 1, policy_version 50950 (0.0007) +[2023-10-08 13:48:19,039][102898] Updated weights for policy 1, policy_version 50960 (0.0008) +[2023-10-08 13:48:19,409][102898] Updated weights for policy 1, policy_version 50970 (0.0008) +[2023-10-08 13:48:19,426][102897] Updated weights for policy 0, policy_version 50920 (0.0007) +[2023-10-08 13:48:19,810][102897] Updated weights for policy 0, policy_version 50930 (0.0007) +[2023-10-08 13:48:20,177][102897] Updated weights for policy 0, policy_version 50940 (0.0010) +[2023-10-08 13:48:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104366080. Throughput: 0: 1799.5, 1: 1779.5. Samples: 26094676. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:21,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.530')] +[2023-10-08 13:48:23,222][102898] Updated weights for policy 1, policy_version 50980 (0.0008) +[2023-10-08 13:48:23,594][102898] Updated weights for policy 1, policy_version 50990 (0.0009) +[2023-10-08 13:48:23,870][102897] Updated weights for policy 0, policy_version 50950 (0.0009) +[2023-10-08 13:48:23,966][102898] Updated weights for policy 1, policy_version 51000 (0.0008) +[2023-10-08 13:48:24,236][102897] Updated weights for policy 0, policy_version 50960 (0.0007) +[2023-10-08 13:48:24,607][102897] Updated weights for policy 0, policy_version 50970 (0.0010) +[2023-10-08 13:48:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104431616. Throughput: 0: 1779.7, 1: 1768.6. Samples: 26115412. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:26,876][101941] Avg episode reward: [(0, '8.250'), (1, '9.020')] +[2023-10-08 13:48:27,622][102898] Updated weights for policy 1, policy_version 51010 (0.0008) +[2023-10-08 13:48:27,992][102898] Updated weights for policy 1, policy_version 51020 (0.0009) +[2023-10-08 13:48:28,348][102898] Updated weights for policy 1, policy_version 51030 (0.0009) +[2023-10-08 13:48:28,534][102897] Updated weights for policy 0, policy_version 50980 (0.0010) +[2023-10-08 13:48:28,724][102898] Updated weights for policy 1, policy_version 51040 (0.0008) +[2023-10-08 13:48:28,912][102897] Updated weights for policy 0, policy_version 50990 (0.0009) +[2023-10-08 13:48:29,282][102897] Updated weights for policy 0, policy_version 51000 (0.0010) +[2023-10-08 13:48:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104497152. Throughput: 0: 1780.0, 1: 1776.1. Samples: 26137412. Policy #0 lag: (min: 31.0, avg: 33.5, max: 63.0) +[2023-10-08 13:48:31,876][101941] Avg episode reward: [(0, '7.650'), (1, '9.060')] +[2023-10-08 13:48:32,694][102898] Updated weights for policy 1, policy_version 51050 (0.0008) +[2023-10-08 13:48:33,061][102897] Updated weights for policy 0, policy_version 51010 (0.0009) +[2023-10-08 13:48:33,066][102898] Updated weights for policy 1, policy_version 51060 (0.0008) +[2023-10-08 13:48:33,432][102898] Updated weights for policy 1, policy_version 51070 (0.0007) +[2023-10-08 13:48:33,439][102897] Updated weights for policy 0, policy_version 51020 (0.0007) +[2023-10-08 13:48:33,814][102897] Updated weights for policy 0, policy_version 51030 (0.0010) +[2023-10-08 13:48:34,182][102897] Updated weights for policy 0, policy_version 51040 (0.0009) +[2023-10-08 13:48:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104562688. Throughput: 0: 1779.3, 1: 1765.1. Samples: 26147104. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:48:36,875][101941] Avg episode reward: [(0, '7.300'), (1, '9.470')] +[2023-10-08 13:48:37,132][102898] Updated weights for policy 1, policy_version 51080 (0.0007) +[2023-10-08 13:48:37,510][102898] Updated weights for policy 1, policy_version 51090 (0.0007) +[2023-10-08 13:48:37,868][102898] Updated weights for policy 1, policy_version 51100 (0.0008) +[2023-10-08 13:48:37,943][102897] Updated weights for policy 0, policy_version 51050 (0.0009) +[2023-10-08 13:48:38,312][102897] Updated weights for policy 0, policy_version 51060 (0.0009) +[2023-10-08 13:48:38,679][102897] Updated weights for policy 0, policy_version 51070 (0.0008) +[2023-10-08 13:48:41,596][102898] Updated weights for policy 1, policy_version 51110 (0.0008) +[2023-10-08 13:48:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104628224. Throughput: 0: 1787.8, 1: 1772.3. Samples: 26169698. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:48:41,875][101941] Avg episode reward: [(0, '7.550'), (1, '9.320')] +[2023-10-08 13:48:41,960][102898] Updated weights for policy 1, policy_version 51120 (0.0010) +[2023-10-08 13:48:42,327][102898] Updated weights for policy 1, policy_version 51130 (0.0010) +[2023-10-08 13:48:42,481][102897] Updated weights for policy 0, policy_version 51080 (0.0008) +[2023-10-08 13:48:42,845][102897] Updated weights for policy 0, policy_version 51090 (0.0007) +[2023-10-08 13:48:43,221][102897] Updated weights for policy 0, policy_version 51100 (0.0007) +[2023-10-08 13:48:46,017][102898] Updated weights for policy 1, policy_version 51140 (0.0008) +[2023-10-08 13:48:46,390][102898] Updated weights for policy 1, policy_version 51150 (0.0010) +[2023-10-08 13:48:46,758][102898] Updated weights for policy 1, policy_version 51160 (0.0008) +[2023-10-08 13:48:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104693760. Throughput: 0: 1798.0, 1: 1789.5. Samples: 26191422. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:48:46,875][101941] Avg episode reward: [(0, '7.280'), (1, '9.470')] +[2023-10-08 13:48:47,039][102897] Updated weights for policy 0, policy_version 51110 (0.0008) +[2023-10-08 13:48:47,405][102897] Updated weights for policy 0, policy_version 51120 (0.0008) +[2023-10-08 13:48:47,780][102897] Updated weights for policy 0, policy_version 51130 (0.0009) +[2023-10-08 13:48:50,492][102898] Updated weights for policy 1, policy_version 51170 (0.0008) +[2023-10-08 13:48:50,861][102898] Updated weights for policy 1, policy_version 51180 (0.0008) +[2023-10-08 13:48:51,222][102898] Updated weights for policy 1, policy_version 51190 (0.0008) +[2023-10-08 13:48:51,585][102898] Updated weights for policy 1, policy_version 51200 (0.0008) +[2023-10-08 13:48:51,681][102897] Updated weights for policy 0, policy_version 51140 (0.0008) +[2023-10-08 13:48:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 104792064. Throughput: 0: 1787.8, 1: 1774.7. Samples: 26201884. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:48:51,875][101941] Avg episode reward: [(0, '7.420'), (1, '8.890')] +[2023-10-08 13:48:52,060][102897] Updated weights for policy 0, policy_version 51150 (0.0010) +[2023-10-08 13:48:52,426][102897] Updated weights for policy 0, policy_version 51160 (0.0010) +[2023-10-08 13:48:55,178][102898] Updated weights for policy 1, policy_version 51210 (0.0007) +[2023-10-08 13:48:55,544][102898] Updated weights for policy 1, policy_version 51220 (0.0007) +[2023-10-08 13:48:55,914][102898] Updated weights for policy 1, policy_version 51230 (0.0008) +[2023-10-08 13:48:56,229][102897] Updated weights for policy 0, policy_version 51170 (0.0008) +[2023-10-08 13:48:56,599][102897] Updated weights for policy 0, policy_version 51180 (0.0009) +[2023-10-08 13:48:56,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 104857600. Throughput: 0: 1788.6, 1: 1800.3. Samples: 26223798. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:48:56,876][101941] Avg episode reward: [(0, '7.340'), (1, '7.780')] +[2023-10-08 13:48:56,976][102897] Updated weights for policy 0, policy_version 51190 (0.0010) +[2023-10-08 13:48:57,341][102897] Updated weights for policy 0, policy_version 51200 (0.0009) +[2023-10-08 13:48:59,793][102898] Updated weights for policy 1, policy_version 51240 (0.0009) +[2023-10-08 13:49:00,157][102898] Updated weights for policy 1, policy_version 51250 (0.0010) +[2023-10-08 13:49:00,523][102898] Updated weights for policy 1, policy_version 51260 (0.0010) +[2023-10-08 13:49:01,105][102897] Updated weights for policy 0, policy_version 51210 (0.0007) +[2023-10-08 13:49:01,479][102897] Updated weights for policy 0, policy_version 51220 (0.0009) +[2023-10-08 13:49:01,845][102897] Updated weights for policy 0, policy_version 51230 (0.0010) +[2023-10-08 13:49:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 104923136. Throughput: 0: 1791.5, 1: 1783.5. Samples: 26244540. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:01,875][101941] Avg episode reward: [(0, '7.250'), (1, '8.280')] +[2023-10-08 13:49:04,354][102898] Updated weights for policy 1, policy_version 51270 (0.0008) +[2023-10-08 13:49:04,741][102898] Updated weights for policy 1, policy_version 51280 (0.0007) +[2023-10-08 13:49:05,109][102898] Updated weights for policy 1, policy_version 51290 (0.0007) +[2023-10-08 13:49:05,629][102897] Updated weights for policy 0, policy_version 51240 (0.0009) +[2023-10-08 13:49:06,002][102897] Updated weights for policy 0, policy_version 51250 (0.0007) +[2023-10-08 13:49:06,367][102897] Updated weights for policy 0, policy_version 51260 (0.0008) +[2023-10-08 13:49:06,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 105021440. Throughput: 0: 1779.2, 1: 1803.1. Samples: 26255878. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:06,876][101941] Avg episode reward: [(0, '6.990'), (1, '9.190')] +[2023-10-08 13:49:08,872][102898] Updated weights for policy 1, policy_version 51300 (0.0009) +[2023-10-08 13:49:09,234][102898] Updated weights for policy 1, policy_version 51310 (0.0008) +[2023-10-08 13:49:09,605][102898] Updated weights for policy 1, policy_version 51320 (0.0008) +[2023-10-08 13:49:10,149][102897] Updated weights for policy 0, policy_version 51270 (0.0009) +[2023-10-08 13:49:10,531][102897] Updated weights for policy 0, policy_version 51280 (0.0007) +[2023-10-08 13:49:10,900][102897] Updated weights for policy 0, policy_version 51290 (0.0007) +[2023-10-08 13:49:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 105086976. Throughput: 0: 1789.4, 1: 1787.8. Samples: 26276388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:11,875][101941] Avg episode reward: [(0, '6.480'), (1, '8.610')] +[2023-10-08 13:49:13,311][102898] Updated weights for policy 1, policy_version 51330 (0.0008) +[2023-10-08 13:49:13,681][102898] Updated weights for policy 1, policy_version 51340 (0.0008) +[2023-10-08 13:49:14,052][102898] Updated weights for policy 1, policy_version 51350 (0.0008) +[2023-10-08 13:49:14,424][102898] Updated weights for policy 1, policy_version 51360 (0.0008) +[2023-10-08 13:49:14,517][102897] Updated weights for policy 0, policy_version 51300 (0.0007) +[2023-10-08 13:49:14,880][102897] Updated weights for policy 0, policy_version 51310 (0.0010) +[2023-10-08 13:49:15,253][102897] Updated weights for policy 0, policy_version 51320 (0.0009) +[2023-10-08 13:49:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 105152512. Throughput: 0: 1779.4, 1: 1791.2. Samples: 26298092. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:16,876][101941] Avg episode reward: [(0, '7.010'), (1, '8.690')] +[2023-10-08 13:49:18,168][102898] Updated weights for policy 1, policy_version 51370 (0.0008) +[2023-10-08 13:49:18,538][102898] Updated weights for policy 1, policy_version 51380 (0.0007) +[2023-10-08 13:49:18,897][102898] Updated weights for policy 1, policy_version 51390 (0.0007) +[2023-10-08 13:49:19,047][102897] Updated weights for policy 0, policy_version 51330 (0.0010) +[2023-10-08 13:49:19,416][102897] Updated weights for policy 0, policy_version 51340 (0.0010) +[2023-10-08 13:49:19,795][102897] Updated weights for policy 0, policy_version 51350 (0.0009) +[2023-10-08 13:49:20,153][102897] Updated weights for policy 0, policy_version 51360 (0.0009) +[2023-10-08 13:49:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 105218048. Throughput: 0: 1799.4, 1: 1795.6. Samples: 26308876. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:21,875][101941] Avg episode reward: [(0, '6.830'), (1, '8.900')] +[2023-10-08 13:49:22,651][102898] Updated weights for policy 1, policy_version 51400 (0.0009) +[2023-10-08 13:49:23,025][102898] Updated weights for policy 1, policy_version 51410 (0.0009) +[2023-10-08 13:49:23,392][102898] Updated weights for policy 1, policy_version 51420 (0.0009) +[2023-10-08 13:49:23,860][102897] Updated weights for policy 0, policy_version 51370 (0.0007) +[2023-10-08 13:49:24,231][102897] Updated weights for policy 0, policy_version 51380 (0.0007) +[2023-10-08 13:49:24,610][102897] Updated weights for policy 0, policy_version 51390 (0.0007) +[2023-10-08 13:49:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 105283584. Throughput: 0: 1772.8, 1: 1795.1. Samples: 26330254. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:26,876][101941] Avg episode reward: [(0, '6.380'), (1, '9.730')] +[2023-10-08 13:49:26,878][102760] Saving new best policy, reward=9.730! +[2023-10-08 13:49:27,251][102898] Updated weights for policy 1, policy_version 51430 (0.0008) +[2023-10-08 13:49:27,623][102898] Updated weights for policy 1, policy_version 51440 (0.0009) +[2023-10-08 13:49:27,997][102898] Updated weights for policy 1, policy_version 51450 (0.0008) +[2023-10-08 13:49:28,395][102897] Updated weights for policy 0, policy_version 51400 (0.0008) +[2023-10-08 13:49:28,764][102897] Updated weights for policy 0, policy_version 51410 (0.0010) +[2023-10-08 13:49:29,144][102897] Updated weights for policy 0, policy_version 51420 (0.0007) +[2023-10-08 13:49:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 105349120. Throughput: 0: 1780.7, 1: 1796.7. Samples: 26352404. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:31,875][101941] Avg episode reward: [(0, '7.230'), (1, '8.990')] +[2023-10-08 13:49:31,891][102898] Updated weights for policy 1, policy_version 51460 (0.0007) +[2023-10-08 13:49:32,257][102898] Updated weights for policy 1, policy_version 51470 (0.0007) +[2023-10-08 13:49:32,621][102898] Updated weights for policy 1, policy_version 51480 (0.0007) +[2023-10-08 13:49:32,789][102897] Updated weights for policy 0, policy_version 51430 (0.0009) +[2023-10-08 13:49:33,155][102897] Updated weights for policy 0, policy_version 51440 (0.0010) +[2023-10-08 13:49:33,535][102897] Updated weights for policy 0, policy_version 51450 (0.0008) +[2023-10-08 13:49:36,533][102898] Updated weights for policy 1, policy_version 51490 (0.0007) +[2023-10-08 13:49:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 105414656. Throughput: 0: 1780.0, 1: 1779.4. Samples: 26362058. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:36,876][101941] Avg episode reward: [(0, '8.160'), (1, '8.730')] +[2023-10-08 13:49:36,893][102898] Updated weights for policy 1, policy_version 51500 (0.0007) +[2023-10-08 13:49:37,259][102898] Updated weights for policy 1, policy_version 51510 (0.0007) +[2023-10-08 13:49:37,309][102897] Updated weights for policy 0, policy_version 51460 (0.0008) +[2023-10-08 13:49:37,624][102898] Updated weights for policy 1, policy_version 51520 (0.0008) +[2023-10-08 13:49:37,686][102897] Updated weights for policy 0, policy_version 51470 (0.0008) +[2023-10-08 13:49:38,053][102897] Updated weights for policy 0, policy_version 51480 (0.0011) +[2023-10-08 13:49:41,476][102898] Updated weights for policy 1, policy_version 51530 (0.0008) +[2023-10-08 13:49:41,803][102897] Updated weights for policy 0, policy_version 51490 (0.0009) +[2023-10-08 13:49:41,844][102898] Updated weights for policy 1, policy_version 51540 (0.0009) +[2023-10-08 13:49:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 105480192. Throughput: 0: 1778.9, 1: 1786.4. Samples: 26384238. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:41,876][101941] Avg episode reward: [(0, '7.900'), (1, '8.280')] +[2023-10-08 13:49:42,177][102897] Updated weights for policy 0, policy_version 51500 (0.0007) +[2023-10-08 13:49:42,220][102898] Updated weights for policy 1, policy_version 51550 (0.0008) +[2023-10-08 13:49:42,543][102897] Updated weights for policy 0, policy_version 51510 (0.0007) +[2023-10-08 13:49:42,911][102897] Updated weights for policy 0, policy_version 51520 (0.0008) +[2023-10-08 13:49:46,022][102898] Updated weights for policy 1, policy_version 51560 (0.0007) +[2023-10-08 13:49:46,385][102898] Updated weights for policy 1, policy_version 51570 (0.0008) +[2023-10-08 13:49:46,718][102897] Updated weights for policy 0, policy_version 51530 (0.0007) +[2023-10-08 13:49:46,747][102898] Updated weights for policy 1, policy_version 51580 (0.0008) +[2023-10-08 13:49:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 105545728. Throughput: 0: 1801.0, 1: 1779.8. Samples: 26405676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:49:46,876][101941] Avg episode reward: [(0, '7.080'), (1, '8.150')] +[2023-10-08 13:49:47,090][102897] Updated weights for policy 0, policy_version 51540 (0.0007) +[2023-10-08 13:49:47,479][102897] Updated weights for policy 0, policy_version 51550 (0.0008) +[2023-10-08 13:49:50,560][102898] Updated weights for policy 1, policy_version 51590 (0.0008) +[2023-10-08 13:49:50,935][102898] Updated weights for policy 1, policy_version 51600 (0.0009) +[2023-10-08 13:49:51,302][102898] Updated weights for policy 1, policy_version 51610 (0.0008) +[2023-10-08 13:49:51,353][102897] Updated weights for policy 0, policy_version 51560 (0.0007) +[2023-10-08 13:49:51,720][102897] Updated weights for policy 0, policy_version 51570 (0.0007) +[2023-10-08 13:49:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 105644032. Throughput: 0: 1785.4, 1: 1777.8. Samples: 26416222. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:49:51,875][101941] Avg episode reward: [(0, '7.210'), (1, '8.900')] +[2023-10-08 13:49:52,094][102897] Updated weights for policy 0, policy_version 51580 (0.0007) +[2023-10-08 13:49:55,057][102898] Updated weights for policy 1, policy_version 51620 (0.0007) +[2023-10-08 13:49:55,422][102898] Updated weights for policy 1, policy_version 51630 (0.0008) +[2023-10-08 13:49:55,790][102898] Updated weights for policy 1, policy_version 51640 (0.0008) +[2023-10-08 13:49:55,945][102897] Updated weights for policy 0, policy_version 51590 (0.0009) +[2023-10-08 13:49:56,321][102897] Updated weights for policy 0, policy_version 51600 (0.0008) +[2023-10-08 13:49:56,693][102897] Updated weights for policy 0, policy_version 51610 (0.0008) +[2023-10-08 13:49:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 105709568. Throughput: 0: 1793.9, 1: 1789.8. Samples: 26437654. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:49:56,876][101941] Avg episode reward: [(0, '7.490'), (1, '9.970')] +[2023-10-08 13:49:56,877][102760] Saving new best policy, reward=9.970! +[2023-10-08 13:49:59,669][102898] Updated weights for policy 1, policy_version 51650 (0.0007) +[2023-10-08 13:50:00,028][102898] Updated weights for policy 1, policy_version 51660 (0.0011) +[2023-10-08 13:50:00,395][102898] Updated weights for policy 1, policy_version 51670 (0.0009) +[2023-10-08 13:50:00,475][102897] Updated weights for policy 0, policy_version 51620 (0.0010) +[2023-10-08 13:50:00,757][102898] Updated weights for policy 1, policy_version 51680 (0.0007) +[2023-10-08 13:50:00,855][102897] Updated weights for policy 0, policy_version 51630 (0.0008) +[2023-10-08 13:50:01,228][102897] Updated weights for policy 0, policy_version 51640 (0.0008) +[2023-10-08 13:50:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 105807872. Throughput: 0: 1780.8, 1: 1764.0. Samples: 26457606. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:50:01,876][101941] Avg episode reward: [(0, '7.550'), (1, '8.710')] +[2023-10-08 13:50:04,629][102898] Updated weights for policy 1, policy_version 51690 (0.0007) +[2023-10-08 13:50:04,998][102898] Updated weights for policy 1, policy_version 51700 (0.0009) +[2023-10-08 13:50:05,046][102897] Updated weights for policy 0, policy_version 51650 (0.0007) +[2023-10-08 13:50:05,354][102898] Updated weights for policy 1, policy_version 51710 (0.0009) +[2023-10-08 13:50:05,415][102897] Updated weights for policy 0, policy_version 51660 (0.0007) +[2023-10-08 13:50:05,789][102897] Updated weights for policy 0, policy_version 51670 (0.0009) +[2023-10-08 13:50:06,158][102897] Updated weights for policy 0, policy_version 51680 (0.0010) +[2023-10-08 13:50:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 105873408. Throughput: 0: 1787.3, 1: 1786.6. Samples: 26469704. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:50:06,876][101941] Avg episode reward: [(0, '7.400'), (1, '8.980')] +[2023-10-08 13:50:09,054][102898] Updated weights for policy 1, policy_version 51720 (0.0009) +[2023-10-08 13:50:09,411][102898] Updated weights for policy 1, policy_version 51730 (0.0008) +[2023-10-08 13:50:09,780][102898] Updated weights for policy 1, policy_version 51740 (0.0007) +[2023-10-08 13:50:09,812][102897] Updated weights for policy 0, policy_version 51690 (0.0008) +[2023-10-08 13:50:10,179][102897] Updated weights for policy 0, policy_version 51700 (0.0008) +[2023-10-08 13:50:10,541][102897] Updated weights for policy 0, policy_version 51710 (0.0009) +[2023-10-08 13:50:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 105938944. Throughput: 0: 1786.7, 1: 1761.8. Samples: 26489938. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:50:11,876][101941] Avg episode reward: [(0, '7.560'), (1, '8.720')] +[2023-10-08 13:50:13,574][102898] Updated weights for policy 1, policy_version 51750 (0.0007) +[2023-10-08 13:50:13,938][102898] Updated weights for policy 1, policy_version 51760 (0.0008) +[2023-10-08 13:50:14,301][102898] Updated weights for policy 1, policy_version 51770 (0.0007) +[2023-10-08 13:50:14,339][102897] Updated weights for policy 0, policy_version 51720 (0.0009) +[2023-10-08 13:50:14,710][102897] Updated weights for policy 0, policy_version 51730 (0.0008) +[2023-10-08 13:50:15,072][102897] Updated weights for policy 0, policy_version 51740 (0.0008) +[2023-10-08 13:50:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106004480. Throughput: 0: 1768.0, 1: 1772.5. Samples: 26511728. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:50:16,876][101941] Avg episode reward: [(0, '6.750'), (1, '8.460')] +[2023-10-08 13:50:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000051744_52985856.pth... +[2023-10-08 13:50:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000051776_53018624.pth... +[2023-10-08 13:50:16,916][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000050080_51281920.pth +[2023-10-08 13:50:16,921][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000050112_51314688.pth +[2023-10-08 13:50:17,923][102898] Updated weights for policy 1, policy_version 51780 (0.0008) +[2023-10-08 13:50:18,286][102898] Updated weights for policy 1, policy_version 51790 (0.0009) +[2023-10-08 13:50:18,647][102898] Updated weights for policy 1, policy_version 51800 (0.0007) +[2023-10-08 13:50:18,873][102897] Updated weights for policy 0, policy_version 51750 (0.0009) +[2023-10-08 13:50:19,236][102897] Updated weights for policy 0, policy_version 51760 (0.0008) +[2023-10-08 13:50:19,610][102897] Updated weights for policy 0, policy_version 51770 (0.0008) +[2023-10-08 13:50:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 106070016. Throughput: 0: 1785.7, 1: 1773.2. Samples: 26522210. Policy #0 lag: (min: 31.0, avg: 33.8, max: 63.0) +[2023-10-08 13:50:21,876][101941] Avg episode reward: [(0, '6.620'), (1, '8.840')] +[2023-10-08 13:50:22,508][102898] Updated weights for policy 1, policy_version 51810 (0.0009) +[2023-10-08 13:50:22,865][102898] Updated weights for policy 1, policy_version 51820 (0.0009) +[2023-10-08 13:50:23,234][102898] Updated weights for policy 1, policy_version 51830 (0.0010) +[2023-10-08 13:50:23,391][102897] Updated weights for policy 0, policy_version 51780 (0.0008) +[2023-10-08 13:50:23,599][102898] Updated weights for policy 1, policy_version 51840 (0.0008) +[2023-10-08 13:50:23,753][102897] Updated weights for policy 0, policy_version 51790 (0.0009) +[2023-10-08 13:50:24,124][102897] Updated weights for policy 0, policy_version 51800 (0.0008) +[2023-10-08 13:50:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106135552. Throughput: 0: 1772.7, 1: 1776.8. Samples: 26543970. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:26,876][101941] Avg episode reward: [(0, '7.660'), (1, '8.970')] +[2023-10-08 13:50:27,139][102898] Updated weights for policy 1, policy_version 51850 (0.0007) +[2023-10-08 13:50:27,503][102898] Updated weights for policy 1, policy_version 51860 (0.0009) +[2023-10-08 13:50:27,807][102897] Updated weights for policy 0, policy_version 51810 (0.0008) +[2023-10-08 13:50:27,864][102898] Updated weights for policy 1, policy_version 51870 (0.0007) +[2023-10-08 13:50:28,171][102897] Updated weights for policy 0, policy_version 51820 (0.0010) +[2023-10-08 13:50:28,548][102897] Updated weights for policy 0, policy_version 51830 (0.0008) +[2023-10-08 13:50:28,909][102897] Updated weights for policy 0, policy_version 51840 (0.0007) +[2023-10-08 13:50:31,793][102898] Updated weights for policy 1, policy_version 51880 (0.0008) +[2023-10-08 13:50:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106201088. Throughput: 0: 1778.9, 1: 1796.7. Samples: 26566576. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:31,876][101941] Avg episode reward: [(0, '7.480'), (1, '9.600')] +[2023-10-08 13:50:32,154][102898] Updated weights for policy 1, policy_version 51890 (0.0007) +[2023-10-08 13:50:32,521][102898] Updated weights for policy 1, policy_version 51900 (0.0008) +[2023-10-08 13:50:32,586][102897] Updated weights for policy 0, policy_version 51850 (0.0007) +[2023-10-08 13:50:32,970][102897] Updated weights for policy 0, policy_version 51860 (0.0008) +[2023-10-08 13:50:33,345][102897] Updated weights for policy 0, policy_version 51870 (0.0010) +[2023-10-08 13:50:36,389][102898] Updated weights for policy 1, policy_version 51910 (0.0008) +[2023-10-08 13:50:36,762][102898] Updated weights for policy 1, policy_version 51920 (0.0008) +[2023-10-08 13:50:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106266624. Throughput: 0: 1779.4, 1: 1777.4. Samples: 26576280. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:36,875][101941] Avg episode reward: [(0, '7.860'), (1, '9.340')] +[2023-10-08 13:50:37,139][102898] Updated weights for policy 1, policy_version 51930 (0.0008) +[2023-10-08 13:50:37,371][102897] Updated weights for policy 0, policy_version 51880 (0.0009) +[2023-10-08 13:50:37,753][102897] Updated weights for policy 0, policy_version 51890 (0.0009) +[2023-10-08 13:50:38,119][102897] Updated weights for policy 0, policy_version 51900 (0.0010) +[2023-10-08 13:50:40,974][102898] Updated weights for policy 1, policy_version 51940 (0.0007) +[2023-10-08 13:50:41,343][102898] Updated weights for policy 1, policy_version 51950 (0.0008) +[2023-10-08 13:50:41,717][102898] Updated weights for policy 1, policy_version 51960 (0.0008) +[2023-10-08 13:50:41,854][102897] Updated weights for policy 0, policy_version 51910 (0.0008) +[2023-10-08 13:50:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106332160. Throughput: 0: 1780.8, 1: 1788.9. Samples: 26598288. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:41,876][101941] Avg episode reward: [(0, '7.530'), (1, '8.850')] +[2023-10-08 13:50:42,228][102897] Updated weights for policy 0, policy_version 51920 (0.0009) +[2023-10-08 13:50:42,600][102897] Updated weights for policy 0, policy_version 51930 (0.0010) +[2023-10-08 13:50:45,441][102898] Updated weights for policy 1, policy_version 51970 (0.0008) +[2023-10-08 13:50:45,814][102898] Updated weights for policy 1, policy_version 51980 (0.0010) +[2023-10-08 13:50:46,186][102898] Updated weights for policy 1, policy_version 51990 (0.0008) +[2023-10-08 13:50:46,360][102897] Updated weights for policy 0, policy_version 51940 (0.0009) +[2023-10-08 13:50:46,550][102898] Updated weights for policy 1, policy_version 52000 (0.0008) +[2023-10-08 13:50:46,730][102897] Updated weights for policy 0, policy_version 51950 (0.0009) +[2023-10-08 13:50:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 106430464. Throughput: 0: 1803.2, 1: 1786.0. Samples: 26619118. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:46,876][101941] Avg episode reward: [(0, '7.520'), (1, '9.780')] +[2023-10-08 13:50:47,099][102897] Updated weights for policy 0, policy_version 51960 (0.0010) +[2023-10-08 13:50:50,280][102898] Updated weights for policy 1, policy_version 52010 (0.0007) +[2023-10-08 13:50:50,641][102898] Updated weights for policy 1, policy_version 52020 (0.0008) +[2023-10-08 13:50:50,876][102897] Updated weights for policy 0, policy_version 51970 (0.0010) +[2023-10-08 13:50:51,010][102898] Updated weights for policy 1, policy_version 52030 (0.0008) +[2023-10-08 13:50:51,244][102897] Updated weights for policy 0, policy_version 51980 (0.0007) +[2023-10-08 13:50:51,613][102897] Updated weights for policy 0, policy_version 51990 (0.0008) +[2023-10-08 13:50:51,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 106496000. Throughput: 0: 1779.1, 1: 1790.3. Samples: 26630328. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:51,876][101941] Avg episode reward: [(0, '7.600'), (1, '9.640')] +[2023-10-08 13:50:51,973][102897] Updated weights for policy 0, policy_version 52000 (0.0008) +[2023-10-08 13:50:54,713][102898] Updated weights for policy 1, policy_version 52040 (0.0007) +[2023-10-08 13:50:55,072][102898] Updated weights for policy 1, policy_version 52050 (0.0009) +[2023-10-08 13:50:55,442][102898] Updated weights for policy 1, policy_version 52060 (0.0010) +[2023-10-08 13:50:55,858][102897] Updated weights for policy 0, policy_version 52010 (0.0007) +[2023-10-08 13:50:56,228][102897] Updated weights for policy 0, policy_version 52020 (0.0008) +[2023-10-08 13:50:56,605][102897] Updated weights for policy 0, policy_version 52030 (0.0008) +[2023-10-08 13:50:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 106594304. Throughput: 0: 1802.5, 1: 1787.0. Samples: 26651468. Policy #0 lag: (min: 5.0, avg: 6.1, max: 25.0) +[2023-10-08 13:50:56,876][101941] Avg episode reward: [(0, '7.080'), (1, '10.460')] +[2023-10-08 13:50:56,878][102760] Saving new best policy, reward=10.460! +[2023-10-08 13:50:58,999][102898] Updated weights for policy 1, policy_version 52070 (0.0008) +[2023-10-08 13:50:59,365][102898] Updated weights for policy 1, policy_version 52080 (0.0007) +[2023-10-08 13:50:59,732][102898] Updated weights for policy 1, policy_version 52090 (0.0007) +[2023-10-08 13:51:00,416][102897] Updated weights for policy 0, policy_version 52040 (0.0010) +[2023-10-08 13:51:00,790][102897] Updated weights for policy 0, policy_version 52050 (0.0010) +[2023-10-08 13:51:01,160][102897] Updated weights for policy 0, policy_version 52060 (0.0010) +[2023-10-08 13:51:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 106659840. Throughput: 0: 1779.7, 1: 1788.5. Samples: 26672298. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:01,876][101941] Avg episode reward: [(0, '7.120'), (1, '9.670')] +[2023-10-08 13:51:03,400][102898] Updated weights for policy 1, policy_version 52100 (0.0007) +[2023-10-08 13:51:03,771][102898] Updated weights for policy 1, policy_version 52110 (0.0008) +[2023-10-08 13:51:04,135][102898] Updated weights for policy 1, policy_version 52120 (0.0007) +[2023-10-08 13:51:04,905][102897] Updated weights for policy 0, policy_version 52070 (0.0008) +[2023-10-08 13:51:05,281][102897] Updated weights for policy 0, policy_version 52080 (0.0009) +[2023-10-08 13:51:05,647][102897] Updated weights for policy 0, policy_version 52090 (0.0009) +[2023-10-08 13:51:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106725376. Throughput: 0: 1796.8, 1: 1789.5. Samples: 26683590. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:06,876][101941] Avg episode reward: [(0, '8.150'), (1, '8.890')] +[2023-10-08 13:51:07,958][102898] Updated weights for policy 1, policy_version 52130 (0.0009) +[2023-10-08 13:51:08,320][102898] Updated weights for policy 1, policy_version 52140 (0.0009) +[2023-10-08 13:51:08,685][102898] Updated weights for policy 1, policy_version 52150 (0.0009) +[2023-10-08 13:51:09,055][102898] Updated weights for policy 1, policy_version 52160 (0.0010) +[2023-10-08 13:51:09,288][102897] Updated weights for policy 0, policy_version 52100 (0.0008) +[2023-10-08 13:51:09,661][102897] Updated weights for policy 0, policy_version 52110 (0.0007) +[2023-10-08 13:51:10,036][102897] Updated weights for policy 0, policy_version 52120 (0.0008) +[2023-10-08 13:51:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106790912. Throughput: 0: 1778.1, 1: 1785.4. Samples: 26704330. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:11,876][101941] Avg episode reward: [(0, '7.620'), (1, '8.770')] +[2023-10-08 13:51:13,077][102898] Updated weights for policy 1, policy_version 52170 (0.0008) +[2023-10-08 13:51:13,442][102898] Updated weights for policy 1, policy_version 52180 (0.0007) +[2023-10-08 13:51:13,808][102898] Updated weights for policy 1, policy_version 52190 (0.0007) +[2023-10-08 13:51:13,855][102897] Updated weights for policy 0, policy_version 52130 (0.0007) +[2023-10-08 13:51:14,225][102897] Updated weights for policy 0, policy_version 52140 (0.0009) +[2023-10-08 13:51:14,584][102897] Updated weights for policy 0, policy_version 52150 (0.0011) +[2023-10-08 13:51:14,955][102897] Updated weights for policy 0, policy_version 52160 (0.0010) +[2023-10-08 13:51:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106856448. Throughput: 0: 1769.6, 1: 1782.4. Samples: 26726414. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:16,876][101941] Avg episode reward: [(0, '7.130'), (1, '9.180')] +[2023-10-08 13:51:17,428][102898] Updated weights for policy 1, policy_version 52200 (0.0008) +[2023-10-08 13:51:17,782][102898] Updated weights for policy 1, policy_version 52210 (0.0009) +[2023-10-08 13:51:18,150][102898] Updated weights for policy 1, policy_version 52220 (0.0008) +[2023-10-08 13:51:18,683][102897] Updated weights for policy 0, policy_version 52170 (0.0008) +[2023-10-08 13:51:19,053][102897] Updated weights for policy 0, policy_version 52180 (0.0007) +[2023-10-08 13:51:19,423][102897] Updated weights for policy 0, policy_version 52190 (0.0008) +[2023-10-08 13:51:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106921984. Throughput: 0: 1772.4, 1: 1787.7. Samples: 26736488. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:21,876][101941] Avg episode reward: [(0, '7.620'), (1, '9.860')] +[2023-10-08 13:51:21,980][102898] Updated weights for policy 1, policy_version 52230 (0.0007) +[2023-10-08 13:51:22,338][102898] Updated weights for policy 1, policy_version 52240 (0.0007) +[2023-10-08 13:51:22,700][102898] Updated weights for policy 1, policy_version 52250 (0.0007) +[2023-10-08 13:51:23,223][102897] Updated weights for policy 0, policy_version 52200 (0.0010) +[2023-10-08 13:51:23,592][102897] Updated weights for policy 0, policy_version 52210 (0.0010) +[2023-10-08 13:51:23,968][102897] Updated weights for policy 0, policy_version 52220 (0.0011) +[2023-10-08 13:51:26,362][102898] Updated weights for policy 1, policy_version 52260 (0.0008) +[2023-10-08 13:51:26,728][102898] Updated weights for policy 1, policy_version 52270 (0.0008) +[2023-10-08 13:51:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 106987520. Throughput: 0: 1772.9, 1: 1793.9. Samples: 26758792. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:26,876][101941] Avg episode reward: [(0, '8.150'), (1, '9.330')] +[2023-10-08 13:51:27,097][102898] Updated weights for policy 1, policy_version 52280 (0.0007) +[2023-10-08 13:51:27,748][102897] Updated weights for policy 0, policy_version 52230 (0.0009) +[2023-10-08 13:51:28,117][102897] Updated weights for policy 0, policy_version 52240 (0.0007) +[2023-10-08 13:51:28,491][102897] Updated weights for policy 0, policy_version 52250 (0.0008) +[2023-10-08 13:51:30,978][102898] Updated weights for policy 1, policy_version 52290 (0.0008) +[2023-10-08 13:51:31,339][102898] Updated weights for policy 1, policy_version 52300 (0.0007) +[2023-10-08 13:51:31,711][102898] Updated weights for policy 1, policy_version 52310 (0.0007) +[2023-10-08 13:51:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 107053056. Throughput: 0: 1777.1, 1: 1807.2. Samples: 26780410. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:31,875][101941] Avg episode reward: [(0, '7.370'), (1, '10.030')] +[2023-10-08 13:51:32,078][102898] Updated weights for policy 1, policy_version 52320 (0.0007) +[2023-10-08 13:51:32,353][102897] Updated weights for policy 0, policy_version 52260 (0.0009) +[2023-10-08 13:51:32,721][102897] Updated weights for policy 0, policy_version 52270 (0.0010) +[2023-10-08 13:51:33,099][102897] Updated weights for policy 0, policy_version 52280 (0.0008) +[2023-10-08 13:51:35,688][102898] Updated weights for policy 1, policy_version 52330 (0.0007) +[2023-10-08 13:51:36,058][102898] Updated weights for policy 1, policy_version 52340 (0.0007) +[2023-10-08 13:51:36,427][102898] Updated weights for policy 1, policy_version 52350 (0.0007) +[2023-10-08 13:51:36,871][102897] Updated weights for policy 0, policy_version 52290 (0.0009) +[2023-10-08 13:51:36,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 107151360. Throughput: 0: 1774.9, 1: 1796.2. Samples: 26791030. Policy #0 lag: (min: 31.0, avg: 47.0, max: 63.0) +[2023-10-08 13:51:36,875][101941] Avg episode reward: [(0, '7.180'), (1, '9.270')] +[2023-10-08 13:51:37,243][102897] Updated weights for policy 0, policy_version 52300 (0.0007) +[2023-10-08 13:51:37,618][102897] Updated weights for policy 0, policy_version 52310 (0.0007) +[2023-10-08 13:51:37,997][102897] Updated weights for policy 0, policy_version 52320 (0.0008) +[2023-10-08 13:51:40,203][102898] Updated weights for policy 1, policy_version 52360 (0.0008) +[2023-10-08 13:51:40,562][102898] Updated weights for policy 1, policy_version 52370 (0.0009) +[2023-10-08 13:51:40,938][102898] Updated weights for policy 1, policy_version 52380 (0.0007) +[2023-10-08 13:51:41,737][102897] Updated weights for policy 0, policy_version 52330 (0.0007) +[2023-10-08 13:51:41,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 107216896. Throughput: 0: 1772.4, 1: 1809.6. Samples: 26812662. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:51:41,876][101941] Avg episode reward: [(0, '7.760'), (1, '8.840')] +[2023-10-08 13:51:42,113][102897] Updated weights for policy 0, policy_version 52340 (0.0008) +[2023-10-08 13:51:42,490][102897] Updated weights for policy 0, policy_version 52350 (0.0009) +[2023-10-08 13:51:44,837][102898] Updated weights for policy 1, policy_version 52390 (0.0007) +[2023-10-08 13:51:45,208][102898] Updated weights for policy 1, policy_version 52400 (0.0007) +[2023-10-08 13:51:45,575][102898] Updated weights for policy 1, policy_version 52410 (0.0008) +[2023-10-08 13:51:46,276][102897] Updated weights for policy 0, policy_version 52360 (0.0008) +[2023-10-08 13:51:46,647][102897] Updated weights for policy 0, policy_version 52370 (0.0011) +[2023-10-08 13:51:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 107282432. Throughput: 0: 1802.7, 1: 1788.0. Samples: 26833876. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:51:46,876][101941] Avg episode reward: [(0, '8.250'), (1, '8.860')] +[2023-10-08 13:51:47,024][102897] Updated weights for policy 0, policy_version 52380 (0.0010) +[2023-10-08 13:51:49,480][102898] Updated weights for policy 1, policy_version 52420 (0.0007) +[2023-10-08 13:51:49,844][102898] Updated weights for policy 1, policy_version 52430 (0.0007) +[2023-10-08 13:51:50,217][102898] Updated weights for policy 1, policy_version 52440 (0.0007) +[2023-10-08 13:51:50,679][102897] Updated weights for policy 0, policy_version 52390 (0.0009) +[2023-10-08 13:51:51,044][102897] Updated weights for policy 0, policy_version 52400 (0.0007) +[2023-10-08 13:51:51,407][102897] Updated weights for policy 0, policy_version 52410 (0.0009) +[2023-10-08 13:51:51,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 107380736. Throughput: 0: 1780.6, 1: 1812.4. Samples: 26845274. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:51:51,875][101941] Avg episode reward: [(0, '8.230'), (1, '8.770')] +[2023-10-08 13:51:53,795][102898] Updated weights for policy 1, policy_version 52450 (0.0007) +[2023-10-08 13:51:54,161][102898] Updated weights for policy 1, policy_version 52460 (0.0007) +[2023-10-08 13:51:54,522][102898] Updated weights for policy 1, policy_version 52470 (0.0007) +[2023-10-08 13:51:54,886][102898] Updated weights for policy 1, policy_version 52480 (0.0010) +[2023-10-08 13:51:55,209][102897] Updated weights for policy 0, policy_version 52420 (0.0008) +[2023-10-08 13:51:55,575][102897] Updated weights for policy 0, policy_version 52430 (0.0009) +[2023-10-08 13:51:55,950][102897] Updated weights for policy 0, policy_version 52440 (0.0008) +[2023-10-08 13:51:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 107446272. Throughput: 0: 1805.5, 1: 1794.4. Samples: 26866322. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:51:56,876][101941] Avg episode reward: [(0, '7.490'), (1, '8.160')] +[2023-10-08 13:51:58,623][102898] Updated weights for policy 1, policy_version 52490 (0.0010) +[2023-10-08 13:51:58,994][102898] Updated weights for policy 1, policy_version 52500 (0.0011) +[2023-10-08 13:51:59,365][102898] Updated weights for policy 1, policy_version 52510 (0.0009) +[2023-10-08 13:51:59,724][102897] Updated weights for policy 0, policy_version 52450 (0.0008) +[2023-10-08 13:52:00,098][102897] Updated weights for policy 0, policy_version 52460 (0.0007) +[2023-10-08 13:52:00,469][102897] Updated weights for policy 0, policy_version 52470 (0.0009) +[2023-10-08 13:52:00,846][102897] Updated weights for policy 0, policy_version 52480 (0.0010) +[2023-10-08 13:52:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 107511808. Throughput: 0: 1784.2, 1: 1796.7. Samples: 26887556. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:52:01,876][101941] Avg episode reward: [(0, '6.970'), (1, '8.830')] +[2023-10-08 13:52:03,112][102898] Updated weights for policy 1, policy_version 52520 (0.0008) +[2023-10-08 13:52:03,480][102898] Updated weights for policy 1, policy_version 52530 (0.0008) +[2023-10-08 13:52:03,851][102898] Updated weights for policy 1, policy_version 52540 (0.0009) +[2023-10-08 13:52:04,553][102897] Updated weights for policy 0, policy_version 52490 (0.0007) +[2023-10-08 13:52:04,932][102897] Updated weights for policy 0, policy_version 52500 (0.0008) +[2023-10-08 13:52:05,301][102897] Updated weights for policy 0, policy_version 52510 (0.0009) +[2023-10-08 13:52:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 107577344. Throughput: 0: 1812.6, 1: 1791.0. Samples: 26898650. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:52:06,876][101941] Avg episode reward: [(0, '7.120'), (1, '9.900')] +[2023-10-08 13:52:07,688][102898] Updated weights for policy 1, policy_version 52550 (0.0008) +[2023-10-08 13:52:08,070][102898] Updated weights for policy 1, policy_version 52560 (0.0008) +[2023-10-08 13:52:08,440][102898] Updated weights for policy 1, policy_version 52570 (0.0009) +[2023-10-08 13:52:09,117][102897] Updated weights for policy 0, policy_version 52520 (0.0009) +[2023-10-08 13:52:09,491][102897] Updated weights for policy 0, policy_version 52530 (0.0007) +[2023-10-08 13:52:09,864][102897] Updated weights for policy 0, policy_version 52540 (0.0007) +[2023-10-08 13:52:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 107642880. Throughput: 0: 1787.2, 1: 1783.4. Samples: 26919468. Policy #0 lag: (min: 22.0, avg: 27.0, max: 54.0) +[2023-10-08 13:52:11,875][101941] Avg episode reward: [(0, '7.580'), (1, '9.170')] +[2023-10-08 13:52:12,319][102898] Updated weights for policy 1, policy_version 52580 (0.0008) +[2023-10-08 13:52:12,680][102898] Updated weights for policy 1, policy_version 52590 (0.0009) +[2023-10-08 13:52:13,047][102898] Updated weights for policy 1, policy_version 52600 (0.0007) +[2023-10-08 13:52:13,563][102897] Updated weights for policy 0, policy_version 52550 (0.0009) +[2023-10-08 13:52:13,948][102897] Updated weights for policy 0, policy_version 52560 (0.0008) +[2023-10-08 13:52:14,319][102897] Updated weights for policy 0, policy_version 52570 (0.0007) +[2023-10-08 13:52:16,784][102898] Updated weights for policy 1, policy_version 52610 (0.0008) +[2023-10-08 13:52:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 107708416. Throughput: 0: 1787.0, 1: 1796.3. Samples: 26941656. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:16,876][101941] Avg episode reward: [(0, '7.250'), (1, '9.330')] +[2023-10-08 13:52:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000052576_53837824.pth... +[2023-10-08 13:52:16,912][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000050912_52133888.pth +[2023-10-08 13:52:17,146][102898] Updated weights for policy 1, policy_version 52620 (0.0007) +[2023-10-08 13:52:17,508][102898] Updated weights for policy 1, policy_version 52630 (0.0009) +[2023-10-08 13:52:17,872][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000052640_53903360.pth... +[2023-10-08 13:52:17,876][102898] Updated weights for policy 1, policy_version 52640 (0.0007) +[2023-10-08 13:52:17,900][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000050944_52166656.pth +[2023-10-08 13:52:18,072][102897] Updated weights for policy 0, policy_version 52580 (0.0008) +[2023-10-08 13:52:18,434][102897] Updated weights for policy 0, policy_version 52590 (0.0007) +[2023-10-08 13:52:18,812][102897] Updated weights for policy 0, policy_version 52600 (0.0009) +[2023-10-08 13:52:21,553][102898] Updated weights for policy 1, policy_version 52650 (0.0007) +[2023-10-08 13:52:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 107773952. Throughput: 0: 1789.3, 1: 1779.7. Samples: 26951636. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:21,876][101941] Avg episode reward: [(0, '7.030'), (1, '9.440')] +[2023-10-08 13:52:21,917][102898] Updated weights for policy 1, policy_version 52660 (0.0007) +[2023-10-08 13:52:22,295][102898] Updated weights for policy 1, policy_version 52670 (0.0009) +[2023-10-08 13:52:22,624][102897] Updated weights for policy 0, policy_version 52610 (0.0008) +[2023-10-08 13:52:22,995][102897] Updated weights for policy 0, policy_version 52620 (0.0008) +[2023-10-08 13:52:23,367][102897] Updated weights for policy 0, policy_version 52630 (0.0007) +[2023-10-08 13:52:23,735][102897] Updated weights for policy 0, policy_version 52640 (0.0010) +[2023-10-08 13:52:26,106][102898] Updated weights for policy 1, policy_version 52680 (0.0009) +[2023-10-08 13:52:26,471][102898] Updated weights for policy 1, policy_version 52690 (0.0009) +[2023-10-08 13:52:26,848][102898] Updated weights for policy 1, policy_version 52700 (0.0008) +[2023-10-08 13:52:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 107839488. Throughput: 0: 1789.8, 1: 1796.9. Samples: 26974062. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:26,876][101941] Avg episode reward: [(0, '7.120'), (1, '8.980')] +[2023-10-08 13:52:27,512][102897] Updated weights for policy 0, policy_version 52650 (0.0010) +[2023-10-08 13:52:27,895][102897] Updated weights for policy 0, policy_version 52660 (0.0009) +[2023-10-08 13:52:28,259][102897] Updated weights for policy 0, policy_version 52670 (0.0010) +[2023-10-08 13:52:30,591][102898] Updated weights for policy 1, policy_version 52710 (0.0008) +[2023-10-08 13:52:30,956][102898] Updated weights for policy 1, policy_version 52720 (0.0008) +[2023-10-08 13:52:31,337][102898] Updated weights for policy 1, policy_version 52730 (0.0007) +[2023-10-08 13:52:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 107937792. Throughput: 0: 1802.5, 1: 1785.8. Samples: 26995350. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:31,876][101941] Avg episode reward: [(0, '6.830'), (1, '9.350')] +[2023-10-08 13:52:32,052][102897] Updated weights for policy 0, policy_version 52680 (0.0008) +[2023-10-08 13:52:32,421][102897] Updated weights for policy 0, policy_version 52690 (0.0007) +[2023-10-08 13:52:32,789][102897] Updated weights for policy 0, policy_version 52700 (0.0007) +[2023-10-08 13:52:34,936][102898] Updated weights for policy 1, policy_version 52740 (0.0007) +[2023-10-08 13:52:35,307][102898] Updated weights for policy 1, policy_version 52750 (0.0008) +[2023-10-08 13:52:35,672][102898] Updated weights for policy 1, policy_version 52760 (0.0009) +[2023-10-08 13:52:36,441][102897] Updated weights for policy 0, policy_version 52710 (0.0009) +[2023-10-08 13:52:36,814][102897] Updated weights for policy 0, policy_version 52720 (0.0010) +[2023-10-08 13:52:36,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 108003328. Throughput: 0: 1790.2, 1: 1796.1. Samples: 27006660. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:36,875][101941] Avg episode reward: [(0, '6.660'), (1, '8.960')] +[2023-10-08 13:52:37,189][102897] Updated weights for policy 0, policy_version 52730 (0.0007) +[2023-10-08 13:52:39,353][102898] Updated weights for policy 1, policy_version 52770 (0.0007) +[2023-10-08 13:52:39,719][102898] Updated weights for policy 1, policy_version 52780 (0.0008) +[2023-10-08 13:52:40,093][102898] Updated weights for policy 1, policy_version 52790 (0.0007) +[2023-10-08 13:52:40,459][102898] Updated weights for policy 1, policy_version 52800 (0.0008) +[2023-10-08 13:52:40,877][102897] Updated weights for policy 0, policy_version 52740 (0.0007) +[2023-10-08 13:52:41,249][102897] Updated weights for policy 0, policy_version 52750 (0.0010) +[2023-10-08 13:52:41,611][102897] Updated weights for policy 0, policy_version 52760 (0.0008) +[2023-10-08 13:52:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 108068864. Throughput: 0: 1802.1, 1: 1787.3. Samples: 27027844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:41,876][101941] Avg episode reward: [(0, '7.160'), (1, '10.040')] +[2023-10-08 13:52:44,189][102898] Updated weights for policy 1, policy_version 52810 (0.0011) +[2023-10-08 13:52:44,557][102898] Updated weights for policy 1, policy_version 52820 (0.0007) +[2023-10-08 13:52:44,929][102898] Updated weights for policy 1, policy_version 52830 (0.0007) +[2023-10-08 13:52:45,340][102897] Updated weights for policy 0, policy_version 52770 (0.0009) +[2023-10-08 13:52:45,714][102897] Updated weights for policy 0, policy_version 52780 (0.0009) +[2023-10-08 13:52:46,078][102897] Updated weights for policy 0, policy_version 52790 (0.0007) +[2023-10-08 13:52:46,452][102897] Updated weights for policy 0, policy_version 52800 (0.0007) +[2023-10-08 13:52:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 108167168. Throughput: 0: 1798.9, 1: 1789.6. Samples: 27049040. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:46,876][101941] Avg episode reward: [(0, '7.550'), (1, '10.010')] +[2023-10-08 13:52:48,655][102898] Updated weights for policy 1, policy_version 52840 (0.0008) +[2023-10-08 13:52:49,015][102898] Updated weights for policy 1, policy_version 52850 (0.0007) +[2023-10-08 13:52:49,380][102898] Updated weights for policy 1, policy_version 52860 (0.0010) +[2023-10-08 13:52:50,087][102897] Updated weights for policy 0, policy_version 52810 (0.0009) +[2023-10-08 13:52:50,449][102897] Updated weights for policy 0, policy_version 52820 (0.0009) +[2023-10-08 13:52:50,834][102897] Updated weights for policy 0, policy_version 52830 (0.0007) +[2023-10-08 13:52:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 108232704. Throughput: 0: 1801.7, 1: 1795.4. Samples: 27060518. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:51,876][101941] Avg episode reward: [(0, '7.270'), (1, '8.560')] +[2023-10-08 13:52:53,201][102898] Updated weights for policy 1, policy_version 52870 (0.0011) +[2023-10-08 13:52:53,560][102898] Updated weights for policy 1, policy_version 52880 (0.0011) +[2023-10-08 13:52:53,932][102898] Updated weights for policy 1, policy_version 52890 (0.0010) +[2023-10-08 13:52:54,734][102897] Updated weights for policy 0, policy_version 52840 (0.0008) +[2023-10-08 13:52:55,108][102897] Updated weights for policy 0, policy_version 52850 (0.0009) +[2023-10-08 13:52:55,481][102897] Updated weights for policy 0, policy_version 52860 (0.0008) +[2023-10-08 13:52:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 108298240. Throughput: 0: 1805.1, 1: 1797.1. Samples: 27081564. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:52:56,876][101941] Avg episode reward: [(0, '6.740'), (1, '9.200')] +[2023-10-08 13:52:57,660][102898] Updated weights for policy 1, policy_version 52900 (0.0009) +[2023-10-08 13:52:58,054][102898] Updated weights for policy 1, policy_version 52910 (0.0008) +[2023-10-08 13:52:58,429][102898] Updated weights for policy 1, policy_version 52920 (0.0009) +[2023-10-08 13:52:59,411][102897] Updated weights for policy 0, policy_version 52870 (0.0009) +[2023-10-08 13:52:59,805][102897] Updated weights for policy 0, policy_version 52880 (0.0008) +[2023-10-08 13:53:00,179][102897] Updated weights for policy 0, policy_version 52890 (0.0008) +[2023-10-08 13:53:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 108363776. Throughput: 0: 1791.0, 1: 1797.6. Samples: 27103144. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:01,876][101941] Avg episode reward: [(0, '7.210'), (1, '9.580')] +[2023-10-08 13:53:02,272][102898] Updated weights for policy 1, policy_version 52930 (0.0009) +[2023-10-08 13:53:02,638][102898] Updated weights for policy 1, policy_version 52940 (0.0007) +[2023-10-08 13:53:03,010][102898] Updated weights for policy 1, policy_version 52950 (0.0007) +[2023-10-08 13:53:03,377][102898] Updated weights for policy 1, policy_version 52960 (0.0008) +[2023-10-08 13:53:03,989][102897] Updated weights for policy 0, policy_version 52900 (0.0008) +[2023-10-08 13:53:04,369][102897] Updated weights for policy 0, policy_version 52910 (0.0007) +[2023-10-08 13:53:04,740][102897] Updated weights for policy 0, policy_version 52920 (0.0008) +[2023-10-08 13:53:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 108429312. Throughput: 0: 1802.9, 1: 1796.8. Samples: 27113622. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:06,875][101941] Avg episode reward: [(0, '7.340'), (1, '9.100')] +[2023-10-08 13:53:07,199][102898] Updated weights for policy 1, policy_version 52970 (0.0009) +[2023-10-08 13:53:07,566][102898] Updated weights for policy 1, policy_version 52980 (0.0009) +[2023-10-08 13:53:07,937][102898] Updated weights for policy 1, policy_version 52990 (0.0007) +[2023-10-08 13:53:08,453][102897] Updated weights for policy 0, policy_version 52930 (0.0007) +[2023-10-08 13:53:08,833][102897] Updated weights for policy 0, policy_version 52940 (0.0007) +[2023-10-08 13:53:09,200][102897] Updated weights for policy 0, policy_version 52950 (0.0008) +[2023-10-08 13:53:09,577][102897] Updated weights for policy 0, policy_version 52960 (0.0009) +[2023-10-08 13:53:11,843][102898] Updated weights for policy 1, policy_version 53000 (0.0008) +[2023-10-08 13:53:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 108494848. Throughput: 0: 1781.4, 1: 1795.6. Samples: 27135028. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:11,876][101941] Avg episode reward: [(0, '7.200'), (1, '9.510')] +[2023-10-08 13:53:12,202][102898] Updated weights for policy 1, policy_version 53010 (0.0007) +[2023-10-08 13:53:12,567][102898] Updated weights for policy 1, policy_version 53020 (0.0008) +[2023-10-08 13:53:13,262][102897] Updated weights for policy 0, policy_version 52970 (0.0007) +[2023-10-08 13:53:13,638][102897] Updated weights for policy 0, policy_version 52980 (0.0009) +[2023-10-08 13:53:14,006][102897] Updated weights for policy 0, policy_version 52990 (0.0008) +[2023-10-08 13:53:16,225][102898] Updated weights for policy 1, policy_version 53030 (0.0007) +[2023-10-08 13:53:16,599][102898] Updated weights for policy 1, policy_version 53040 (0.0007) +[2023-10-08 13:53:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 108560384. Throughput: 0: 1775.8, 1: 1814.5. Samples: 27156912. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:16,876][101941] Avg episode reward: [(0, '7.260'), (1, '9.460')] +[2023-10-08 13:53:16,970][102898] Updated weights for policy 1, policy_version 53050 (0.0010) +[2023-10-08 13:53:17,688][102897] Updated weights for policy 0, policy_version 53000 (0.0007) +[2023-10-08 13:53:18,051][102897] Updated weights for policy 0, policy_version 53010 (0.0009) +[2023-10-08 13:53:18,425][102897] Updated weights for policy 0, policy_version 53020 (0.0010) +[2023-10-08 13:53:20,694][102898] Updated weights for policy 1, policy_version 53060 (0.0008) +[2023-10-08 13:53:21,062][102898] Updated weights for policy 1, policy_version 53070 (0.0007) +[2023-10-08 13:53:21,426][102898] Updated weights for policy 1, policy_version 53080 (0.0010) +[2023-10-08 13:53:21,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 108658688. Throughput: 0: 1778.3, 1: 1793.3. Samples: 27167380. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:21,875][101941] Avg episode reward: [(0, '7.120'), (1, '8.780')] +[2023-10-08 13:53:22,111][102897] Updated weights for policy 0, policy_version 53030 (0.0009) +[2023-10-08 13:53:22,488][102897] Updated weights for policy 0, policy_version 53040 (0.0009) +[2023-10-08 13:53:22,865][102897] Updated weights for policy 0, policy_version 53050 (0.0008) +[2023-10-08 13:53:25,260][102898] Updated weights for policy 1, policy_version 53090 (0.0008) +[2023-10-08 13:53:25,635][102898] Updated weights for policy 1, policy_version 53100 (0.0011) +[2023-10-08 13:53:25,998][102898] Updated weights for policy 1, policy_version 53110 (0.0010) +[2023-10-08 13:53:26,357][102898] Updated weights for policy 1, policy_version 53120 (0.0007) +[2023-10-08 13:53:26,615][102897] Updated weights for policy 0, policy_version 53060 (0.0008) +[2023-10-08 13:53:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 108724224. Throughput: 0: 1775.1, 1: 1815.3. Samples: 27189414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:26,876][101941] Avg episode reward: [(0, '7.780'), (1, '9.490')] +[2023-10-08 13:53:26,998][102897] Updated weights for policy 0, policy_version 53070 (0.0008) +[2023-10-08 13:53:27,369][102897] Updated weights for policy 0, policy_version 53080 (0.0007) +[2023-10-08 13:53:30,224][102898] Updated weights for policy 1, policy_version 53130 (0.0007) +[2023-10-08 13:53:30,596][102898] Updated weights for policy 1, policy_version 53140 (0.0008) +[2023-10-08 13:53:30,961][102898] Updated weights for policy 1, policy_version 53150 (0.0010) +[2023-10-08 13:53:31,305][102897] Updated weights for policy 0, policy_version 53090 (0.0008) +[2023-10-08 13:53:31,670][102897] Updated weights for policy 0, policy_version 53100 (0.0009) +[2023-10-08 13:53:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 108789760. Throughput: 0: 1792.4, 1: 1784.2. Samples: 27209986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:31,875][101941] Avg episode reward: [(0, '7.350'), (1, '9.660')] +[2023-10-08 13:53:32,040][102897] Updated weights for policy 0, policy_version 53110 (0.0010) +[2023-10-08 13:53:32,414][102897] Updated weights for policy 0, policy_version 53120 (0.0010) +[2023-10-08 13:53:34,763][102898] Updated weights for policy 1, policy_version 53160 (0.0007) +[2023-10-08 13:53:35,130][102898] Updated weights for policy 1, policy_version 53170 (0.0007) +[2023-10-08 13:53:35,498][102898] Updated weights for policy 1, policy_version 53180 (0.0008) +[2023-10-08 13:53:36,134][102897] Updated weights for policy 0, policy_version 53130 (0.0010) +[2023-10-08 13:53:36,512][102897] Updated weights for policy 0, policy_version 53140 (0.0007) +[2023-10-08 13:53:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 108855296. Throughput: 0: 1761.5, 1: 1811.0. Samples: 27221280. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:36,875][101941] Avg episode reward: [(0, '7.030'), (1, '9.720')] +[2023-10-08 13:53:36,882][102897] Updated weights for policy 0, policy_version 53150 (0.0007) +[2023-10-08 13:53:39,249][102898] Updated weights for policy 1, policy_version 53190 (0.0009) +[2023-10-08 13:53:39,617][102898] Updated weights for policy 1, policy_version 53200 (0.0009) +[2023-10-08 13:53:39,994][102898] Updated weights for policy 1, policy_version 53210 (0.0010) +[2023-10-08 13:53:40,695][102897] Updated weights for policy 0, policy_version 53160 (0.0008) +[2023-10-08 13:53:41,067][102897] Updated weights for policy 0, policy_version 53170 (0.0010) +[2023-10-08 13:53:41,441][102897] Updated weights for policy 0, policy_version 53180 (0.0008) +[2023-10-08 13:53:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 108953600. Throughput: 0: 1794.4, 1: 1778.4. Samples: 27242340. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:41,876][101941] Avg episode reward: [(0, '7.090'), (1, '9.220')] +[2023-10-08 13:53:43,930][102898] Updated weights for policy 1, policy_version 53220 (0.0008) +[2023-10-08 13:53:44,302][102898] Updated weights for policy 1, policy_version 53230 (0.0009) +[2023-10-08 13:53:44,666][102898] Updated weights for policy 1, policy_version 53240 (0.0007) +[2023-10-08 13:53:45,139][102897] Updated weights for policy 0, policy_version 53190 (0.0009) +[2023-10-08 13:53:45,511][102897] Updated weights for policy 0, policy_version 53200 (0.0008) +[2023-10-08 13:53:45,883][102897] Updated weights for policy 0, policy_version 53210 (0.0007) +[2023-10-08 13:53:46,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 109019136. Throughput: 0: 1776.1, 1: 1779.1. Samples: 27263130. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:46,876][101941] Avg episode reward: [(0, '7.240'), (1, '8.660')] +[2023-10-08 13:53:48,302][102898] Updated weights for policy 1, policy_version 53250 (0.0008) +[2023-10-08 13:53:48,671][102898] Updated weights for policy 1, policy_version 53260 (0.0008) +[2023-10-08 13:53:49,038][102898] Updated weights for policy 1, policy_version 53270 (0.0008) +[2023-10-08 13:53:49,399][102898] Updated weights for policy 1, policy_version 53280 (0.0008) +[2023-10-08 13:53:49,681][102897] Updated weights for policy 0, policy_version 53220 (0.0008) +[2023-10-08 13:53:50,056][102897] Updated weights for policy 0, policy_version 53230 (0.0008) +[2023-10-08 13:53:50,437][102897] Updated weights for policy 0, policy_version 53240 (0.0008) +[2023-10-08 13:53:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 109084672. Throughput: 0: 1792.6, 1: 1777.7. Samples: 27274286. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:51,876][101941] Avg episode reward: [(0, '7.840'), (1, '8.920')] +[2023-10-08 13:53:53,049][102898] Updated weights for policy 1, policy_version 53290 (0.0008) +[2023-10-08 13:53:53,413][102898] Updated weights for policy 1, policy_version 53300 (0.0007) +[2023-10-08 13:53:53,785][102898] Updated weights for policy 1, policy_version 53310 (0.0008) +[2023-10-08 13:53:54,255][102897] Updated weights for policy 0, policy_version 53250 (0.0009) +[2023-10-08 13:53:54,636][102897] Updated weights for policy 0, policy_version 53260 (0.0008) +[2023-10-08 13:53:55,002][102897] Updated weights for policy 0, policy_version 53270 (0.0007) +[2023-10-08 13:53:55,367][102897] Updated weights for policy 0, policy_version 53280 (0.0008) +[2023-10-08 13:53:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 109150208. Throughput: 0: 1781.1, 1: 1782.4. Samples: 27295388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:53:56,876][101941] Avg episode reward: [(0, '8.200'), (1, '8.610')] +[2023-10-08 13:53:57,527][102898] Updated weights for policy 1, policy_version 53320 (0.0009) +[2023-10-08 13:53:57,903][102898] Updated weights for policy 1, policy_version 53330 (0.0010) +[2023-10-08 13:53:58,278][102898] Updated weights for policy 1, policy_version 53340 (0.0009) +[2023-10-08 13:53:59,090][102897] Updated weights for policy 0, policy_version 53290 (0.0007) +[2023-10-08 13:53:59,462][102897] Updated weights for policy 0, policy_version 53300 (0.0008) +[2023-10-08 13:53:59,838][102897] Updated weights for policy 0, policy_version 53310 (0.0009) +[2023-10-08 13:54:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 109215744. Throughput: 0: 1780.4, 1: 1791.7. Samples: 27317658. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:54:01,876][101941] Avg episode reward: [(0, '7.830'), (1, '8.290')] +[2023-10-08 13:54:02,055][102898] Updated weights for policy 1, policy_version 53350 (0.0008) +[2023-10-08 13:54:02,419][102898] Updated weights for policy 1, policy_version 53360 (0.0009) +[2023-10-08 13:54:02,788][102898] Updated weights for policy 1, policy_version 53370 (0.0008) +[2023-10-08 13:54:03,656][102897] Updated weights for policy 0, policy_version 53320 (0.0007) +[2023-10-08 13:54:04,028][102897] Updated weights for policy 0, policy_version 53330 (0.0010) +[2023-10-08 13:54:04,412][102897] Updated weights for policy 0, policy_version 53340 (0.0007) +[2023-10-08 13:54:06,566][102898] Updated weights for policy 1, policy_version 53380 (0.0007) +[2023-10-08 13:54:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 109281280. Throughput: 0: 1787.6, 1: 1776.9. Samples: 27327784. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:06,876][101941] Avg episode reward: [(0, '7.480'), (1, '7.750')] +[2023-10-08 13:54:06,934][102898] Updated weights for policy 1, policy_version 53390 (0.0009) +[2023-10-08 13:54:07,291][102898] Updated weights for policy 1, policy_version 53400 (0.0009) +[2023-10-08 13:54:08,073][102897] Updated weights for policy 0, policy_version 53350 (0.0007) +[2023-10-08 13:54:08,441][102897] Updated weights for policy 0, policy_version 53360 (0.0007) +[2023-10-08 13:54:08,815][102897] Updated weights for policy 0, policy_version 53370 (0.0007) +[2023-10-08 13:54:11,068][102898] Updated weights for policy 1, policy_version 53410 (0.0010) +[2023-10-08 13:54:11,433][102898] Updated weights for policy 1, policy_version 53420 (0.0009) +[2023-10-08 13:54:11,803][102898] Updated weights for policy 1, policy_version 53430 (0.0007) +[2023-10-08 13:54:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 109346816. Throughput: 0: 1779.7, 1: 1785.6. Samples: 27349852. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:11,876][101941] Avg episode reward: [(0, '7.550'), (1, '8.240')] +[2023-10-08 13:54:12,169][102898] Updated weights for policy 1, policy_version 53440 (0.0007) +[2023-10-08 13:54:12,547][102897] Updated weights for policy 0, policy_version 53380 (0.0007) +[2023-10-08 13:54:12,925][102897] Updated weights for policy 0, policy_version 53390 (0.0008) +[2023-10-08 13:54:13,300][102897] Updated weights for policy 0, policy_version 53400 (0.0009) +[2023-10-08 13:54:16,037][102898] Updated weights for policy 1, policy_version 53450 (0.0010) +[2023-10-08 13:54:16,410][102898] Updated weights for policy 1, policy_version 53460 (0.0008) +[2023-10-08 13:54:16,778][102898] Updated weights for policy 1, policy_version 53470 (0.0008) +[2023-10-08 13:54:16,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 109445120. Throughput: 0: 1781.4, 1: 1791.9. Samples: 27370786. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:16,876][101941] Avg episode reward: [(0, '7.280'), (1, '9.050')] +[2023-10-08 13:54:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000053408_54689792.pth... +[2023-10-08 13:54:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000053472_54755328.pth... +[2023-10-08 13:54:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000051776_53018624.pth +[2023-10-08 13:54:16,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000051744_52985856.pth +[2023-10-08 13:54:17,204][102897] Updated weights for policy 0, policy_version 53410 (0.0007) +[2023-10-08 13:54:17,570][102897] Updated weights for policy 0, policy_version 53420 (0.0009) +[2023-10-08 13:54:17,940][102897] Updated weights for policy 0, policy_version 53430 (0.0009) +[2023-10-08 13:54:18,298][102897] Updated weights for policy 0, policy_version 53440 (0.0007) +[2023-10-08 13:54:20,419][102898] Updated weights for policy 1, policy_version 53480 (0.0010) +[2023-10-08 13:54:20,787][102898] Updated weights for policy 1, policy_version 53490 (0.0008) +[2023-10-08 13:54:21,162][102898] Updated weights for policy 1, policy_version 53500 (0.0011) +[2023-10-08 13:54:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 109510656. Throughput: 0: 1778.8, 1: 1780.7. Samples: 27381460. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:21,876][101941] Avg episode reward: [(0, '7.600'), (1, '10.310')] +[2023-10-08 13:54:22,118][102897] Updated weights for policy 0, policy_version 53450 (0.0009) +[2023-10-08 13:54:22,499][102897] Updated weights for policy 0, policy_version 53460 (0.0009) +[2023-10-08 13:54:22,864][102897] Updated weights for policy 0, policy_version 53470 (0.0008) +[2023-10-08 13:54:24,952][102898] Updated weights for policy 1, policy_version 53510 (0.0011) +[2023-10-08 13:54:25,314][102898] Updated weights for policy 1, policy_version 53520 (0.0008) +[2023-10-08 13:54:25,683][102898] Updated weights for policy 1, policy_version 53530 (0.0008) +[2023-10-08 13:54:26,575][102897] Updated weights for policy 0, policy_version 53480 (0.0007) +[2023-10-08 13:54:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 109576192. Throughput: 0: 1770.7, 1: 1797.1. Samples: 27402890. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:26,876][101941] Avg episode reward: [(0, '7.770'), (1, '9.000')] +[2023-10-08 13:54:26,947][102897] Updated weights for policy 0, policy_version 53490 (0.0009) +[2023-10-08 13:54:27,332][102897] Updated weights for policy 0, policy_version 53500 (0.0008) +[2023-10-08 13:54:29,297][102898] Updated weights for policy 1, policy_version 53540 (0.0007) +[2023-10-08 13:54:29,675][102898] Updated weights for policy 1, policy_version 53550 (0.0010) +[2023-10-08 13:54:30,042][102898] Updated weights for policy 1, policy_version 53560 (0.0009) +[2023-10-08 13:54:31,244][102897] Updated weights for policy 0, policy_version 53510 (0.0009) +[2023-10-08 13:54:31,628][102897] Updated weights for policy 0, policy_version 53520 (0.0008) +[2023-10-08 13:54:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 109641728. Throughput: 0: 1787.6, 1: 1785.5. Samples: 27423920. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:31,876][101941] Avg episode reward: [(0, '6.970'), (1, '9.120')] +[2023-10-08 13:54:31,996][102897] Updated weights for policy 0, policy_version 53530 (0.0007) +[2023-10-08 13:54:34,003][102898] Updated weights for policy 1, policy_version 53570 (0.0009) +[2023-10-08 13:54:34,372][102898] Updated weights for policy 1, policy_version 53580 (0.0010) +[2023-10-08 13:54:34,732][102898] Updated weights for policy 1, policy_version 53590 (0.0008) +[2023-10-08 13:54:35,087][102898] Updated weights for policy 1, policy_version 53600 (0.0007) +[2023-10-08 13:54:35,795][102897] Updated weights for policy 0, policy_version 53540 (0.0007) +[2023-10-08 13:54:36,173][102897] Updated weights for policy 0, policy_version 53550 (0.0010) +[2023-10-08 13:54:36,543][102897] Updated weights for policy 0, policy_version 53560 (0.0009) +[2023-10-08 13:54:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 109740032. Throughput: 0: 1762.0, 1: 1799.8. Samples: 27434564. Policy #0 lag: (min: 9.0, avg: 26.4, max: 41.0) +[2023-10-08 13:54:36,876][101941] Avg episode reward: [(0, '7.320'), (1, '8.960')] +[2023-10-08 13:54:38,829][102898] Updated weights for policy 1, policy_version 53610 (0.0009) +[2023-10-08 13:54:39,203][102898] Updated weights for policy 1, policy_version 53620 (0.0008) +[2023-10-08 13:54:39,564][102898] Updated weights for policy 1, policy_version 53630 (0.0007) +[2023-10-08 13:54:40,276][102897] Updated weights for policy 0, policy_version 53570 (0.0009) +[2023-10-08 13:54:40,655][102897] Updated weights for policy 0, policy_version 53580 (0.0008) +[2023-10-08 13:54:41,020][102897] Updated weights for policy 0, policy_version 53590 (0.0008) +[2023-10-08 13:54:41,394][102897] Updated weights for policy 0, policy_version 53600 (0.0009) +[2023-10-08 13:54:41,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 109805568. Throughput: 0: 1798.0, 1: 1778.8. Samples: 27456346. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:54:41,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.560')] +[2023-10-08 13:54:43,236][102898] Updated weights for policy 1, policy_version 53640 (0.0007) +[2023-10-08 13:54:43,609][102898] Updated weights for policy 1, policy_version 53650 (0.0007) +[2023-10-08 13:54:43,973][102898] Updated weights for policy 1, policy_version 53660 (0.0009) +[2023-10-08 13:54:45,155][102897] Updated weights for policy 0, policy_version 53610 (0.0007) +[2023-10-08 13:54:45,517][102897] Updated weights for policy 0, policy_version 53620 (0.0007) +[2023-10-08 13:54:45,889][102897] Updated weights for policy 0, policy_version 53630 (0.0010) +[2023-10-08 13:54:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 109871104. Throughput: 0: 1771.0, 1: 1784.9. Samples: 27477674. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:54:46,875][101941] Avg episode reward: [(0, '7.430'), (1, '8.660')] +[2023-10-08 13:54:47,602][102898] Updated weights for policy 1, policy_version 53670 (0.0010) +[2023-10-08 13:54:47,970][102898] Updated weights for policy 1, policy_version 53680 (0.0008) +[2023-10-08 13:54:48,336][102898] Updated weights for policy 1, policy_version 53690 (0.0010) +[2023-10-08 13:54:49,658][102897] Updated weights for policy 0, policy_version 53640 (0.0009) +[2023-10-08 13:54:50,021][102897] Updated weights for policy 0, policy_version 53650 (0.0009) +[2023-10-08 13:54:50,394][102897] Updated weights for policy 0, policy_version 53660 (0.0008) +[2023-10-08 13:54:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 109936640. Throughput: 0: 1793.1, 1: 1786.0. Samples: 27488844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:54:51,876][101941] Avg episode reward: [(0, '7.840'), (1, '9.000')] +[2023-10-08 13:54:52,134][102898] Updated weights for policy 1, policy_version 53700 (0.0007) +[2023-10-08 13:54:52,507][102898] Updated weights for policy 1, policy_version 53710 (0.0009) +[2023-10-08 13:54:52,888][102898] Updated weights for policy 1, policy_version 53720 (0.0008) +[2023-10-08 13:54:54,014][102897] Updated weights for policy 0, policy_version 53670 (0.0007) +[2023-10-08 13:54:54,389][102897] Updated weights for policy 0, policy_version 53680 (0.0008) +[2023-10-08 13:54:54,749][102897] Updated weights for policy 0, policy_version 53690 (0.0008) +[2023-10-08 13:54:56,702][102898] Updated weights for policy 1, policy_version 53730 (0.0009) +[2023-10-08 13:54:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 110002176. Throughput: 0: 1775.2, 1: 1789.1. Samples: 27510246. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:54:56,875][101941] Avg episode reward: [(0, '7.560'), (1, '9.120')] +[2023-10-08 13:54:57,076][102898] Updated weights for policy 1, policy_version 53740 (0.0010) +[2023-10-08 13:54:57,453][102898] Updated weights for policy 1, policy_version 53750 (0.0011) +[2023-10-08 13:54:57,820][102898] Updated weights for policy 1, policy_version 53760 (0.0010) +[2023-10-08 13:54:58,512][102897] Updated weights for policy 0, policy_version 53700 (0.0007) +[2023-10-08 13:54:58,878][102897] Updated weights for policy 0, policy_version 53710 (0.0009) +[2023-10-08 13:54:59,256][102897] Updated weights for policy 0, policy_version 53720 (0.0007) +[2023-10-08 13:55:01,583][102898] Updated weights for policy 1, policy_version 53770 (0.0008) +[2023-10-08 13:55:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 110067712. Throughput: 0: 1781.9, 1: 1809.3. Samples: 27532390. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:01,875][101941] Avg episode reward: [(0, '7.300'), (1, '8.720')] +[2023-10-08 13:55:01,953][102898] Updated weights for policy 1, policy_version 53780 (0.0009) +[2023-10-08 13:55:02,325][102898] Updated weights for policy 1, policy_version 53790 (0.0008) +[2023-10-08 13:55:03,038][102897] Updated weights for policy 0, policy_version 53730 (0.0008) +[2023-10-08 13:55:03,416][102897] Updated weights for policy 0, policy_version 53740 (0.0008) +[2023-10-08 13:55:03,782][102897] Updated weights for policy 0, policy_version 53750 (0.0009) +[2023-10-08 13:55:04,150][102897] Updated weights for policy 0, policy_version 53760 (0.0009) +[2023-10-08 13:55:06,006][102898] Updated weights for policy 1, policy_version 53800 (0.0010) +[2023-10-08 13:55:06,364][102898] Updated weights for policy 1, policy_version 53810 (0.0010) +[2023-10-08 13:55:06,730][102898] Updated weights for policy 1, policy_version 53820 (0.0007) +[2023-10-08 13:55:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 110166016. Throughput: 0: 1780.3, 1: 1798.2. Samples: 27542494. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:06,876][101941] Avg episode reward: [(0, '7.050'), (1, '8.720')] +[2023-10-08 13:55:07,856][102897] Updated weights for policy 0, policy_version 53770 (0.0007) +[2023-10-08 13:55:08,218][102897] Updated weights for policy 0, policy_version 53780 (0.0008) +[2023-10-08 13:55:08,594][102897] Updated weights for policy 0, policy_version 53790 (0.0008) +[2023-10-08 13:55:10,577][102898] Updated weights for policy 1, policy_version 53830 (0.0007) +[2023-10-08 13:55:10,942][102898] Updated weights for policy 1, policy_version 53840 (0.0008) +[2023-10-08 13:55:11,312][102898] Updated weights for policy 1, policy_version 53850 (0.0007) +[2023-10-08 13:55:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 110231552. Throughput: 0: 1787.4, 1: 1810.8. Samples: 27564810. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:11,876][101941] Avg episode reward: [(0, '7.410'), (1, '8.890')] +[2023-10-08 13:55:12,357][102897] Updated weights for policy 0, policy_version 53800 (0.0007) +[2023-10-08 13:55:12,726][102897] Updated weights for policy 0, policy_version 53810 (0.0007) +[2023-10-08 13:55:13,099][102897] Updated weights for policy 0, policy_version 53820 (0.0007) +[2023-10-08 13:55:15,097][102898] Updated weights for policy 1, policy_version 53860 (0.0009) +[2023-10-08 13:55:15,494][102898] Updated weights for policy 1, policy_version 53870 (0.0009) +[2023-10-08 13:55:15,857][102898] Updated weights for policy 1, policy_version 53880 (0.0008) +[2023-10-08 13:55:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 110297088. Throughput: 0: 1806.3, 1: 1792.2. Samples: 27585852. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:16,876][101941] Avg episode reward: [(0, '8.530'), (1, '8.640')] +[2023-10-08 13:55:16,962][102897] Updated weights for policy 0, policy_version 53830 (0.0009) +[2023-10-08 13:55:17,336][102897] Updated weights for policy 0, policy_version 53840 (0.0009) +[2023-10-08 13:55:17,712][102897] Updated weights for policy 0, policy_version 53850 (0.0011) +[2023-10-08 13:55:19,663][102898] Updated weights for policy 1, policy_version 53890 (0.0009) +[2023-10-08 13:55:20,027][102898] Updated weights for policy 1, policy_version 53900 (0.0007) +[2023-10-08 13:55:20,391][102898] Updated weights for policy 1, policy_version 53910 (0.0008) +[2023-10-08 13:55:20,759][102898] Updated weights for policy 1, policy_version 53920 (0.0008) +[2023-10-08 13:55:21,420][102897] Updated weights for policy 0, policy_version 53860 (0.0008) +[2023-10-08 13:55:21,801][102897] Updated weights for policy 0, policy_version 53870 (0.0008) +[2023-10-08 13:55:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 110362624. Throughput: 0: 1791.9, 1: 1809.4. Samples: 27596624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:21,876][101941] Avg episode reward: [(0, '8.780'), (1, '9.110')] +[2023-10-08 13:55:22,180][102897] Updated weights for policy 0, policy_version 53880 (0.0009) +[2023-10-08 13:55:24,394][102898] Updated weights for policy 1, policy_version 53930 (0.0007) +[2023-10-08 13:55:24,750][102898] Updated weights for policy 1, policy_version 53940 (0.0008) +[2023-10-08 13:55:25,119][102898] Updated weights for policy 1, policy_version 53950 (0.0011) +[2023-10-08 13:55:25,936][102897] Updated weights for policy 0, policy_version 53890 (0.0008) +[2023-10-08 13:55:26,309][102897] Updated weights for policy 0, policy_version 53900 (0.0009) +[2023-10-08 13:55:26,684][102897] Updated weights for policy 0, policy_version 53910 (0.0010) +[2023-10-08 13:55:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 110428160. Throughput: 0: 1794.8, 1: 1795.5. Samples: 27617910. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:26,876][101941] Avg episode reward: [(0, '7.590'), (1, '8.450')] +[2023-10-08 13:55:27,062][102897] Updated weights for policy 0, policy_version 53920 (0.0008) +[2023-10-08 13:55:28,836][102898] Updated weights for policy 1, policy_version 53960 (0.0011) +[2023-10-08 13:55:29,200][102898] Updated weights for policy 1, policy_version 53970 (0.0009) +[2023-10-08 13:55:29,564][102898] Updated weights for policy 1, policy_version 53980 (0.0007) +[2023-10-08 13:55:30,779][102897] Updated weights for policy 0, policy_version 53930 (0.0008) +[2023-10-08 13:55:31,153][102897] Updated weights for policy 0, policy_version 53940 (0.0008) +[2023-10-08 13:55:31,531][102897] Updated weights for policy 0, policy_version 53950 (0.0008) +[2023-10-08 13:55:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 110526464. Throughput: 0: 1795.4, 1: 1795.4. Samples: 27639260. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:31,875][101941] Avg episode reward: [(0, '6.910'), (1, '9.220')] +[2023-10-08 13:55:33,201][102898] Updated weights for policy 1, policy_version 53990 (0.0007) +[2023-10-08 13:55:33,570][102898] Updated weights for policy 1, policy_version 54000 (0.0008) +[2023-10-08 13:55:33,942][102898] Updated weights for policy 1, policy_version 54010 (0.0008) +[2023-10-08 13:55:35,340][102897] Updated weights for policy 0, policy_version 53960 (0.0009) +[2023-10-08 13:55:35,714][102897] Updated weights for policy 0, policy_version 53970 (0.0010) +[2023-10-08 13:55:36,087][102897] Updated weights for policy 0, policy_version 53980 (0.0009) +[2023-10-08 13:55:36,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 110592000. Throughput: 0: 1790.9, 1: 1792.7. Samples: 27650104. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:36,875][101941] Avg episode reward: [(0, '7.070'), (1, '9.210')] +[2023-10-08 13:55:37,832][102898] Updated weights for policy 1, policy_version 54020 (0.0008) +[2023-10-08 13:55:38,198][102898] Updated weights for policy 1, policy_version 54030 (0.0008) +[2023-10-08 13:55:38,569][102898] Updated weights for policy 1, policy_version 54040 (0.0007) +[2023-10-08 13:55:39,881][102897] Updated weights for policy 0, policy_version 53990 (0.0007) +[2023-10-08 13:55:40,255][102897] Updated weights for policy 0, policy_version 54000 (0.0009) +[2023-10-08 13:55:40,618][102897] Updated weights for policy 0, policy_version 54010 (0.0008) +[2023-10-08 13:55:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 110657536. Throughput: 0: 1795.5, 1: 1786.3. Samples: 27671426. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:41,876][101941] Avg episode reward: [(0, '7.540'), (1, '8.760')] +[2023-10-08 13:55:42,335][102898] Updated weights for policy 1, policy_version 54050 (0.0009) +[2023-10-08 13:55:42,706][102898] Updated weights for policy 1, policy_version 54060 (0.0009) +[2023-10-08 13:55:43,078][102898] Updated weights for policy 1, policy_version 54070 (0.0008) +[2023-10-08 13:55:43,449][102898] Updated weights for policy 1, policy_version 54080 (0.0008) +[2023-10-08 13:55:44,498][102897] Updated weights for policy 0, policy_version 54020 (0.0010) +[2023-10-08 13:55:44,862][102897] Updated weights for policy 0, policy_version 54030 (0.0011) +[2023-10-08 13:55:45,242][102897] Updated weights for policy 0, policy_version 54040 (0.0007) +[2023-10-08 13:55:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 110723072. Throughput: 0: 1780.9, 1: 1790.9. Samples: 27693120. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:46,876][101941] Avg episode reward: [(0, '7.910'), (1, '9.290')] +[2023-10-08 13:55:47,109][102898] Updated weights for policy 1, policy_version 54090 (0.0009) +[2023-10-08 13:55:47,479][102898] Updated weights for policy 1, policy_version 54100 (0.0008) +[2023-10-08 13:55:47,849][102898] Updated weights for policy 1, policy_version 54110 (0.0008) +[2023-10-08 13:55:48,916][102897] Updated weights for policy 0, policy_version 54050 (0.0008) +[2023-10-08 13:55:49,295][102897] Updated weights for policy 0, policy_version 54060 (0.0011) +[2023-10-08 13:55:49,655][102897] Updated weights for policy 0, policy_version 54070 (0.0010) +[2023-10-08 13:55:50,031][102897] Updated weights for policy 0, policy_version 54080 (0.0008) +[2023-10-08 13:55:51,671][102898] Updated weights for policy 1, policy_version 54120 (0.0007) +[2023-10-08 13:55:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 110788608. Throughput: 0: 1806.0, 1: 1783.9. Samples: 27704038. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:51,876][101941] Avg episode reward: [(0, '7.180'), (1, '8.870')] +[2023-10-08 13:55:52,038][102898] Updated weights for policy 1, policy_version 54130 (0.0007) +[2023-10-08 13:55:52,414][102898] Updated weights for policy 1, policy_version 54140 (0.0007) +[2023-10-08 13:55:53,685][102897] Updated weights for policy 0, policy_version 54090 (0.0007) +[2023-10-08 13:55:54,058][102897] Updated weights for policy 0, policy_version 54100 (0.0008) +[2023-10-08 13:55:54,432][102897] Updated weights for policy 0, policy_version 54110 (0.0007) +[2023-10-08 13:55:56,185][102898] Updated weights for policy 1, policy_version 54150 (0.0007) +[2023-10-08 13:55:56,545][102898] Updated weights for policy 1, policy_version 54160 (0.0007) +[2023-10-08 13:55:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 110854144. Throughput: 0: 1781.5, 1: 1790.2. Samples: 27725536. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:55:56,876][101941] Avg episode reward: [(0, '7.160'), (1, '8.550')] +[2023-10-08 13:55:56,915][102898] Updated weights for policy 1, policy_version 54170 (0.0007) +[2023-10-08 13:55:58,153][102897] Updated weights for policy 0, policy_version 54120 (0.0007) +[2023-10-08 13:55:58,519][102897] Updated weights for policy 0, policy_version 54130 (0.0010) +[2023-10-08 13:55:58,899][102897] Updated weights for policy 0, policy_version 54140 (0.0010) +[2023-10-08 13:56:00,693][102898] Updated weights for policy 1, policy_version 54180 (0.0007) +[2023-10-08 13:56:01,077][102898] Updated weights for policy 1, policy_version 54190 (0.0009) +[2023-10-08 13:56:01,444][102898] Updated weights for policy 1, policy_version 54200 (0.0007) +[2023-10-08 13:56:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 110952448. Throughput: 0: 1784.8, 1: 1796.3. Samples: 27746998. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:01,875][101941] Avg episode reward: [(0, '7.470'), (1, '8.800')] +[2023-10-08 13:56:02,605][102897] Updated weights for policy 0, policy_version 54150 (0.0007) +[2023-10-08 13:56:02,979][102897] Updated weights for policy 0, policy_version 54160 (0.0008) +[2023-10-08 13:56:03,353][102897] Updated weights for policy 0, policy_version 54170 (0.0007) +[2023-10-08 13:56:05,153][102898] Updated weights for policy 1, policy_version 54210 (0.0008) +[2023-10-08 13:56:05,511][102898] Updated weights for policy 1, policy_version 54220 (0.0009) +[2023-10-08 13:56:05,876][102898] Updated weights for policy 1, policy_version 54230 (0.0008) +[2023-10-08 13:56:06,249][102898] Updated weights for policy 1, policy_version 54240 (0.0008) +[2023-10-08 13:56:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 111017984. Throughput: 0: 1792.3, 1: 1790.2. Samples: 27757836. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:06,876][101941] Avg episode reward: [(0, '7.480'), (1, '8.540')] +[2023-10-08 13:56:07,168][102897] Updated weights for policy 0, policy_version 54180 (0.0008) +[2023-10-08 13:56:07,539][102897] Updated weights for policy 0, policy_version 54190 (0.0007) +[2023-10-08 13:56:07,902][102897] Updated weights for policy 0, policy_version 54200 (0.0007) +[2023-10-08 13:56:09,944][102898] Updated weights for policy 1, policy_version 54250 (0.0008) +[2023-10-08 13:56:10,311][102898] Updated weights for policy 1, policy_version 54260 (0.0008) +[2023-10-08 13:56:10,678][102898] Updated weights for policy 1, policy_version 54270 (0.0008) +[2023-10-08 13:56:11,730][102897] Updated weights for policy 0, policy_version 54210 (0.0007) +[2023-10-08 13:56:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 111083520. Throughput: 0: 1785.5, 1: 1801.6. Samples: 27779328. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:11,876][101941] Avg episode reward: [(0, '7.400'), (1, '8.110')] +[2023-10-08 13:56:12,112][102897] Updated weights for policy 0, policy_version 54220 (0.0007) +[2023-10-08 13:56:12,484][102897] Updated weights for policy 0, policy_version 54230 (0.0007) +[2023-10-08 13:56:12,859][102897] Updated weights for policy 0, policy_version 54240 (0.0008) +[2023-10-08 13:56:14,553][102898] Updated weights for policy 1, policy_version 54280 (0.0008) +[2023-10-08 13:56:14,916][102898] Updated weights for policy 1, policy_version 54290 (0.0007) +[2023-10-08 13:56:15,279][102898] Updated weights for policy 1, policy_version 54300 (0.0008) +[2023-10-08 13:56:16,692][102897] Updated weights for policy 0, policy_version 54250 (0.0009) +[2023-10-08 13:56:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 111149056. Throughput: 0: 1809.9, 1: 1783.5. Samples: 27800962. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:16,876][101941] Avg episode reward: [(0, '7.500'), (1, '8.890')] +[2023-10-08 13:56:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000054304_55607296.pth... +[2023-10-08 13:56:16,922][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000052640_53903360.pth +[2023-10-08 13:56:17,066][102897] Updated weights for policy 0, policy_version 54260 (0.0010) +[2023-10-08 13:56:17,444][102897] Updated weights for policy 0, policy_version 54270 (0.0009) +[2023-10-08 13:56:17,514][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000054272_55574528.pth... +[2023-10-08 13:56:17,543][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000052576_53837824.pth +[2023-10-08 13:56:19,217][102898] Updated weights for policy 1, policy_version 54310 (0.0009) +[2023-10-08 13:56:19,584][102898] Updated weights for policy 1, policy_version 54320 (0.0007) +[2023-10-08 13:56:19,953][102898] Updated weights for policy 1, policy_version 54330 (0.0008) +[2023-10-08 13:56:21,255][102897] Updated weights for policy 0, policy_version 54280 (0.0010) +[2023-10-08 13:56:21,625][102897] Updated weights for policy 0, policy_version 54290 (0.0007) +[2023-10-08 13:56:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 111214592. Throughput: 0: 1783.6, 1: 1806.4. Samples: 27811654. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:21,876][101941] Avg episode reward: [(0, '7.120'), (1, '9.200')] +[2023-10-08 13:56:21,997][102897] Updated weights for policy 0, policy_version 54300 (0.0010) +[2023-10-08 13:56:23,544][102898] Updated weights for policy 1, policy_version 54340 (0.0009) +[2023-10-08 13:56:23,912][102898] Updated weights for policy 1, policy_version 54350 (0.0009) +[2023-10-08 13:56:24,277][102898] Updated weights for policy 1, policy_version 54360 (0.0008) +[2023-10-08 13:56:25,730][102897] Updated weights for policy 0, policy_version 54310 (0.0008) +[2023-10-08 13:56:26,114][102897] Updated weights for policy 0, policy_version 54320 (0.0011) +[2023-10-08 13:56:26,488][102897] Updated weights for policy 0, policy_version 54330 (0.0009) +[2023-10-08 13:56:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 111312896. Throughput: 0: 1808.3, 1: 1792.0. Samples: 27833442. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:26,876][101941] Avg episode reward: [(0, '7.110'), (1, '8.780')] +[2023-10-08 13:56:28,056][102898] Updated weights for policy 1, policy_version 54370 (0.0007) +[2023-10-08 13:56:28,420][102898] Updated weights for policy 1, policy_version 54380 (0.0008) +[2023-10-08 13:56:28,791][102898] Updated weights for policy 1, policy_version 54390 (0.0008) +[2023-10-08 13:56:29,155][102898] Updated weights for policy 1, policy_version 54400 (0.0008) +[2023-10-08 13:56:30,271][102897] Updated weights for policy 0, policy_version 54340 (0.0010) +[2023-10-08 13:56:30,644][102897] Updated weights for policy 0, policy_version 54350 (0.0008) +[2023-10-08 13:56:31,017][102897] Updated weights for policy 0, policy_version 54360 (0.0007) +[2023-10-08 13:56:31,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 111378432. Throughput: 0: 1788.8, 1: 1793.4. Samples: 27854322. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:31,876][101941] Avg episode reward: [(0, '7.100'), (1, '9.250')] +[2023-10-08 13:56:32,952][102898] Updated weights for policy 1, policy_version 54410 (0.0008) +[2023-10-08 13:56:33,321][102898] Updated weights for policy 1, policy_version 54420 (0.0007) +[2023-10-08 13:56:33,691][102898] Updated weights for policy 1, policy_version 54430 (0.0007) +[2023-10-08 13:56:34,801][102897] Updated weights for policy 0, policy_version 54370 (0.0008) +[2023-10-08 13:56:35,174][102897] Updated weights for policy 0, policy_version 54380 (0.0010) +[2023-10-08 13:56:35,544][102897] Updated weights for policy 0, policy_version 54390 (0.0009) +[2023-10-08 13:56:35,916][102897] Updated weights for policy 0, policy_version 54400 (0.0010) +[2023-10-08 13:56:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 111443968. Throughput: 0: 1794.8, 1: 1790.7. Samples: 27865384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:36,876][101941] Avg episode reward: [(0, '7.730'), (1, '9.350')] +[2023-10-08 13:56:37,449][102898] Updated weights for policy 1, policy_version 54440 (0.0010) +[2023-10-08 13:56:37,808][102898] Updated weights for policy 1, policy_version 54450 (0.0010) +[2023-10-08 13:56:38,177][102898] Updated weights for policy 1, policy_version 54460 (0.0011) +[2023-10-08 13:56:39,636][102897] Updated weights for policy 0, policy_version 54410 (0.0007) +[2023-10-08 13:56:40,018][102897] Updated weights for policy 0, policy_version 54420 (0.0008) +[2023-10-08 13:56:40,384][102897] Updated weights for policy 0, policy_version 54430 (0.0008) +[2023-10-08 13:56:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 111509504. Throughput: 0: 1787.0, 1: 1785.3. Samples: 27886288. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:41,875][101941] Avg episode reward: [(0, '8.690'), (1, '8.870')] +[2023-10-08 13:56:41,990][102898] Updated weights for policy 1, policy_version 54470 (0.0008) +[2023-10-08 13:56:42,352][102898] Updated weights for policy 1, policy_version 54480 (0.0008) +[2023-10-08 13:56:42,718][102898] Updated weights for policy 1, policy_version 54490 (0.0009) +[2023-10-08 13:56:44,218][102897] Updated weights for policy 0, policy_version 54440 (0.0009) +[2023-10-08 13:56:44,592][102897] Updated weights for policy 0, policy_version 54450 (0.0008) +[2023-10-08 13:56:44,960][102897] Updated weights for policy 0, policy_version 54460 (0.0008) +[2023-10-08 13:56:46,562][102898] Updated weights for policy 1, policy_version 54500 (0.0008) +[2023-10-08 13:56:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 111575040. Throughput: 0: 1776.3, 1: 1810.0. Samples: 27908384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:46,876][101941] Avg episode reward: [(0, '8.320'), (1, '8.660')] +[2023-10-08 13:56:46,952][102898] Updated weights for policy 1, policy_version 54510 (0.0008) +[2023-10-08 13:56:47,334][102898] Updated weights for policy 1, policy_version 54520 (0.0008) +[2023-10-08 13:56:48,736][102897] Updated weights for policy 0, policy_version 54470 (0.0010) +[2023-10-08 13:56:49,110][102897] Updated weights for policy 0, policy_version 54480 (0.0009) +[2023-10-08 13:56:49,478][102897] Updated weights for policy 0, policy_version 54490 (0.0010) +[2023-10-08 13:56:51,030][102898] Updated weights for policy 1, policy_version 54530 (0.0007) +[2023-10-08 13:56:51,406][102898] Updated weights for policy 1, policy_version 54540 (0.0008) +[2023-10-08 13:56:51,759][102898] Updated weights for policy 1, policy_version 54550 (0.0010) +[2023-10-08 13:56:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 111640576. Throughput: 0: 1783.9, 1: 1782.2. Samples: 27918312. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:51,875][101941] Avg episode reward: [(0, '7.420'), (1, '8.250')] +[2023-10-08 13:56:52,126][102898] Updated weights for policy 1, policy_version 54560 (0.0009) +[2023-10-08 13:56:53,232][102897] Updated weights for policy 0, policy_version 54500 (0.0009) +[2023-10-08 13:56:53,592][102897] Updated weights for policy 0, policy_version 54510 (0.0009) +[2023-10-08 13:56:53,963][102897] Updated weights for policy 0, policy_version 54520 (0.0010) +[2023-10-08 13:56:55,983][102898] Updated weights for policy 1, policy_version 54570 (0.0007) +[2023-10-08 13:56:56,366][102898] Updated weights for policy 1, policy_version 54580 (0.0008) +[2023-10-08 13:56:56,728][102898] Updated weights for policy 1, policy_version 54590 (0.0007) +[2023-10-08 13:56:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 111738880. Throughput: 0: 1775.3, 1: 1799.9. Samples: 27940214. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:56:56,876][101941] Avg episode reward: [(0, '8.080'), (1, '8.270')] +[2023-10-08 13:56:57,721][102897] Updated weights for policy 0, policy_version 54530 (0.0011) +[2023-10-08 13:56:58,097][102897] Updated weights for policy 0, policy_version 54540 (0.0007) +[2023-10-08 13:56:58,465][102897] Updated weights for policy 0, policy_version 54550 (0.0007) +[2023-10-08 13:56:58,829][102897] Updated weights for policy 0, policy_version 54560 (0.0009) +[2023-10-08 13:57:00,431][102898] Updated weights for policy 1, policy_version 54600 (0.0010) +[2023-10-08 13:57:00,805][102898] Updated weights for policy 1, policy_version 54610 (0.0008) +[2023-10-08 13:57:01,165][102898] Updated weights for policy 1, policy_version 54620 (0.0011) +[2023-10-08 13:57:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 111804416. Throughput: 0: 1777.0, 1: 1778.6. Samples: 27960964. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:57:01,876][101941] Avg episode reward: [(0, '7.430'), (1, '8.030')] +[2023-10-08 13:57:02,662][102897] Updated weights for policy 0, policy_version 54570 (0.0009) +[2023-10-08 13:57:03,033][102897] Updated weights for policy 0, policy_version 54580 (0.0009) +[2023-10-08 13:57:03,404][102897] Updated weights for policy 0, policy_version 54590 (0.0008) +[2023-10-08 13:57:04,945][102898] Updated weights for policy 1, policy_version 54630 (0.0009) +[2023-10-08 13:57:05,311][102898] Updated weights for policy 1, policy_version 54640 (0.0007) +[2023-10-08 13:57:05,679][102898] Updated weights for policy 1, policy_version 54650 (0.0010) +[2023-10-08 13:57:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 111869952. Throughput: 0: 1774.7, 1: 1792.7. Samples: 27972188. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:57:06,876][101941] Avg episode reward: [(0, '6.510'), (1, '9.220')] +[2023-10-08 13:57:07,163][102897] Updated weights for policy 0, policy_version 54600 (0.0007) +[2023-10-08 13:57:07,542][102897] Updated weights for policy 0, policy_version 54610 (0.0009) +[2023-10-08 13:57:07,904][102897] Updated weights for policy 0, policy_version 54620 (0.0007) +[2023-10-08 13:57:09,577][102898] Updated weights for policy 1, policy_version 54660 (0.0008) +[2023-10-08 13:57:09,945][102898] Updated weights for policy 1, policy_version 54670 (0.0009) +[2023-10-08 13:57:10,320][102898] Updated weights for policy 1, policy_version 54680 (0.0009) +[2023-10-08 13:57:11,733][102897] Updated weights for policy 0, policy_version 54630 (0.0009) +[2023-10-08 13:57:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 111935488. Throughput: 0: 1771.1, 1: 1779.2. Samples: 27993206. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:11,876][101941] Avg episode reward: [(0, '7.390'), (1, '8.470')] +[2023-10-08 13:57:12,112][102897] Updated weights for policy 0, policy_version 54640 (0.0007) +[2023-10-08 13:57:12,492][102897] Updated weights for policy 0, policy_version 54650 (0.0007) +[2023-10-08 13:57:14,003][102898] Updated weights for policy 1, policy_version 54690 (0.0009) +[2023-10-08 13:57:14,373][102898] Updated weights for policy 1, policy_version 54700 (0.0007) +[2023-10-08 13:57:14,734][102898] Updated weights for policy 1, policy_version 54710 (0.0007) +[2023-10-08 13:57:15,104][102898] Updated weights for policy 1, policy_version 54720 (0.0009) +[2023-10-08 13:57:16,365][102897] Updated weights for policy 0, policy_version 54660 (0.0008) +[2023-10-08 13:57:16,741][102897] Updated weights for policy 0, policy_version 54670 (0.0008) +[2023-10-08 13:57:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 112001024. Throughput: 0: 1795.0, 1: 1768.2. Samples: 28014664. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:16,875][101941] Avg episode reward: [(0, '6.950'), (1, '8.430')] +[2023-10-08 13:57:17,109][102897] Updated weights for policy 0, policy_version 54680 (0.0010) +[2023-10-08 13:57:18,891][102898] Updated weights for policy 1, policy_version 54730 (0.0008) +[2023-10-08 13:57:19,255][102898] Updated weights for policy 1, policy_version 54740 (0.0007) +[2023-10-08 13:57:19,619][102898] Updated weights for policy 1, policy_version 54750 (0.0007) +[2023-10-08 13:57:20,858][102897] Updated weights for policy 0, policy_version 54690 (0.0010) +[2023-10-08 13:57:21,224][102897] Updated weights for policy 0, policy_version 54700 (0.0007) +[2023-10-08 13:57:21,583][102897] Updated weights for policy 0, policy_version 54710 (0.0007) +[2023-10-08 13:57:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 112066560. Throughput: 0: 1766.7, 1: 1780.7. Samples: 28025016. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:21,875][101941] Avg episode reward: [(0, '6.330'), (1, '8.640')] +[2023-10-08 13:57:21,954][102897] Updated weights for policy 0, policy_version 54720 (0.0010) +[2023-10-08 13:57:23,461][102898] Updated weights for policy 1, policy_version 54760 (0.0008) +[2023-10-08 13:57:23,820][102898] Updated weights for policy 1, policy_version 54770 (0.0010) +[2023-10-08 13:57:24,189][102898] Updated weights for policy 1, policy_version 54780 (0.0011) +[2023-10-08 13:57:25,665][102897] Updated weights for policy 0, policy_version 54730 (0.0008) +[2023-10-08 13:57:26,041][102897] Updated weights for policy 0, policy_version 54740 (0.0008) +[2023-10-08 13:57:26,405][102897] Updated weights for policy 0, policy_version 54750 (0.0007) +[2023-10-08 13:57:26,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 112164864. Throughput: 0: 1792.6, 1: 1775.9. Samples: 28046870. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:26,876][101941] Avg episode reward: [(0, '6.810'), (1, '8.850')] +[2023-10-08 13:57:27,895][102898] Updated weights for policy 1, policy_version 54790 (0.0009) +[2023-10-08 13:57:28,266][102898] Updated weights for policy 1, policy_version 54800 (0.0007) +[2023-10-08 13:57:28,626][102898] Updated weights for policy 1, policy_version 54810 (0.0008) +[2023-10-08 13:57:30,040][102897] Updated weights for policy 0, policy_version 54760 (0.0007) +[2023-10-08 13:57:30,407][102897] Updated weights for policy 0, policy_version 54770 (0.0008) +[2023-10-08 13:57:30,781][102897] Updated weights for policy 0, policy_version 54780 (0.0007) +[2023-10-08 13:57:31,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 112230400. Throughput: 0: 1774.9, 1: 1779.5. Samples: 28068334. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:31,876][101941] Avg episode reward: [(0, '7.110'), (1, '9.010')] +[2023-10-08 13:57:32,428][102898] Updated weights for policy 1, policy_version 54820 (0.0010) +[2023-10-08 13:57:32,818][102898] Updated weights for policy 1, policy_version 54830 (0.0009) +[2023-10-08 13:57:33,183][102898] Updated weights for policy 1, policy_version 54840 (0.0008) +[2023-10-08 13:57:34,552][102897] Updated weights for policy 0, policy_version 54790 (0.0008) +[2023-10-08 13:57:34,936][102897] Updated weights for policy 0, policy_version 54800 (0.0009) +[2023-10-08 13:57:35,301][102897] Updated weights for policy 0, policy_version 54810 (0.0007) +[2023-10-08 13:57:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 112295936. Throughput: 0: 1800.0, 1: 1777.8. Samples: 28079316. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:36,876][101941] Avg episode reward: [(0, '6.410'), (1, '9.460')] +[2023-10-08 13:57:36,882][102898] Updated weights for policy 1, policy_version 54850 (0.0008) +[2023-10-08 13:57:37,246][102898] Updated weights for policy 1, policy_version 54860 (0.0008) +[2023-10-08 13:57:37,607][102898] Updated weights for policy 1, policy_version 54870 (0.0008) +[2023-10-08 13:57:37,972][102898] Updated weights for policy 1, policy_version 54880 (0.0009) +[2023-10-08 13:57:39,022][102897] Updated weights for policy 0, policy_version 54820 (0.0008) +[2023-10-08 13:57:39,387][102897] Updated weights for policy 0, policy_version 54830 (0.0008) +[2023-10-08 13:57:39,766][102897] Updated weights for policy 0, policy_version 54840 (0.0009) +[2023-10-08 13:57:41,700][102898] Updated weights for policy 1, policy_version 54890 (0.0008) +[2023-10-08 13:57:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 112361472. Throughput: 0: 1778.9, 1: 1784.2. Samples: 28100554. Policy #0 lag: (min: 12.0, avg: 25.8, max: 44.0) +[2023-10-08 13:57:41,876][101941] Avg episode reward: [(0, '6.620'), (1, '9.100')] +[2023-10-08 13:57:42,069][102898] Updated weights for policy 1, policy_version 54900 (0.0007) +[2023-10-08 13:57:42,433][102898] Updated weights for policy 1, policy_version 54910 (0.0008) +[2023-10-08 13:57:43,390][102897] Updated weights for policy 0, policy_version 54850 (0.0008) +[2023-10-08 13:57:43,759][102897] Updated weights for policy 0, policy_version 54860 (0.0009) +[2023-10-08 13:57:44,133][102897] Updated weights for policy 0, policy_version 54870 (0.0008) +[2023-10-08 13:57:44,502][102897] Updated weights for policy 0, policy_version 54880 (0.0007) +[2023-10-08 13:57:46,224][102898] Updated weights for policy 1, policy_version 54920 (0.0008) +[2023-10-08 13:57:46,593][102898] Updated weights for policy 1, policy_version 54930 (0.0010) +[2023-10-08 13:57:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 112427008. Throughput: 0: 1784.0, 1: 1804.1. Samples: 28122430. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:57:46,876][101941] Avg episode reward: [(0, '7.120'), (1, '8.880')] +[2023-10-08 13:57:46,963][102898] Updated weights for policy 1, policy_version 54940 (0.0008) +[2023-10-08 13:57:48,353][102897] Updated weights for policy 0, policy_version 54890 (0.0010) +[2023-10-08 13:57:48,714][102897] Updated weights for policy 0, policy_version 54900 (0.0008) +[2023-10-08 13:57:49,078][102897] Updated weights for policy 0, policy_version 54910 (0.0009) +[2023-10-08 13:57:50,646][102898] Updated weights for policy 1, policy_version 54950 (0.0011) +[2023-10-08 13:57:51,015][102898] Updated weights for policy 1, policy_version 54960 (0.0009) +[2023-10-08 13:57:51,374][102898] Updated weights for policy 1, policy_version 54970 (0.0007) +[2023-10-08 13:57:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 112525312. Throughput: 0: 1783.7, 1: 1784.5. Samples: 28132758. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:57:51,875][101941] Avg episode reward: [(0, '6.930'), (1, '8.590')] +[2023-10-08 13:57:52,862][102897] Updated weights for policy 0, policy_version 54920 (0.0009) +[2023-10-08 13:57:53,237][102897] Updated weights for policy 0, policy_version 54930 (0.0007) +[2023-10-08 13:57:53,606][102897] Updated weights for policy 0, policy_version 54940 (0.0007) +[2023-10-08 13:57:55,088][102898] Updated weights for policy 1, policy_version 54980 (0.0007) +[2023-10-08 13:57:55,455][102898] Updated weights for policy 1, policy_version 54990 (0.0009) +[2023-10-08 13:57:55,824][102898] Updated weights for policy 1, policy_version 55000 (0.0009) +[2023-10-08 13:57:56,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 112590848. Throughput: 0: 1782.0, 1: 1806.1. Samples: 28154670. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:57:56,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.350')] +[2023-10-08 13:57:57,543][102897] Updated weights for policy 0, policy_version 54950 (0.0009) +[2023-10-08 13:57:57,914][102897] Updated weights for policy 0, policy_version 54960 (0.0008) +[2023-10-08 13:57:58,281][102897] Updated weights for policy 0, policy_version 54970 (0.0009) +[2023-10-08 13:57:59,565][102898] Updated weights for policy 1, policy_version 55010 (0.0007) +[2023-10-08 13:57:59,934][102898] Updated weights for policy 1, policy_version 55020 (0.0011) +[2023-10-08 13:58:00,302][102898] Updated weights for policy 1, policy_version 55030 (0.0009) +[2023-10-08 13:58:00,676][102898] Updated weights for policy 1, policy_version 55040 (0.0009) +[2023-10-08 13:58:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 112656384. Throughput: 0: 1794.6, 1: 1798.8. Samples: 28176366. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:58:01,876][101941] Avg episode reward: [(0, '7.540'), (1, '7.810')] +[2023-10-08 13:58:02,093][102897] Updated weights for policy 0, policy_version 54980 (0.0008) +[2023-10-08 13:58:02,473][102897] Updated weights for policy 0, policy_version 54990 (0.0008) +[2023-10-08 13:58:02,834][102897] Updated weights for policy 0, policy_version 55000 (0.0010) +[2023-10-08 13:58:04,386][102898] Updated weights for policy 1, policy_version 55050 (0.0008) +[2023-10-08 13:58:04,754][102898] Updated weights for policy 1, policy_version 55060 (0.0007) +[2023-10-08 13:58:05,128][102898] Updated weights for policy 1, policy_version 55070 (0.0007) +[2023-10-08 13:58:06,573][102897] Updated weights for policy 0, policy_version 55010 (0.0010) +[2023-10-08 13:58:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 112721920. Throughput: 0: 1787.8, 1: 1806.5. Samples: 28186760. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:58:06,876][101941] Avg episode reward: [(0, '6.620'), (1, '8.000')] +[2023-10-08 13:58:06,949][102897] Updated weights for policy 0, policy_version 55020 (0.0007) +[2023-10-08 13:58:07,327][102897] Updated weights for policy 0, policy_version 55030 (0.0007) +[2023-10-08 13:58:07,692][102897] Updated weights for policy 0, policy_version 55040 (0.0010) +[2023-10-08 13:58:08,820][102898] Updated weights for policy 1, policy_version 55080 (0.0007) +[2023-10-08 13:58:09,183][102898] Updated weights for policy 1, policy_version 55090 (0.0007) +[2023-10-08 13:58:09,553][102898] Updated weights for policy 1, policy_version 55100 (0.0007) +[2023-10-08 13:58:11,526][102897] Updated weights for policy 0, policy_version 55050 (0.0009) +[2023-10-08 13:58:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 112787456. Throughput: 0: 1791.1, 1: 1797.6. Samples: 28208362. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:58:11,876][101941] Avg episode reward: [(0, '6.800'), (1, '8.130')] +[2023-10-08 13:58:11,894][102897] Updated weights for policy 0, policy_version 55060 (0.0009) +[2023-10-08 13:58:12,269][102897] Updated weights for policy 0, policy_version 55070 (0.0009) +[2023-10-08 13:58:13,388][102898] Updated weights for policy 1, policy_version 55110 (0.0009) +[2023-10-08 13:58:13,753][102898] Updated weights for policy 1, policy_version 55120 (0.0009) +[2023-10-08 13:58:14,121][102898] Updated weights for policy 1, policy_version 55130 (0.0011) +[2023-10-08 13:58:15,845][102897] Updated weights for policy 0, policy_version 55080 (0.0007) +[2023-10-08 13:58:16,218][102897] Updated weights for policy 0, policy_version 55090 (0.0010) +[2023-10-08 13:58:16,592][102897] Updated weights for policy 0, policy_version 55100 (0.0010) +[2023-10-08 13:58:16,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 112885760. Throughput: 0: 1795.8, 1: 1793.9. Samples: 28229870. Policy #0 lag: (min: 2.0, avg: 2.0, max: 2.0) +[2023-10-08 13:58:16,877][101941] Avg episode reward: [(0, '7.540'), (1, '8.300')] +[2023-10-08 13:58:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000055104_56426496.pth... +[2023-10-08 13:58:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000055136_56459264.pth... +[2023-10-08 13:58:16,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000053408_54689792.pth +[2023-10-08 13:58:16,928][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000053472_54755328.pth +[2023-10-08 13:58:17,973][102898] Updated weights for policy 1, policy_version 55140 (0.0010) +[2023-10-08 13:58:18,361][102898] Updated weights for policy 1, policy_version 55150 (0.0011) +[2023-10-08 13:58:18,719][102898] Updated weights for policy 1, policy_version 55160 (0.0009) +[2023-10-08 13:58:20,246][102897] Updated weights for policy 0, policy_version 55110 (0.0008) +[2023-10-08 13:58:20,627][102897] Updated weights for policy 0, policy_version 55120 (0.0008) +[2023-10-08 13:58:20,998][102897] Updated weights for policy 0, policy_version 55130 (0.0010) +[2023-10-08 13:58:21,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 112951296. Throughput: 0: 1789.6, 1: 1794.9. Samples: 28240618. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:21,875][101941] Avg episode reward: [(0, '7.810'), (1, '8.410')] +[2023-10-08 13:58:22,460][102898] Updated weights for policy 1, policy_version 55170 (0.0009) +[2023-10-08 13:58:22,820][102898] Updated weights for policy 1, policy_version 55180 (0.0007) +[2023-10-08 13:58:23,183][102898] Updated weights for policy 1, policy_version 55190 (0.0007) +[2023-10-08 13:58:23,551][102898] Updated weights for policy 1, policy_version 55200 (0.0009) +[2023-10-08 13:58:24,736][102897] Updated weights for policy 0, policy_version 55140 (0.0009) +[2023-10-08 13:58:25,102][102897] Updated weights for policy 0, policy_version 55150 (0.0009) +[2023-10-08 13:58:25,469][102897] Updated weights for policy 0, policy_version 55160 (0.0010) +[2023-10-08 13:58:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 113016832. Throughput: 0: 1798.4, 1: 1791.8. Samples: 28262114. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:26,876][101941] Avg episode reward: [(0, '7.370'), (1, '9.040')] +[2023-10-08 13:58:27,441][102898] Updated weights for policy 1, policy_version 55210 (0.0011) +[2023-10-08 13:58:27,802][102898] Updated weights for policy 1, policy_version 55220 (0.0011) +[2023-10-08 13:58:28,169][102898] Updated weights for policy 1, policy_version 55230 (0.0009) +[2023-10-08 13:58:29,278][102897] Updated weights for policy 0, policy_version 55170 (0.0009) +[2023-10-08 13:58:29,648][102897] Updated weights for policy 0, policy_version 55180 (0.0008) +[2023-10-08 13:58:30,028][102897] Updated weights for policy 0, policy_version 55190 (0.0010) +[2023-10-08 13:58:30,402][102897] Updated weights for policy 0, policy_version 55200 (0.0011) +[2023-10-08 13:58:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 113082368. Throughput: 0: 1781.9, 1: 1799.1. Samples: 28283574. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:31,876][101941] Avg episode reward: [(0, '8.590'), (1, '9.190')] +[2023-10-08 13:58:32,013][102898] Updated weights for policy 1, policy_version 55240 (0.0008) +[2023-10-08 13:58:32,381][102898] Updated weights for policy 1, policy_version 55250 (0.0007) +[2023-10-08 13:58:32,744][102898] Updated weights for policy 1, policy_version 55260 (0.0008) +[2023-10-08 13:58:34,106][102897] Updated weights for policy 0, policy_version 55210 (0.0010) +[2023-10-08 13:58:34,490][102897] Updated weights for policy 0, policy_version 55220 (0.0010) +[2023-10-08 13:58:34,872][102897] Updated weights for policy 0, policy_version 55230 (0.0010) +[2023-10-08 13:58:36,548][102898] Updated weights for policy 1, policy_version 55270 (0.0008) +[2023-10-08 13:58:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 113147904. Throughput: 0: 1802.6, 1: 1784.1. Samples: 28294160. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:36,875][101941] Avg episode reward: [(0, '8.470'), (1, '8.650')] +[2023-10-08 13:58:36,912][102898] Updated weights for policy 1, policy_version 55280 (0.0010) +[2023-10-08 13:58:37,293][102898] Updated weights for policy 1, policy_version 55290 (0.0011) +[2023-10-08 13:58:38,683][102897] Updated weights for policy 0, policy_version 55240 (0.0010) +[2023-10-08 13:58:39,068][102897] Updated weights for policy 0, policy_version 55250 (0.0009) +[2023-10-08 13:58:39,427][102897] Updated weights for policy 0, policy_version 55260 (0.0008) +[2023-10-08 13:58:41,103][102898] Updated weights for policy 1, policy_version 55300 (0.0008) +[2023-10-08 13:58:41,465][102898] Updated weights for policy 1, policy_version 55310 (0.0007) +[2023-10-08 13:58:41,835][102898] Updated weights for policy 1, policy_version 55320 (0.0009) +[2023-10-08 13:58:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 113213440. Throughput: 0: 1787.7, 1: 1789.4. Samples: 28315642. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:41,876][101941] Avg episode reward: [(0, '7.720'), (1, '9.180')] +[2023-10-08 13:58:43,126][102897] Updated weights for policy 0, policy_version 55270 (0.0008) +[2023-10-08 13:58:43,490][102897] Updated weights for policy 0, policy_version 55280 (0.0007) +[2023-10-08 13:58:43,869][102897] Updated weights for policy 0, policy_version 55290 (0.0007) +[2023-10-08 13:58:45,386][102898] Updated weights for policy 1, policy_version 55330 (0.0009) +[2023-10-08 13:58:45,752][102898] Updated weights for policy 1, policy_version 55340 (0.0008) +[2023-10-08 13:58:46,114][102898] Updated weights for policy 1, policy_version 55350 (0.0008) +[2023-10-08 13:58:46,486][102898] Updated weights for policy 1, policy_version 55360 (0.0008) +[2023-10-08 13:58:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 113311744. Throughput: 0: 1788.0, 1: 1777.6. Samples: 28336814. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:46,876][101941] Avg episode reward: [(0, '7.200'), (1, '9.410')] +[2023-10-08 13:58:47,621][102897] Updated weights for policy 0, policy_version 55300 (0.0009) +[2023-10-08 13:58:47,988][102897] Updated weights for policy 0, policy_version 55310 (0.0010) +[2023-10-08 13:58:48,359][102897] Updated weights for policy 0, policy_version 55320 (0.0011) +[2023-10-08 13:58:50,213][102898] Updated weights for policy 1, policy_version 55370 (0.0007) +[2023-10-08 13:58:50,579][102898] Updated weights for policy 1, policy_version 55380 (0.0007) +[2023-10-08 13:58:50,943][102898] Updated weights for policy 1, policy_version 55390 (0.0007) +[2023-10-08 13:58:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 113377280. Throughput: 0: 1789.6, 1: 1792.3. Samples: 28347948. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:51,876][101941] Avg episode reward: [(0, '7.250'), (1, '9.340')] +[2023-10-08 13:58:52,115][102897] Updated weights for policy 0, policy_version 55330 (0.0010) +[2023-10-08 13:58:52,493][102897] Updated weights for policy 0, policy_version 55340 (0.0007) +[2023-10-08 13:58:52,859][102897] Updated weights for policy 0, policy_version 55350 (0.0008) +[2023-10-08 13:58:53,232][102897] Updated weights for policy 0, policy_version 55360 (0.0008) +[2023-10-08 13:58:54,643][102898] Updated weights for policy 1, policy_version 55400 (0.0007) +[2023-10-08 13:58:55,016][102898] Updated weights for policy 1, policy_version 55410 (0.0009) +[2023-10-08 13:58:55,381][102898] Updated weights for policy 1, policy_version 55420 (0.0008) +[2023-10-08 13:58:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 113442816. Throughput: 0: 1790.6, 1: 1790.6. Samples: 28369516. Policy #0 lag: (min: 8.0, avg: 34.7, max: 40.0) +[2023-10-08 13:58:56,876][101941] Avg episode reward: [(0, '7.660'), (1, '8.400')] +[2023-10-08 13:58:56,952][102897] Updated weights for policy 0, policy_version 55370 (0.0009) +[2023-10-08 13:58:57,323][102897] Updated weights for policy 0, policy_version 55380 (0.0008) +[2023-10-08 13:58:57,692][102897] Updated weights for policy 0, policy_version 55390 (0.0008) +[2023-10-08 13:58:59,127][102898] Updated weights for policy 1, policy_version 55430 (0.0008) +[2023-10-08 13:58:59,482][102898] Updated weights for policy 1, policy_version 55440 (0.0007) +[2023-10-08 13:58:59,840][102898] Updated weights for policy 1, policy_version 55450 (0.0007) +[2023-10-08 13:59:01,488][102897] Updated weights for policy 0, policy_version 55400 (0.0010) +[2023-10-08 13:59:01,864][102897] Updated weights for policy 0, policy_version 55410 (0.0010) +[2023-10-08 13:59:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 113508352. Throughput: 0: 1801.3, 1: 1789.3. Samples: 28391450. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:01,875][101941] Avg episode reward: [(0, '8.190'), (1, '8.980')] +[2023-10-08 13:59:02,233][102897] Updated weights for policy 0, policy_version 55420 (0.0010) +[2023-10-08 13:59:03,712][102898] Updated weights for policy 1, policy_version 55460 (0.0008) +[2023-10-08 13:59:04,092][102898] Updated weights for policy 1, policy_version 55470 (0.0009) +[2023-10-08 13:59:04,458][102898] Updated weights for policy 1, policy_version 55480 (0.0008) +[2023-10-08 13:59:06,144][102897] Updated weights for policy 0, policy_version 55430 (0.0009) +[2023-10-08 13:59:06,514][102897] Updated weights for policy 0, policy_version 55440 (0.0007) +[2023-10-08 13:59:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 113573888. Throughput: 0: 1778.6, 1: 1798.1. Samples: 28401570. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:06,875][101941] Avg episode reward: [(0, '7.580'), (1, '9.260')] +[2023-10-08 13:59:06,885][102897] Updated weights for policy 0, policy_version 55450 (0.0008) +[2023-10-08 13:59:08,165][102898] Updated weights for policy 1, policy_version 55490 (0.0007) +[2023-10-08 13:59:08,529][102898] Updated weights for policy 1, policy_version 55500 (0.0009) +[2023-10-08 13:59:08,896][102898] Updated weights for policy 1, policy_version 55510 (0.0008) +[2023-10-08 13:59:09,261][102898] Updated weights for policy 1, policy_version 55520 (0.0007) +[2023-10-08 13:59:10,775][102897] Updated weights for policy 0, policy_version 55460 (0.0009) +[2023-10-08 13:59:11,152][102897] Updated weights for policy 0, policy_version 55470 (0.0008) +[2023-10-08 13:59:11,521][102897] Updated weights for policy 0, policy_version 55480 (0.0007) +[2023-10-08 13:59:11,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 113672192. Throughput: 0: 1797.6, 1: 1790.1. Samples: 28423560. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:11,876][101941] Avg episode reward: [(0, '7.410'), (1, '8.450')] +[2023-10-08 13:59:12,911][102898] Updated weights for policy 1, policy_version 55530 (0.0007) +[2023-10-08 13:59:13,270][102898] Updated weights for policy 1, policy_version 55540 (0.0007) +[2023-10-08 13:59:13,641][102898] Updated weights for policy 1, policy_version 55550 (0.0007) +[2023-10-08 13:59:15,148][102897] Updated weights for policy 0, policy_version 55490 (0.0008) +[2023-10-08 13:59:15,512][102897] Updated weights for policy 0, policy_version 55500 (0.0009) +[2023-10-08 13:59:15,874][102897] Updated weights for policy 0, policy_version 55510 (0.0009) +[2023-10-08 13:59:16,243][102897] Updated weights for policy 0, policy_version 55520 (0.0007) +[2023-10-08 13:59:16,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 113737728. Throughput: 0: 1785.5, 1: 1800.4. Samples: 28444936. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:16,876][101941] Avg episode reward: [(0, '7.000'), (1, '8.170')] +[2023-10-08 13:59:17,429][102898] Updated weights for policy 1, policy_version 55560 (0.0007) +[2023-10-08 13:59:17,791][102898] Updated weights for policy 1, policy_version 55570 (0.0008) +[2023-10-08 13:59:18,155][102898] Updated weights for policy 1, policy_version 55580 (0.0009) +[2023-10-08 13:59:19,953][102897] Updated weights for policy 0, policy_version 55530 (0.0008) +[2023-10-08 13:59:20,323][102897] Updated weights for policy 0, policy_version 55540 (0.0010) +[2023-10-08 13:59:20,690][102897] Updated weights for policy 0, policy_version 55550 (0.0010) +[2023-10-08 13:59:21,785][102898] Updated weights for policy 1, policy_version 55590 (0.0010) +[2023-10-08 13:59:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 113803264. Throughput: 0: 1800.4, 1: 1799.3. Samples: 28456146. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:21,875][101941] Avg episode reward: [(0, '6.540'), (1, '7.890')] +[2023-10-08 13:59:22,148][102898] Updated weights for policy 1, policy_version 55600 (0.0008) +[2023-10-08 13:59:22,515][102898] Updated weights for policy 1, policy_version 55610 (0.0011) +[2023-10-08 13:59:24,466][102897] Updated weights for policy 0, policy_version 55560 (0.0007) +[2023-10-08 13:59:24,839][102897] Updated weights for policy 0, policy_version 55570 (0.0007) +[2023-10-08 13:59:25,206][102897] Updated weights for policy 0, policy_version 55580 (0.0007) +[2023-10-08 13:59:26,660][102898] Updated weights for policy 1, policy_version 55620 (0.0009) +[2023-10-08 13:59:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 113868800. Throughput: 0: 1784.5, 1: 1797.9. Samples: 28476850. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:26,876][101941] Avg episode reward: [(0, '6.680'), (1, '7.310')] +[2023-10-08 13:59:27,029][102898] Updated weights for policy 1, policy_version 55630 (0.0007) +[2023-10-08 13:59:27,391][102898] Updated weights for policy 1, policy_version 55640 (0.0007) +[2023-10-08 13:59:28,817][102897] Updated weights for policy 0, policy_version 55590 (0.0007) +[2023-10-08 13:59:29,194][102897] Updated weights for policy 0, policy_version 55600 (0.0007) +[2023-10-08 13:59:29,569][102897] Updated weights for policy 0, policy_version 55610 (0.0008) +[2023-10-08 13:59:31,206][102898] Updated weights for policy 1, policy_version 55650 (0.0007) +[2023-10-08 13:59:31,574][102898] Updated weights for policy 1, policy_version 55660 (0.0008) +[2023-10-08 13:59:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 113934336. Throughput: 0: 1785.7, 1: 1814.7. Samples: 28498832. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 13:59:31,876][101941] Avg episode reward: [(0, '6.700'), (1, '8.520')] +[2023-10-08 13:59:31,938][102898] Updated weights for policy 1, policy_version 55670 (0.0009) +[2023-10-08 13:59:32,303][102898] Updated weights for policy 1, policy_version 55680 (0.0011) +[2023-10-08 13:59:33,285][102897] Updated weights for policy 0, policy_version 55620 (0.0009) +[2023-10-08 13:59:33,651][102897] Updated weights for policy 0, policy_version 55630 (0.0007) +[2023-10-08 13:59:34,019][102897] Updated weights for policy 0, policy_version 55640 (0.0010) +[2023-10-08 13:59:35,848][102898] Updated weights for policy 1, policy_version 55690 (0.0009) +[2023-10-08 13:59:36,222][102898] Updated weights for policy 1, policy_version 55700 (0.0009) +[2023-10-08 13:59:36,595][102898] Updated weights for policy 1, policy_version 55710 (0.0008) +[2023-10-08 13:59:36,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 114032640. Throughput: 0: 1785.4, 1: 1792.5. Samples: 28508954. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 13:59:36,875][101941] Avg episode reward: [(0, '7.070'), (1, '9.040')] +[2023-10-08 13:59:37,820][102897] Updated weights for policy 0, policy_version 55650 (0.0009) +[2023-10-08 13:59:38,200][102897] Updated weights for policy 0, policy_version 55660 (0.0007) +[2023-10-08 13:59:38,568][102897] Updated weights for policy 0, policy_version 55670 (0.0009) +[2023-10-08 13:59:38,931][102897] Updated weights for policy 0, policy_version 55680 (0.0010) +[2023-10-08 13:59:40,343][102898] Updated weights for policy 1, policy_version 55720 (0.0008) +[2023-10-08 13:59:40,705][102898] Updated weights for policy 1, policy_version 55730 (0.0008) +[2023-10-08 13:59:41,073][102898] Updated weights for policy 1, policy_version 55740 (0.0007) +[2023-10-08 13:59:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 114098176. Throughput: 0: 1780.3, 1: 1804.1. Samples: 28530816. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 13:59:41,876][101941] Avg episode reward: [(0, '7.800'), (1, '8.760')] +[2023-10-08 13:59:42,731][102897] Updated weights for policy 0, policy_version 55690 (0.0007) +[2023-10-08 13:59:43,100][102897] Updated weights for policy 0, policy_version 55700 (0.0007) +[2023-10-08 13:59:43,463][102897] Updated weights for policy 0, policy_version 55710 (0.0007) +[2023-10-08 13:59:44,885][102898] Updated weights for policy 1, policy_version 55750 (0.0008) +[2023-10-08 13:59:45,255][102898] Updated weights for policy 1, policy_version 55760 (0.0007) +[2023-10-08 13:59:45,627][102898] Updated weights for policy 1, policy_version 55770 (0.0009) +[2023-10-08 13:59:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 114163712. Throughput: 0: 1785.6, 1: 1780.8. Samples: 28551936. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 13:59:46,875][101941] Avg episode reward: [(0, '7.940'), (1, '8.950')] +[2023-10-08 13:59:47,360][102897] Updated weights for policy 0, policy_version 55720 (0.0010) +[2023-10-08 13:59:47,729][102897] Updated weights for policy 0, policy_version 55730 (0.0009) +[2023-10-08 13:59:48,108][102897] Updated weights for policy 0, policy_version 55740 (0.0008) +[2023-10-08 13:59:49,442][102898] Updated weights for policy 1, policy_version 55780 (0.0008) +[2023-10-08 13:59:49,820][102898] Updated weights for policy 1, policy_version 55790 (0.0007) +[2023-10-08 13:59:50,190][102898] Updated weights for policy 1, policy_version 55800 (0.0008) +[2023-10-08 13:59:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 114229248. Throughput: 0: 1779.9, 1: 1799.9. Samples: 28562664. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 13:59:51,876][101941] Avg episode reward: [(0, '7.730'), (1, '9.340')] +[2023-10-08 13:59:51,916][102897] Updated weights for policy 0, policy_version 55750 (0.0007) +[2023-10-08 13:59:52,303][102897] Updated weights for policy 0, policy_version 55760 (0.0007) +[2023-10-08 13:59:52,681][102897] Updated weights for policy 0, policy_version 55770 (0.0007) +[2023-10-08 13:59:53,970][102898] Updated weights for policy 1, policy_version 55810 (0.0009) +[2023-10-08 13:59:54,338][102898] Updated weights for policy 1, policy_version 55820 (0.0010) +[2023-10-08 13:59:54,705][102898] Updated weights for policy 1, policy_version 55830 (0.0010) +[2023-10-08 13:59:55,067][102898] Updated weights for policy 1, policy_version 55840 (0.0008) +[2023-10-08 13:59:56,448][102897] Updated weights for policy 0, policy_version 55780 (0.0008) +[2023-10-08 13:59:56,820][102897] Updated weights for policy 0, policy_version 55790 (0.0007) +[2023-10-08 13:59:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 114294784. Throughput: 0: 1782.9, 1: 1777.0. Samples: 28583754. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 13:59:56,876][101941] Avg episode reward: [(0, '8.260'), (1, '8.520')] +[2023-10-08 13:59:57,193][102897] Updated weights for policy 0, policy_version 55800 (0.0007) +[2023-10-08 13:59:58,930][102898] Updated weights for policy 1, policy_version 55850 (0.0008) +[2023-10-08 13:59:59,293][102898] Updated weights for policy 1, policy_version 55860 (0.0009) +[2023-10-08 13:59:59,661][102898] Updated weights for policy 1, policy_version 55870 (0.0007) +[2023-10-08 14:00:00,939][102897] Updated weights for policy 0, policy_version 55810 (0.0011) +[2023-10-08 14:00:01,308][102897] Updated weights for policy 0, policy_version 55820 (0.0010) +[2023-10-08 14:00:01,677][102897] Updated weights for policy 0, policy_version 55830 (0.0008) +[2023-10-08 14:00:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 114360320. Throughput: 0: 1796.5, 1: 1773.4. Samples: 28605580. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 14:00:01,876][101941] Avg episode reward: [(0, '7.830'), (1, '7.860')] +[2023-10-08 14:00:02,042][102897] Updated weights for policy 0, policy_version 55840 (0.0008) +[2023-10-08 14:00:03,398][102898] Updated weights for policy 1, policy_version 55880 (0.0008) +[2023-10-08 14:00:03,761][102898] Updated weights for policy 1, policy_version 55890 (0.0010) +[2023-10-08 14:00:04,123][102898] Updated weights for policy 1, policy_version 55900 (0.0009) +[2023-10-08 14:00:05,654][102897] Updated weights for policy 0, policy_version 55850 (0.0009) +[2023-10-08 14:00:06,025][102897] Updated weights for policy 0, policy_version 55860 (0.0010) +[2023-10-08 14:00:06,395][102897] Updated weights for policy 0, policy_version 55870 (0.0011) +[2023-10-08 14:00:06,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 114458624. Throughput: 0: 1782.6, 1: 1771.7. Samples: 28616090. Policy #0 lag: (min: 27.0, avg: 27.0, max: 27.0) +[2023-10-08 14:00:06,875][101941] Avg episode reward: [(0, '7.740'), (1, '8.260')] +[2023-10-08 14:00:07,685][102898] Updated weights for policy 1, policy_version 55910 (0.0007) +[2023-10-08 14:00:08,058][102898] Updated weights for policy 1, policy_version 55920 (0.0010) +[2023-10-08 14:00:08,423][102898] Updated weights for policy 1, policy_version 55930 (0.0011) +[2023-10-08 14:00:10,253][102897] Updated weights for policy 0, policy_version 55880 (0.0008) +[2023-10-08 14:00:10,634][102897] Updated weights for policy 0, policy_version 55890 (0.0008) +[2023-10-08 14:00:10,997][102897] Updated weights for policy 0, policy_version 55900 (0.0008) +[2023-10-08 14:00:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 114524160. Throughput: 0: 1802.0, 1: 1785.1. Samples: 28638268. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:11,876][101941] Avg episode reward: [(0, '7.690'), (1, '8.760')] +[2023-10-08 14:00:12,186][102898] Updated weights for policy 1, policy_version 55940 (0.0010) +[2023-10-08 14:00:12,553][102898] Updated weights for policy 1, policy_version 55950 (0.0009) +[2023-10-08 14:00:12,923][102898] Updated weights for policy 1, policy_version 55960 (0.0010) +[2023-10-08 14:00:14,671][102897] Updated weights for policy 0, policy_version 55910 (0.0008) +[2023-10-08 14:00:15,047][102897] Updated weights for policy 0, policy_version 55920 (0.0007) +[2023-10-08 14:00:15,416][102897] Updated weights for policy 0, policy_version 55930 (0.0009) +[2023-10-08 14:00:16,679][102898] Updated weights for policy 1, policy_version 55970 (0.0010) +[2023-10-08 14:00:16,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 114589696. Throughput: 0: 1780.8, 1: 1794.7. Samples: 28659728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:16,876][101941] Avg episode reward: [(0, '7.590'), (1, '9.200')] +[2023-10-08 14:00:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000055936_57278464.pth... +[2023-10-08 14:00:16,919][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000054272_55574528.pth +[2023-10-08 14:00:17,043][102898] Updated weights for policy 1, policy_version 55980 (0.0008) +[2023-10-08 14:00:17,412][102898] Updated weights for policy 1, policy_version 55990 (0.0007) +[2023-10-08 14:00:17,779][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000056000_57344000.pth... +[2023-10-08 14:00:17,782][102898] Updated weights for policy 1, policy_version 56000 (0.0008) +[2023-10-08 14:00:17,810][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000054304_55607296.pth +[2023-10-08 14:00:19,259][102897] Updated weights for policy 0, policy_version 55940 (0.0009) +[2023-10-08 14:00:19,632][102897] Updated weights for policy 0, policy_version 55950 (0.0008) +[2023-10-08 14:00:20,007][102897] Updated weights for policy 0, policy_version 55960 (0.0009) +[2023-10-08 14:00:21,647][102898] Updated weights for policy 1, policy_version 56010 (0.0008) +[2023-10-08 14:00:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 114655232. Throughput: 0: 1807.2, 1: 1780.6. Samples: 28670404. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:21,875][101941] Avg episode reward: [(0, '7.450'), (1, '8.910')] +[2023-10-08 14:00:22,013][102898] Updated weights for policy 1, policy_version 56020 (0.0007) +[2023-10-08 14:00:22,377][102898] Updated weights for policy 1, policy_version 56030 (0.0010) +[2023-10-08 14:00:23,770][102897] Updated weights for policy 0, policy_version 55970 (0.0008) +[2023-10-08 14:00:24,137][102897] Updated weights for policy 0, policy_version 55980 (0.0008) +[2023-10-08 14:00:24,517][102897] Updated weights for policy 0, policy_version 55990 (0.0008) +[2023-10-08 14:00:24,878][102897] Updated weights for policy 0, policy_version 56000 (0.0009) +[2023-10-08 14:00:26,194][102898] Updated weights for policy 1, policy_version 56040 (0.0009) +[2023-10-08 14:00:26,558][102898] Updated weights for policy 1, policy_version 56050 (0.0008) +[2023-10-08 14:00:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 114720768. Throughput: 0: 1776.7, 1: 1785.8. Samples: 28691126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:26,875][101941] Avg episode reward: [(0, '7.540'), (1, '8.830')] +[2023-10-08 14:00:26,923][102898] Updated weights for policy 1, policy_version 56060 (0.0007) +[2023-10-08 14:00:28,655][102897] Updated weights for policy 0, policy_version 56010 (0.0008) +[2023-10-08 14:00:29,017][102897] Updated weights for policy 0, policy_version 56020 (0.0008) +[2023-10-08 14:00:29,390][102897] Updated weights for policy 0, policy_version 56030 (0.0009) +[2023-10-08 14:00:30,601][102898] Updated weights for policy 1, policy_version 56070 (0.0007) +[2023-10-08 14:00:30,962][102898] Updated weights for policy 1, policy_version 56080 (0.0011) +[2023-10-08 14:00:31,329][102898] Updated weights for policy 1, policy_version 56090 (0.0007) +[2023-10-08 14:00:31,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 114819072. Throughput: 0: 1781.9, 1: 1786.4. Samples: 28712508. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:31,876][101941] Avg episode reward: [(0, '7.870'), (1, '9.580')] +[2023-10-08 14:00:33,017][102897] Updated weights for policy 0, policy_version 56040 (0.0008) +[2023-10-08 14:00:33,383][102897] Updated weights for policy 0, policy_version 56050 (0.0009) +[2023-10-08 14:00:33,763][102897] Updated weights for policy 0, policy_version 56060 (0.0007) +[2023-10-08 14:00:35,278][102898] Updated weights for policy 1, policy_version 56100 (0.0009) +[2023-10-08 14:00:35,675][102898] Updated weights for policy 1, policy_version 56110 (0.0009) +[2023-10-08 14:00:36,041][102898] Updated weights for policy 1, policy_version 56120 (0.0010) +[2023-10-08 14:00:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 114884608. Throughput: 0: 1786.8, 1: 1788.7. Samples: 28723560. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:36,876][101941] Avg episode reward: [(0, '7.660'), (1, '9.370')] +[2023-10-08 14:00:37,658][102897] Updated weights for policy 0, policy_version 56070 (0.0008) +[2023-10-08 14:00:38,048][102897] Updated weights for policy 0, policy_version 56080 (0.0007) +[2023-10-08 14:00:38,421][102897] Updated weights for policy 0, policy_version 56090 (0.0008) +[2023-10-08 14:00:39,598][102898] Updated weights for policy 1, policy_version 56130 (0.0010) +[2023-10-08 14:00:39,970][102898] Updated weights for policy 1, policy_version 56140 (0.0009) +[2023-10-08 14:00:40,324][102898] Updated weights for policy 1, policy_version 56150 (0.0010) +[2023-10-08 14:00:40,691][102898] Updated weights for policy 1, policy_version 56160 (0.0010) +[2023-10-08 14:00:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 114950144. Throughput: 0: 1782.8, 1: 1794.1. Samples: 28744712. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:41,875][101941] Avg episode reward: [(0, '7.300'), (1, '9.150')] +[2023-10-08 14:00:42,161][102897] Updated weights for policy 0, policy_version 56100 (0.0009) +[2023-10-08 14:00:42,539][102897] Updated weights for policy 0, policy_version 56110 (0.0009) +[2023-10-08 14:00:42,911][102897] Updated weights for policy 0, policy_version 56120 (0.0009) +[2023-10-08 14:00:44,303][102898] Updated weights for policy 1, policy_version 56170 (0.0009) +[2023-10-08 14:00:44,680][102898] Updated weights for policy 1, policy_version 56180 (0.0008) +[2023-10-08 14:00:45,047][102898] Updated weights for policy 1, policy_version 56190 (0.0008) +[2023-10-08 14:00:46,655][102897] Updated weights for policy 0, policy_version 56130 (0.0010) +[2023-10-08 14:00:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 115015680. Throughput: 0: 1798.8, 1: 1787.6. Samples: 28766970. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:46,875][101941] Avg episode reward: [(0, '7.910'), (1, '9.240')] +[2023-10-08 14:00:47,029][102897] Updated weights for policy 0, policy_version 56140 (0.0009) +[2023-10-08 14:00:47,395][102897] Updated weights for policy 0, policy_version 56150 (0.0009) +[2023-10-08 14:00:47,773][102897] Updated weights for policy 0, policy_version 56160 (0.0009) +[2023-10-08 14:00:49,051][102898] Updated weights for policy 1, policy_version 56200 (0.0008) +[2023-10-08 14:00:49,420][102898] Updated weights for policy 1, policy_version 56210 (0.0008) +[2023-10-08 14:00:49,792][102898] Updated weights for policy 1, policy_version 56220 (0.0008) +[2023-10-08 14:00:51,521][102897] Updated weights for policy 0, policy_version 56170 (0.0007) +[2023-10-08 14:00:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 115081216. Throughput: 0: 1777.1, 1: 1801.5. Samples: 28777128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:51,876][101941] Avg episode reward: [(0, '7.870'), (1, '9.040')] +[2023-10-08 14:00:51,891][102897] Updated weights for policy 0, policy_version 56180 (0.0008) +[2023-10-08 14:00:52,261][102897] Updated weights for policy 0, policy_version 56190 (0.0010) +[2023-10-08 14:00:53,556][102898] Updated weights for policy 1, policy_version 56230 (0.0008) +[2023-10-08 14:00:53,920][102898] Updated weights for policy 1, policy_version 56240 (0.0010) +[2023-10-08 14:00:54,280][102898] Updated weights for policy 1, policy_version 56250 (0.0010) +[2023-10-08 14:00:56,105][102897] Updated weights for policy 0, policy_version 56200 (0.0009) +[2023-10-08 14:00:56,484][102897] Updated weights for policy 0, policy_version 56210 (0.0009) +[2023-10-08 14:00:56,859][102897] Updated weights for policy 0, policy_version 56220 (0.0009) +[2023-10-08 14:00:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 115146752. Throughput: 0: 1789.5, 1: 1778.5. Samples: 28798830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:00:56,875][101941] Avg episode reward: [(0, '7.460'), (1, '8.550')] +[2023-10-08 14:00:58,085][102898] Updated weights for policy 1, policy_version 56260 (0.0009) +[2023-10-08 14:00:58,456][102898] Updated weights for policy 1, policy_version 56270 (0.0007) +[2023-10-08 14:00:58,818][102898] Updated weights for policy 1, policy_version 56280 (0.0008) +[2023-10-08 14:01:00,616][102897] Updated weights for policy 0, policy_version 56230 (0.0009) +[2023-10-08 14:01:00,990][102897] Updated weights for policy 0, policy_version 56240 (0.0008) +[2023-10-08 14:01:01,364][102897] Updated weights for policy 0, policy_version 56250 (0.0011) +[2023-10-08 14:01:01,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 115245056. Throughput: 0: 1781.8, 1: 1780.8. Samples: 28820044. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:01:01,875][101941] Avg episode reward: [(0, '7.030'), (1, '7.680')] +[2023-10-08 14:01:02,552][102898] Updated weights for policy 1, policy_version 56290 (0.0008) +[2023-10-08 14:01:02,910][102898] Updated weights for policy 1, policy_version 56300 (0.0010) +[2023-10-08 14:01:03,273][102898] Updated weights for policy 1, policy_version 56310 (0.0011) +[2023-10-08 14:01:03,640][102898] Updated weights for policy 1, policy_version 56320 (0.0009) +[2023-10-08 14:01:05,049][102897] Updated weights for policy 0, policy_version 56260 (0.0008) +[2023-10-08 14:01:05,426][102897] Updated weights for policy 0, policy_version 56270 (0.0007) +[2023-10-08 14:01:05,794][102897] Updated weights for policy 0, policy_version 56280 (0.0007) +[2023-10-08 14:01:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 115310592. Throughput: 0: 1786.3, 1: 1781.0. Samples: 28830932. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:01:06,876][101941] Avg episode reward: [(0, '7.040'), (1, '7.980')] +[2023-10-08 14:01:07,347][102898] Updated weights for policy 1, policy_version 56330 (0.0008) +[2023-10-08 14:01:07,705][102898] Updated weights for policy 1, policy_version 56340 (0.0009) +[2023-10-08 14:01:08,072][102898] Updated weights for policy 1, policy_version 56350 (0.0007) +[2023-10-08 14:01:09,496][102897] Updated weights for policy 0, policy_version 56290 (0.0008) +[2023-10-08 14:01:09,870][102897] Updated weights for policy 0, policy_version 56300 (0.0008) +[2023-10-08 14:01:10,247][102897] Updated weights for policy 0, policy_version 56310 (0.0009) +[2023-10-08 14:01:10,613][102897] Updated weights for policy 0, policy_version 56320 (0.0011) +[2023-10-08 14:01:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 115376128. Throughput: 0: 1797.8, 1: 1788.7. Samples: 28852520. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:01:11,876][101941] Avg episode reward: [(0, '7.440'), (1, '8.660')] +[2023-10-08 14:01:11,996][102898] Updated weights for policy 1, policy_version 56360 (0.0010) +[2023-10-08 14:01:12,369][102898] Updated weights for policy 1, policy_version 56370 (0.0009) +[2023-10-08 14:01:12,720][102898] Updated weights for policy 1, policy_version 56380 (0.0011) +[2023-10-08 14:01:14,340][102897] Updated weights for policy 0, policy_version 56330 (0.0007) +[2023-10-08 14:01:14,707][102897] Updated weights for policy 0, policy_version 56340 (0.0007) +[2023-10-08 14:01:15,086][102897] Updated weights for policy 0, policy_version 56350 (0.0007) +[2023-10-08 14:01:16,504][102898] Updated weights for policy 1, policy_version 56390 (0.0008) +[2023-10-08 14:01:16,870][102898] Updated weights for policy 1, policy_version 56400 (0.0010) +[2023-10-08 14:01:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 115441664. Throughput: 0: 1790.0, 1: 1807.5. Samples: 28874396. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:01:16,876][101941] Avg episode reward: [(0, '7.020'), (1, '9.080')] +[2023-10-08 14:01:17,241][102898] Updated weights for policy 1, policy_version 56410 (0.0009) +[2023-10-08 14:01:18,638][102897] Updated weights for policy 0, policy_version 56360 (0.0009) +[2023-10-08 14:01:19,003][102897] Updated weights for policy 0, policy_version 56370 (0.0010) +[2023-10-08 14:01:19,373][102897] Updated weights for policy 0, policy_version 56380 (0.0009) +[2023-10-08 14:01:20,975][102898] Updated weights for policy 1, policy_version 56420 (0.0007) +[2023-10-08 14:01:21,350][102898] Updated weights for policy 1, policy_version 56430 (0.0008) +[2023-10-08 14:01:21,714][102898] Updated weights for policy 1, policy_version 56440 (0.0008) +[2023-10-08 14:01:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 115507200. Throughput: 0: 1796.5, 1: 1786.3. Samples: 28884784. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:01:21,876][101941] Avg episode reward: [(0, '6.930'), (1, '9.160')] +[2023-10-08 14:01:23,155][102897] Updated weights for policy 0, policy_version 56390 (0.0010) +[2023-10-08 14:01:23,525][102897] Updated weights for policy 0, policy_version 56400 (0.0010) +[2023-10-08 14:01:23,890][102897] Updated weights for policy 0, policy_version 56410 (0.0010) +[2023-10-08 14:01:25,638][102898] Updated weights for policy 1, policy_version 56450 (0.0007) +[2023-10-08 14:01:26,004][102898] Updated weights for policy 1, policy_version 56460 (0.0008) +[2023-10-08 14:01:26,378][102898] Updated weights for policy 1, policy_version 56470 (0.0009) +[2023-10-08 14:01:26,741][102898] Updated weights for policy 1, policy_version 56480 (0.0010) +[2023-10-08 14:01:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 115605504. Throughput: 0: 1794.1, 1: 1808.6. Samples: 28906834. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:26,875][101941] Avg episode reward: [(0, '7.080'), (1, '9.800')] +[2023-10-08 14:01:27,708][102897] Updated weights for policy 0, policy_version 56420 (0.0010) +[2023-10-08 14:01:28,104][102897] Updated weights for policy 0, policy_version 56430 (0.0007) +[2023-10-08 14:01:28,477][102897] Updated weights for policy 0, policy_version 56440 (0.0009) +[2023-10-08 14:01:30,389][102898] Updated weights for policy 1, policy_version 56490 (0.0007) +[2023-10-08 14:01:30,760][102898] Updated weights for policy 1, policy_version 56500 (0.0010) +[2023-10-08 14:01:31,128][102898] Updated weights for policy 1, policy_version 56510 (0.0011) +[2023-10-08 14:01:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 115671040. Throughput: 0: 1791.7, 1: 1785.2. Samples: 28927932. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:31,876][101941] Avg episode reward: [(0, '6.390'), (1, '9.390')] +[2023-10-08 14:01:32,207][102897] Updated weights for policy 0, policy_version 56450 (0.0011) +[2023-10-08 14:01:32,577][102897] Updated weights for policy 0, policy_version 56460 (0.0009) +[2023-10-08 14:01:32,950][102897] Updated weights for policy 0, policy_version 56470 (0.0008) +[2023-10-08 14:01:33,312][102897] Updated weights for policy 0, policy_version 56480 (0.0008) +[2023-10-08 14:01:34,957][102898] Updated weights for policy 1, policy_version 56520 (0.0008) +[2023-10-08 14:01:35,325][102898] Updated weights for policy 1, policy_version 56530 (0.0007) +[2023-10-08 14:01:35,688][102898] Updated weights for policy 1, policy_version 56540 (0.0008) +[2023-10-08 14:01:36,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 115736576. Throughput: 0: 1791.0, 1: 1808.8. Samples: 28939122. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:36,876][101941] Avg episode reward: [(0, '6.760'), (1, '8.320')] +[2023-10-08 14:01:37,135][102897] Updated weights for policy 0, policy_version 56490 (0.0009) +[2023-10-08 14:01:37,504][102897] Updated weights for policy 0, policy_version 56500 (0.0008) +[2023-10-08 14:01:37,872][102897] Updated weights for policy 0, policy_version 56510 (0.0011) +[2023-10-08 14:01:39,419][102898] Updated weights for policy 1, policy_version 56550 (0.0008) +[2023-10-08 14:01:39,784][102898] Updated weights for policy 1, policy_version 56560 (0.0007) +[2023-10-08 14:01:40,149][102898] Updated weights for policy 1, policy_version 56570 (0.0009) +[2023-10-08 14:01:41,542][102897] Updated weights for policy 0, policy_version 56520 (0.0009) +[2023-10-08 14:01:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 115802112. Throughput: 0: 1792.5, 1: 1791.1. Samples: 28960092. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:41,875][101941] Avg episode reward: [(0, '7.160'), (1, '9.310')] +[2023-10-08 14:01:41,922][102897] Updated weights for policy 0, policy_version 56530 (0.0010) +[2023-10-08 14:01:42,287][102897] Updated weights for policy 0, policy_version 56540 (0.0008) +[2023-10-08 14:01:43,718][102898] Updated weights for policy 1, policy_version 56580 (0.0009) +[2023-10-08 14:01:44,091][102898] Updated weights for policy 1, policy_version 56590 (0.0007) +[2023-10-08 14:01:44,450][102898] Updated weights for policy 1, policy_version 56600 (0.0007) +[2023-10-08 14:01:45,996][102897] Updated weights for policy 0, policy_version 56550 (0.0007) +[2023-10-08 14:01:46,356][102897] Updated weights for policy 0, policy_version 56560 (0.0007) +[2023-10-08 14:01:46,731][102897] Updated weights for policy 0, policy_version 56570 (0.0007) +[2023-10-08 14:01:46,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 115867648. Throughput: 0: 1803.5, 1: 1796.3. Samples: 28982034. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:46,875][101941] Avg episode reward: [(0, '6.710'), (1, '9.220')] +[2023-10-08 14:01:48,236][102898] Updated weights for policy 1, policy_version 56610 (0.0008) +[2023-10-08 14:01:48,609][102898] Updated weights for policy 1, policy_version 56620 (0.0008) +[2023-10-08 14:01:48,968][102898] Updated weights for policy 1, policy_version 56630 (0.0007) +[2023-10-08 14:01:49,339][102898] Updated weights for policy 1, policy_version 56640 (0.0008) +[2023-10-08 14:01:50,447][102897] Updated weights for policy 0, policy_version 56580 (0.0009) +[2023-10-08 14:01:50,805][102897] Updated weights for policy 0, policy_version 56590 (0.0009) +[2023-10-08 14:01:51,175][102897] Updated weights for policy 0, policy_version 56600 (0.0008) +[2023-10-08 14:01:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 115965952. Throughput: 0: 1793.2, 1: 1798.9. Samples: 28992578. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:51,875][101941] Avg episode reward: [(0, '6.690'), (1, '9.230')] +[2023-10-08 14:01:52,961][102898] Updated weights for policy 1, policy_version 56650 (0.0007) +[2023-10-08 14:01:53,322][102898] Updated weights for policy 1, policy_version 56660 (0.0007) +[2023-10-08 14:01:53,695][102898] Updated weights for policy 1, policy_version 56670 (0.0008) +[2023-10-08 14:01:54,982][102897] Updated weights for policy 0, policy_version 56610 (0.0008) +[2023-10-08 14:01:55,352][102897] Updated weights for policy 0, policy_version 56620 (0.0008) +[2023-10-08 14:01:55,725][102897] Updated weights for policy 0, policy_version 56630 (0.0010) +[2023-10-08 14:01:56,096][102897] Updated weights for policy 0, policy_version 56640 (0.0009) +[2023-10-08 14:01:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 116031488. Throughput: 0: 1801.8, 1: 1798.9. Samples: 29014554. Policy #0 lag: (min: 31.0, avg: 32.4, max: 57.0) +[2023-10-08 14:01:56,875][101941] Avg episode reward: [(0, '6.780'), (1, '8.900')] +[2023-10-08 14:01:57,312][102898] Updated weights for policy 1, policy_version 56680 (0.0009) +[2023-10-08 14:01:57,677][102898] Updated weights for policy 1, policy_version 56690 (0.0007) +[2023-10-08 14:01:58,043][102898] Updated weights for policy 1, policy_version 56700 (0.0008) +[2023-10-08 14:01:59,965][102897] Updated weights for policy 0, policy_version 56650 (0.0009) +[2023-10-08 14:02:00,339][102897] Updated weights for policy 0, policy_version 56660 (0.0009) +[2023-10-08 14:02:00,714][102897] Updated weights for policy 0, policy_version 56670 (0.0009) +[2023-10-08 14:02:01,739][102898] Updated weights for policy 1, policy_version 56710 (0.0008) +[2023-10-08 14:02:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 116097024. Throughput: 0: 1783.6, 1: 1808.8. Samples: 29036052. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:01,875][101941] Avg episode reward: [(0, '7.740'), (1, '7.800')] +[2023-10-08 14:02:02,104][102898] Updated weights for policy 1, policy_version 56720 (0.0008) +[2023-10-08 14:02:02,477][102898] Updated weights for policy 1, policy_version 56730 (0.0008) +[2023-10-08 14:02:04,578][102897] Updated weights for policy 0, policy_version 56680 (0.0008) +[2023-10-08 14:02:04,945][102897] Updated weights for policy 0, policy_version 56690 (0.0007) +[2023-10-08 14:02:05,313][102897] Updated weights for policy 0, policy_version 56700 (0.0007) +[2023-10-08 14:02:06,368][102898] Updated weights for policy 1, policy_version 56740 (0.0007) +[2023-10-08 14:02:06,748][102898] Updated weights for policy 1, policy_version 56750 (0.0007) +[2023-10-08 14:02:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 116162560. Throughput: 0: 1810.3, 1: 1799.0. Samples: 29047200. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:06,876][101941] Avg episode reward: [(0, '7.990'), (1, '7.910')] +[2023-10-08 14:02:07,118][102898] Updated weights for policy 1, policy_version 56760 (0.0007) +[2023-10-08 14:02:08,992][102897] Updated weights for policy 0, policy_version 56710 (0.0007) +[2023-10-08 14:02:09,358][102897] Updated weights for policy 0, policy_version 56720 (0.0009) +[2023-10-08 14:02:09,728][102897] Updated weights for policy 0, policy_version 56730 (0.0009) +[2023-10-08 14:02:10,792][102898] Updated weights for policy 1, policy_version 56770 (0.0008) +[2023-10-08 14:02:11,162][102898] Updated weights for policy 1, policy_version 56780 (0.0008) +[2023-10-08 14:02:11,523][102898] Updated weights for policy 1, policy_version 56790 (0.0009) +[2023-10-08 14:02:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 116228096. Throughput: 0: 1787.7, 1: 1800.8. Samples: 29068316. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:11,875][101941] Avg episode reward: [(0, '7.680'), (1, '8.750')] +[2023-10-08 14:02:11,889][102898] Updated weights for policy 1, policy_version 56800 (0.0008) +[2023-10-08 14:02:13,615][102897] Updated weights for policy 0, policy_version 56740 (0.0007) +[2023-10-08 14:02:13,988][102897] Updated weights for policy 0, policy_version 56750 (0.0009) +[2023-10-08 14:02:14,368][102897] Updated weights for policy 0, policy_version 56760 (0.0011) +[2023-10-08 14:02:15,667][102898] Updated weights for policy 1, policy_version 56810 (0.0007) +[2023-10-08 14:02:16,037][102898] Updated weights for policy 1, policy_version 56820 (0.0008) +[2023-10-08 14:02:16,405][102898] Updated weights for policy 1, policy_version 56830 (0.0009) +[2023-10-08 14:02:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 116326400. Throughput: 0: 1784.7, 1: 1801.0. Samples: 29089288. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:16,876][101941] Avg episode reward: [(0, '7.660'), (1, '9.140')] +[2023-10-08 14:02:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000056832_58195968.pth... +[2023-10-08 14:02:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000056768_58130432.pth... +[2023-10-08 14:02:16,920][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000055104_56426496.pth +[2023-10-08 14:02:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000055136_56459264.pth +[2023-10-08 14:02:18,098][102897] Updated weights for policy 0, policy_version 56770 (0.0009) +[2023-10-08 14:02:18,473][102897] Updated weights for policy 0, policy_version 56780 (0.0010) +[2023-10-08 14:02:18,847][102897] Updated weights for policy 0, policy_version 56790 (0.0007) +[2023-10-08 14:02:19,223][102897] Updated weights for policy 0, policy_version 56800 (0.0009) +[2023-10-08 14:02:20,078][102898] Updated weights for policy 1, policy_version 56840 (0.0009) +[2023-10-08 14:02:20,448][102898] Updated weights for policy 1, policy_version 56850 (0.0008) +[2023-10-08 14:02:20,813][102898] Updated weights for policy 1, policy_version 56860 (0.0007) +[2023-10-08 14:02:21,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 116391936. Throughput: 0: 1782.0, 1: 1799.3. Samples: 29100278. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:21,876][101941] Avg episode reward: [(0, '7.850'), (1, '9.090')] +[2023-10-08 14:02:23,228][102897] Updated weights for policy 0, policy_version 56810 (0.0009) +[2023-10-08 14:02:23,598][102897] Updated weights for policy 0, policy_version 56820 (0.0009) +[2023-10-08 14:02:23,966][102897] Updated weights for policy 0, policy_version 56830 (0.0007) +[2023-10-08 14:02:24,444][102898] Updated weights for policy 1, policy_version 56870 (0.0009) +[2023-10-08 14:02:24,807][102898] Updated weights for policy 1, policy_version 56880 (0.0010) +[2023-10-08 14:02:25,178][102898] Updated weights for policy 1, policy_version 56890 (0.0008) +[2023-10-08 14:02:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 116457472. Throughput: 0: 1778.5, 1: 1804.8. Samples: 29121342. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:26,876][101941] Avg episode reward: [(0, '7.580'), (1, '9.250')] +[2023-10-08 14:02:27,684][102897] Updated weights for policy 0, policy_version 56840 (0.0007) +[2023-10-08 14:02:28,048][102897] Updated weights for policy 0, policy_version 56850 (0.0008) +[2023-10-08 14:02:28,419][102897] Updated weights for policy 0, policy_version 56860 (0.0007) +[2023-10-08 14:02:28,881][102898] Updated weights for policy 1, policy_version 56900 (0.0008) +[2023-10-08 14:02:29,249][102898] Updated weights for policy 1, policy_version 56910 (0.0007) +[2023-10-08 14:02:29,617][102898] Updated weights for policy 1, policy_version 56920 (0.0008) +[2023-10-08 14:02:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 116523008. Throughput: 0: 1789.8, 1: 1803.9. Samples: 29143752. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:31,876][101941] Avg episode reward: [(0, '7.180'), (1, '8.560')] +[2023-10-08 14:02:32,239][102897] Updated weights for policy 0, policy_version 56870 (0.0007) +[2023-10-08 14:02:32,611][102897] Updated weights for policy 0, policy_version 56880 (0.0007) +[2023-10-08 14:02:32,976][102897] Updated weights for policy 0, policy_version 56890 (0.0009) +[2023-10-08 14:02:33,445][102898] Updated weights for policy 1, policy_version 56930 (0.0009) +[2023-10-08 14:02:33,809][102898] Updated weights for policy 1, policy_version 56940 (0.0009) +[2023-10-08 14:02:34,172][102898] Updated weights for policy 1, policy_version 56950 (0.0008) +[2023-10-08 14:02:34,542][102898] Updated weights for policy 1, policy_version 56960 (0.0010) +[2023-10-08 14:02:36,816][102897] Updated weights for policy 0, policy_version 56900 (0.0009) +[2023-10-08 14:02:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 116588544. Throughput: 0: 1771.2, 1: 1810.4. Samples: 29153748. Policy #0 lag: (min: 31.0, avg: 31.1, max: 39.0) +[2023-10-08 14:02:36,875][101941] Avg episode reward: [(0, '7.170'), (1, '8.200')] +[2023-10-08 14:02:37,179][102897] Updated weights for policy 0, policy_version 56910 (0.0007) +[2023-10-08 14:02:37,547][102897] Updated weights for policy 0, policy_version 56920 (0.0008) +[2023-10-08 14:02:38,137][102898] Updated weights for policy 1, policy_version 56970 (0.0009) +[2023-10-08 14:02:38,499][102898] Updated weights for policy 1, policy_version 56980 (0.0010) +[2023-10-08 14:02:38,869][102898] Updated weights for policy 1, policy_version 56990 (0.0010) +[2023-10-08 14:02:41,354][102897] Updated weights for policy 0, policy_version 56930 (0.0007) +[2023-10-08 14:02:41,733][102897] Updated weights for policy 0, policy_version 56940 (0.0009) +[2023-10-08 14:02:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 116654080. Throughput: 0: 1778.9, 1: 1804.9. Samples: 29175826. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:02:41,876][101941] Avg episode reward: [(0, '7.560'), (1, '8.770')] +[2023-10-08 14:02:42,096][102897] Updated weights for policy 0, policy_version 56950 (0.0007) +[2023-10-08 14:02:42,468][102897] Updated weights for policy 0, policy_version 56960 (0.0007) +[2023-10-08 14:02:42,501][102898] Updated weights for policy 1, policy_version 57000 (0.0008) +[2023-10-08 14:02:42,862][102898] Updated weights for policy 1, policy_version 57010 (0.0007) +[2023-10-08 14:02:43,221][102898] Updated weights for policy 1, policy_version 57020 (0.0008) +[2023-10-08 14:02:46,287][102897] Updated weights for policy 0, policy_version 56970 (0.0009) +[2023-10-08 14:02:46,651][102897] Updated weights for policy 0, policy_version 56980 (0.0008) +[2023-10-08 14:02:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 116719616. Throughput: 0: 1789.3, 1: 1805.5. Samples: 29197818. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:02:46,875][101941] Avg episode reward: [(0, '7.410'), (1, '9.640')] +[2023-10-08 14:02:46,928][102898] Updated weights for policy 1, policy_version 57030 (0.0007) +[2023-10-08 14:02:47,015][102897] Updated weights for policy 0, policy_version 56990 (0.0008) +[2023-10-08 14:02:47,300][102898] Updated weights for policy 1, policy_version 57040 (0.0007) +[2023-10-08 14:02:47,668][102898] Updated weights for policy 1, policy_version 57050 (0.0008) +[2023-10-08 14:02:50,774][102897] Updated weights for policy 0, policy_version 57000 (0.0007) +[2023-10-08 14:02:51,147][102897] Updated weights for policy 0, policy_version 57010 (0.0008) +[2023-10-08 14:02:51,511][102897] Updated weights for policy 0, policy_version 57020 (0.0007) +[2023-10-08 14:02:51,751][102898] Updated weights for policy 1, policy_version 57060 (0.0010) +[2023-10-08 14:02:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 116817920. Throughput: 0: 1767.0, 1: 1807.0. Samples: 29208030. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:02:51,875][101941] Avg episode reward: [(0, '7.300'), (1, '9.820')] +[2023-10-08 14:02:52,141][102898] Updated weights for policy 1, policy_version 57070 (0.0007) +[2023-10-08 14:02:52,504][102898] Updated weights for policy 1, policy_version 57080 (0.0008) +[2023-10-08 14:02:55,295][102897] Updated weights for policy 0, policy_version 57030 (0.0007) +[2023-10-08 14:02:55,665][102897] Updated weights for policy 0, policy_version 57040 (0.0008) +[2023-10-08 14:02:56,036][102897] Updated weights for policy 0, policy_version 57050 (0.0008) +[2023-10-08 14:02:56,078][102898] Updated weights for policy 1, policy_version 57090 (0.0008) +[2023-10-08 14:02:56,445][102898] Updated weights for policy 1, policy_version 57100 (0.0008) +[2023-10-08 14:02:56,820][102898] Updated weights for policy 1, policy_version 57110 (0.0009) +[2023-10-08 14:02:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 116883456. Throughput: 0: 1790.3, 1: 1802.1. Samples: 29229974. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:02:56,876][101941] Avg episode reward: [(0, '7.210'), (1, '9.010')] +[2023-10-08 14:02:57,183][102898] Updated weights for policy 1, policy_version 57120 (0.0008) +[2023-10-08 14:02:59,704][102897] Updated weights for policy 0, policy_version 57060 (0.0009) +[2023-10-08 14:03:00,090][102897] Updated weights for policy 0, policy_version 57070 (0.0007) +[2023-10-08 14:03:00,462][102897] Updated weights for policy 0, policy_version 57080 (0.0008) +[2023-10-08 14:03:00,884][102898] Updated weights for policy 1, policy_version 57130 (0.0008) +[2023-10-08 14:03:01,259][102898] Updated weights for policy 1, policy_version 57140 (0.0008) +[2023-10-08 14:03:01,619][102898] Updated weights for policy 1, policy_version 57150 (0.0009) +[2023-10-08 14:03:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 116981760. Throughput: 0: 1769.3, 1: 1813.5. Samples: 29250512. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:03:01,875][101941] Avg episode reward: [(0, '7.350'), (1, '9.550')] +[2023-10-08 14:03:04,127][102897] Updated weights for policy 0, policy_version 57090 (0.0010) +[2023-10-08 14:03:04,494][102897] Updated weights for policy 0, policy_version 57100 (0.0008) +[2023-10-08 14:03:04,859][102897] Updated weights for policy 0, policy_version 57110 (0.0009) +[2023-10-08 14:03:05,237][102897] Updated weights for policy 0, policy_version 57120 (0.0007) +[2023-10-08 14:03:05,395][102898] Updated weights for policy 1, policy_version 57160 (0.0010) +[2023-10-08 14:03:05,762][102898] Updated weights for policy 1, policy_version 57170 (0.0007) +[2023-10-08 14:03:06,118][102898] Updated weights for policy 1, policy_version 57180 (0.0007) +[2023-10-08 14:03:06,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 117047296. Throughput: 0: 1800.8, 1: 1805.7. Samples: 29262570. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:03:06,876][101941] Avg episode reward: [(0, '7.530'), (1, '9.080')] +[2023-10-08 14:03:08,998][102897] Updated weights for policy 0, policy_version 57130 (0.0007) +[2023-10-08 14:03:09,375][102897] Updated weights for policy 0, policy_version 57140 (0.0008) +[2023-10-08 14:03:09,755][102897] Updated weights for policy 0, policy_version 57150 (0.0008) +[2023-10-08 14:03:09,859][102898] Updated weights for policy 1, policy_version 57190 (0.0009) +[2023-10-08 14:03:10,232][102898] Updated weights for policy 1, policy_version 57200 (0.0009) +[2023-10-08 14:03:10,611][102898] Updated weights for policy 1, policy_version 57210 (0.0010) +[2023-10-08 14:03:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 117112832. Throughput: 0: 1776.7, 1: 1816.6. Samples: 29283040. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:03:11,875][101941] Avg episode reward: [(0, '7.760'), (1, '8.980')] +[2023-10-08 14:03:13,651][102897] Updated weights for policy 0, policy_version 57160 (0.0007) +[2023-10-08 14:03:14,020][102897] Updated weights for policy 0, policy_version 57170 (0.0008) +[2023-10-08 14:03:14,393][102897] Updated weights for policy 0, policy_version 57180 (0.0009) +[2023-10-08 14:03:14,415][102898] Updated weights for policy 1, policy_version 57220 (0.0008) +[2023-10-08 14:03:14,788][102898] Updated weights for policy 1, policy_version 57230 (0.0011) +[2023-10-08 14:03:15,153][102898] Updated weights for policy 1, policy_version 57240 (0.0009) +[2023-10-08 14:03:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 117178368. Throughput: 0: 1778.0, 1: 1801.6. Samples: 29304832. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:16,875][101941] Avg episode reward: [(0, '7.350'), (1, '8.330')] +[2023-10-08 14:03:18,177][102897] Updated weights for policy 0, policy_version 57190 (0.0008) +[2023-10-08 14:03:18,552][102897] Updated weights for policy 0, policy_version 57200 (0.0007) +[2023-10-08 14:03:18,915][102897] Updated weights for policy 0, policy_version 57210 (0.0009) +[2023-10-08 14:03:19,042][102898] Updated weights for policy 1, policy_version 57250 (0.0008) +[2023-10-08 14:03:19,396][102898] Updated weights for policy 1, policy_version 57260 (0.0008) +[2023-10-08 14:03:19,769][102898] Updated weights for policy 1, policy_version 57270 (0.0008) +[2023-10-08 14:03:20,133][102898] Updated weights for policy 1, policy_version 57280 (0.0008) +[2023-10-08 14:03:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 117243904. Throughput: 0: 1776.8, 1: 1812.1. Samples: 29315252. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:21,875][101941] Avg episode reward: [(0, '7.470'), (1, '8.100')] +[2023-10-08 14:03:22,647][102897] Updated weights for policy 0, policy_version 57220 (0.0008) +[2023-10-08 14:03:23,023][102897] Updated weights for policy 0, policy_version 57230 (0.0010) +[2023-10-08 14:03:23,388][102897] Updated weights for policy 0, policy_version 57240 (0.0009) +[2023-10-08 14:03:23,867][102898] Updated weights for policy 1, policy_version 57290 (0.0009) +[2023-10-08 14:03:24,235][102898] Updated weights for policy 1, policy_version 57300 (0.0009) +[2023-10-08 14:03:24,605][102898] Updated weights for policy 1, policy_version 57310 (0.0008) +[2023-10-08 14:03:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 117309440. Throughput: 0: 1782.4, 1: 1792.4. Samples: 29336694. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:26,876][101941] Avg episode reward: [(0, '7.250'), (1, '9.080')] +[2023-10-08 14:03:27,241][102897] Updated weights for policy 0, policy_version 57250 (0.0008) +[2023-10-08 14:03:27,605][102897] Updated weights for policy 0, policy_version 57260 (0.0007) +[2023-10-08 14:03:27,970][102897] Updated weights for policy 0, policy_version 57270 (0.0007) +[2023-10-08 14:03:28,346][102897] Updated weights for policy 0, policy_version 57280 (0.0008) +[2023-10-08 14:03:28,479][102898] Updated weights for policy 1, policy_version 57320 (0.0008) +[2023-10-08 14:03:28,850][102898] Updated weights for policy 1, policy_version 57330 (0.0008) +[2023-10-08 14:03:29,224][102898] Updated weights for policy 1, policy_version 57340 (0.0008) +[2023-10-08 14:03:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 117374976. Throughput: 0: 1793.2, 1: 1787.5. Samples: 29358952. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:31,875][101941] Avg episode reward: [(0, '7.410'), (1, '9.320')] +[2023-10-08 14:03:32,091][102897] Updated weights for policy 0, policy_version 57290 (0.0008) +[2023-10-08 14:03:32,472][102897] Updated weights for policy 0, policy_version 57300 (0.0011) +[2023-10-08 14:03:32,844][102897] Updated weights for policy 0, policy_version 57310 (0.0008) +[2023-10-08 14:03:32,943][102898] Updated weights for policy 1, policy_version 57350 (0.0008) +[2023-10-08 14:03:33,311][102898] Updated weights for policy 1, policy_version 57360 (0.0008) +[2023-10-08 14:03:33,678][102898] Updated weights for policy 1, policy_version 57370 (0.0010) +[2023-10-08 14:03:36,512][102897] Updated weights for policy 0, policy_version 57320 (0.0009) +[2023-10-08 14:03:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 117440512. Throughput: 0: 1778.5, 1: 1789.6. Samples: 29368596. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:36,876][101941] Avg episode reward: [(0, '8.240'), (1, '8.670')] +[2023-10-08 14:03:36,881][102897] Updated weights for policy 0, policy_version 57330 (0.0007) +[2023-10-08 14:03:37,248][102897] Updated weights for policy 0, policy_version 57340 (0.0007) +[2023-10-08 14:03:37,603][102898] Updated weights for policy 1, policy_version 57380 (0.0009) +[2023-10-08 14:03:37,992][102898] Updated weights for policy 1, policy_version 57390 (0.0008) +[2023-10-08 14:03:38,359][102898] Updated weights for policy 1, policy_version 57400 (0.0010) +[2023-10-08 14:03:40,886][102897] Updated weights for policy 0, policy_version 57350 (0.0009) +[2023-10-08 14:03:41,265][102897] Updated weights for policy 0, policy_version 57360 (0.0010) +[2023-10-08 14:03:41,634][102897] Updated weights for policy 0, policy_version 57370 (0.0008) +[2023-10-08 14:03:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 117538816. Throughput: 0: 1793.3, 1: 1785.9. Samples: 29391038. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:41,876][101941] Avg episode reward: [(0, '7.670'), (1, '9.030')] +[2023-10-08 14:03:42,065][102898] Updated weights for policy 1, policy_version 57410 (0.0011) +[2023-10-08 14:03:42,439][102898] Updated weights for policy 1, policy_version 57420 (0.0010) +[2023-10-08 14:03:42,811][102898] Updated weights for policy 1, policy_version 57430 (0.0009) +[2023-10-08 14:03:43,176][102898] Updated weights for policy 1, policy_version 57440 (0.0008) +[2023-10-08 14:03:45,315][102897] Updated weights for policy 0, policy_version 57380 (0.0007) +[2023-10-08 14:03:45,695][102897] Updated weights for policy 0, policy_version 57390 (0.0009) +[2023-10-08 14:03:46,069][102897] Updated weights for policy 0, policy_version 57400 (0.0010) +[2023-10-08 14:03:46,829][102898] Updated weights for policy 1, policy_version 57450 (0.0009) +[2023-10-08 14:03:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 117604352. Throughput: 0: 1786.3, 1: 1806.3. Samples: 29412176. Policy #0 lag: (min: 9.0, avg: 21.0, max: 41.0) +[2023-10-08 14:03:46,875][101941] Avg episode reward: [(0, '7.300'), (1, '8.850')] +[2023-10-08 14:03:47,194][102898] Updated weights for policy 1, policy_version 57460 (0.0009) +[2023-10-08 14:03:47,557][102898] Updated weights for policy 1, policy_version 57470 (0.0008) +[2023-10-08 14:03:49,761][102897] Updated weights for policy 0, policy_version 57410 (0.0008) +[2023-10-08 14:03:50,129][102897] Updated weights for policy 0, policy_version 57420 (0.0009) +[2023-10-08 14:03:50,502][102897] Updated weights for policy 0, policy_version 57430 (0.0008) +[2023-10-08 14:03:50,879][102897] Updated weights for policy 0, policy_version 57440 (0.0008) +[2023-10-08 14:03:51,340][102898] Updated weights for policy 1, policy_version 57480 (0.0009) +[2023-10-08 14:03:51,702][102898] Updated weights for policy 1, policy_version 57490 (0.0009) +[2023-10-08 14:03:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 117669888. Throughput: 0: 1792.8, 1: 1777.4. Samples: 29423230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:03:51,876][101941] Avg episode reward: [(0, '7.670'), (1, '7.800')] +[2023-10-08 14:03:52,077][102898] Updated weights for policy 1, policy_version 57500 (0.0008) +[2023-10-08 14:03:54,833][102897] Updated weights for policy 0, policy_version 57450 (0.0007) +[2023-10-08 14:03:55,209][102897] Updated weights for policy 0, policy_version 57460 (0.0008) +[2023-10-08 14:03:55,574][102897] Updated weights for policy 0, policy_version 57470 (0.0007) +[2023-10-08 14:03:56,013][102898] Updated weights for policy 1, policy_version 57510 (0.0007) +[2023-10-08 14:03:56,390][102898] Updated weights for policy 1, policy_version 57520 (0.0007) +[2023-10-08 14:03:56,753][102898] Updated weights for policy 1, policy_version 57530 (0.0009) +[2023-10-08 14:03:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 117735424. Throughput: 0: 1792.5, 1: 1794.1. Samples: 29444436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:03:56,876][101941] Avg episode reward: [(0, '7.390'), (1, '9.050')] +[2023-10-08 14:03:59,235][102897] Updated weights for policy 0, policy_version 57480 (0.0008) +[2023-10-08 14:03:59,601][102897] Updated weights for policy 0, policy_version 57490 (0.0008) +[2023-10-08 14:03:59,970][102897] Updated weights for policy 0, policy_version 57500 (0.0007) +[2023-10-08 14:04:00,184][102898] Updated weights for policy 1, policy_version 57540 (0.0007) +[2023-10-08 14:04:00,538][102898] Updated weights for policy 1, policy_version 57550 (0.0009) +[2023-10-08 14:04:00,912][102898] Updated weights for policy 1, policy_version 57560 (0.0007) +[2023-10-08 14:04:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 117833728. Throughput: 0: 1785.6, 1: 1775.6. Samples: 29465088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:04:01,876][101941] Avg episode reward: [(0, '7.470'), (1, '8.820')] +[2023-10-08 14:04:03,869][102897] Updated weights for policy 0, policy_version 57510 (0.0008) +[2023-10-08 14:04:04,233][102897] Updated weights for policy 0, policy_version 57520 (0.0007) +[2023-10-08 14:04:04,600][102897] Updated weights for policy 0, policy_version 57530 (0.0007) +[2023-10-08 14:04:04,671][102898] Updated weights for policy 1, policy_version 57570 (0.0007) +[2023-10-08 14:04:05,034][102898] Updated weights for policy 1, policy_version 57580 (0.0008) +[2023-10-08 14:04:05,405][102898] Updated weights for policy 1, policy_version 57590 (0.0010) +[2023-10-08 14:04:05,776][102898] Updated weights for policy 1, policy_version 57600 (0.0007) +[2023-10-08 14:04:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 117899264. Throughput: 0: 1799.5, 1: 1791.5. Samples: 29476848. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:04:06,876][101941] Avg episode reward: [(0, '7.360'), (1, '8.090')] +[2023-10-08 14:04:08,304][102897] Updated weights for policy 0, policy_version 57540 (0.0009) +[2023-10-08 14:04:08,684][102897] Updated weights for policy 0, policy_version 57550 (0.0009) +[2023-10-08 14:04:09,045][102897] Updated weights for policy 0, policy_version 57560 (0.0008) +[2023-10-08 14:04:09,582][102898] Updated weights for policy 1, policy_version 57610 (0.0007) +[2023-10-08 14:04:09,942][102898] Updated weights for policy 1, policy_version 57620 (0.0007) +[2023-10-08 14:04:10,317][102898] Updated weights for policy 1, policy_version 57630 (0.0010) +[2023-10-08 14:04:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 117964800. Throughput: 0: 1788.7, 1: 1778.9. Samples: 29497236. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:04:11,876][101941] Avg episode reward: [(0, '7.640'), (1, '8.600')] +[2023-10-08 14:04:12,797][102897] Updated weights for policy 0, policy_version 57570 (0.0009) +[2023-10-08 14:04:13,179][102897] Updated weights for policy 0, policy_version 57580 (0.0009) +[2023-10-08 14:04:13,550][102897] Updated weights for policy 0, policy_version 57590 (0.0009) +[2023-10-08 14:04:13,914][102897] Updated weights for policy 0, policy_version 57600 (0.0008) +[2023-10-08 14:04:14,085][102898] Updated weights for policy 1, policy_version 57640 (0.0008) +[2023-10-08 14:04:14,451][102898] Updated weights for policy 1, policy_version 57650 (0.0009) +[2023-10-08 14:04:14,813][102898] Updated weights for policy 1, policy_version 57660 (0.0007) +[2023-10-08 14:04:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 118030336. Throughput: 0: 1793.5, 1: 1780.4. Samples: 29519780. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:04:16,876][101941] Avg episode reward: [(0, '7.730'), (1, '8.910')] +[2023-10-08 14:04:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000057664_59047936.pth... +[2023-10-08 14:04:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000057600_58982400.pth... +[2023-10-08 14:04:16,934][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000056000_57344000.pth +[2023-10-08 14:04:16,934][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000055936_57278464.pth +[2023-10-08 14:04:17,759][102897] Updated weights for policy 0, policy_version 57610 (0.0007) +[2023-10-08 14:04:18,136][102897] Updated weights for policy 0, policy_version 57620 (0.0007) +[2023-10-08 14:04:18,505][102897] Updated weights for policy 0, policy_version 57630 (0.0007) +[2023-10-08 14:04:18,674][102898] Updated weights for policy 1, policy_version 57670 (0.0008) +[2023-10-08 14:04:19,037][102898] Updated weights for policy 1, policy_version 57680 (0.0009) +[2023-10-08 14:04:19,403][102898] Updated weights for policy 1, policy_version 57690 (0.0007) +[2023-10-08 14:04:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 118095872. Throughput: 0: 1792.8, 1: 1784.4. Samples: 29529568. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:04:21,876][101941] Avg episode reward: [(0, '7.710'), (1, '8.810')] +[2023-10-08 14:04:22,406][102897] Updated weights for policy 0, policy_version 57640 (0.0008) +[2023-10-08 14:04:22,774][102897] Updated weights for policy 0, policy_version 57650 (0.0007) +[2023-10-08 14:04:23,152][102897] Updated weights for policy 0, policy_version 57660 (0.0007) +[2023-10-08 14:04:23,245][102898] Updated weights for policy 1, policy_version 57700 (0.0009) +[2023-10-08 14:04:23,608][102898] Updated weights for policy 1, policy_version 57710 (0.0009) +[2023-10-08 14:04:23,975][102898] Updated weights for policy 1, policy_version 57720 (0.0008) +[2023-10-08 14:04:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 118161408. Throughput: 0: 1782.7, 1: 1782.7. Samples: 29551480. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:04:26,876][101941] Avg episode reward: [(0, '8.410'), (1, '9.330')] +[2023-10-08 14:04:26,885][102897] Updated weights for policy 0, policy_version 57670 (0.0007) +[2023-10-08 14:04:27,259][102897] Updated weights for policy 0, policy_version 57680 (0.0007) +[2023-10-08 14:04:27,637][102897] Updated weights for policy 0, policy_version 57690 (0.0008) +[2023-10-08 14:04:27,869][102898] Updated weights for policy 1, policy_version 57730 (0.0008) +[2023-10-08 14:04:28,278][102898] Updated weights for policy 1, policy_version 57740 (0.0008) +[2023-10-08 14:04:28,640][102898] Updated weights for policy 1, policy_version 57750 (0.0008) +[2023-10-08 14:04:29,006][102898] Updated weights for policy 1, policy_version 57760 (0.0007) +[2023-10-08 14:04:31,373][102897] Updated weights for policy 0, policy_version 57700 (0.0008) +[2023-10-08 14:04:31,751][102897] Updated weights for policy 0, policy_version 57710 (0.0008) +[2023-10-08 14:04:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 118226944. Throughput: 0: 1809.2, 1: 1776.4. Samples: 29573528. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:04:31,876][101941] Avg episode reward: [(0, '7.850'), (1, '8.600')] +[2023-10-08 14:04:32,119][102897] Updated weights for policy 0, policy_version 57720 (0.0008) +[2023-10-08 14:04:32,811][102898] Updated weights for policy 1, policy_version 57770 (0.0009) +[2023-10-08 14:04:33,176][102898] Updated weights for policy 1, policy_version 57780 (0.0007) +[2023-10-08 14:04:33,545][102898] Updated weights for policy 1, policy_version 57790 (0.0008) +[2023-10-08 14:04:35,820][102897] Updated weights for policy 0, policy_version 57730 (0.0010) +[2023-10-08 14:04:36,197][102897] Updated weights for policy 0, policy_version 57740 (0.0010) +[2023-10-08 14:04:36,559][102897] Updated weights for policy 0, policy_version 57750 (0.0009) +[2023-10-08 14:04:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 118292480. Throughput: 0: 1782.2, 1: 1777.8. Samples: 29583430. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:04:36,876][101941] Avg episode reward: [(0, '7.310'), (1, '8.790')] +[2023-10-08 14:04:36,931][102897] Updated weights for policy 0, policy_version 57760 (0.0007) +[2023-10-08 14:04:37,340][102898] Updated weights for policy 1, policy_version 57800 (0.0008) +[2023-10-08 14:04:37,693][102898] Updated weights for policy 1, policy_version 57810 (0.0007) +[2023-10-08 14:04:38,065][102898] Updated weights for policy 1, policy_version 57820 (0.0007) +[2023-10-08 14:04:40,611][102897] Updated weights for policy 0, policy_version 57770 (0.0011) +[2023-10-08 14:04:40,984][102897] Updated weights for policy 0, policy_version 57780 (0.0009) +[2023-10-08 14:04:41,352][102897] Updated weights for policy 0, policy_version 57790 (0.0007) +[2023-10-08 14:04:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 118390784. Throughput: 0: 1806.9, 1: 1780.5. Samples: 29605868. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:04:41,875][101941] Avg episode reward: [(0, '7.850'), (1, '8.780')] +[2023-10-08 14:04:41,887][102898] Updated weights for policy 1, policy_version 57830 (0.0010) +[2023-10-08 14:04:42,257][102898] Updated weights for policy 1, policy_version 57840 (0.0011) +[2023-10-08 14:04:42,621][102898] Updated weights for policy 1, policy_version 57850 (0.0007) +[2023-10-08 14:04:44,910][102897] Updated weights for policy 0, policy_version 57800 (0.0008) +[2023-10-08 14:04:45,284][102897] Updated weights for policy 0, policy_version 57810 (0.0010) +[2023-10-08 14:04:45,649][102897] Updated weights for policy 0, policy_version 57820 (0.0010) +[2023-10-08 14:04:46,327][102898] Updated weights for policy 1, policy_version 57860 (0.0007) +[2023-10-08 14:04:46,690][102898] Updated weights for policy 1, policy_version 57870 (0.0009) +[2023-10-08 14:04:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 118456320. Throughput: 0: 1789.2, 1: 1805.3. Samples: 29626840. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:04:46,876][101941] Avg episode reward: [(0, '7.660'), (1, '8.680')] +[2023-10-08 14:04:47,055][102898] Updated weights for policy 1, policy_version 57880 (0.0008) +[2023-10-08 14:04:49,595][102897] Updated weights for policy 0, policy_version 57830 (0.0008) +[2023-10-08 14:04:49,967][102897] Updated weights for policy 0, policy_version 57840 (0.0009) +[2023-10-08 14:04:50,336][102897] Updated weights for policy 0, policy_version 57850 (0.0009) +[2023-10-08 14:04:50,896][102898] Updated weights for policy 1, policy_version 57890 (0.0010) +[2023-10-08 14:04:51,263][102898] Updated weights for policy 1, policy_version 57900 (0.0009) +[2023-10-08 14:04:51,631][102898] Updated weights for policy 1, policy_version 57910 (0.0009) +[2023-10-08 14:04:51,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 118521856. Throughput: 0: 1810.1, 1: 1779.0. Samples: 29638358. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:04:51,876][101941] Avg episode reward: [(0, '7.860'), (1, '8.600')] +[2023-10-08 14:04:51,994][102898] Updated weights for policy 1, policy_version 57920 (0.0007) +[2023-10-08 14:04:54,084][102897] Updated weights for policy 0, policy_version 57860 (0.0008) +[2023-10-08 14:04:54,447][102897] Updated weights for policy 0, policy_version 57870 (0.0007) +[2023-10-08 14:04:54,825][102897] Updated weights for policy 0, policy_version 57880 (0.0007) +[2023-10-08 14:04:55,659][102898] Updated weights for policy 1, policy_version 57930 (0.0007) +[2023-10-08 14:04:56,020][102898] Updated weights for policy 1, policy_version 57940 (0.0010) +[2023-10-08 14:04:56,392][102898] Updated weights for policy 1, policy_version 57950 (0.0010) +[2023-10-08 14:04:56,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 118620160. Throughput: 0: 1782.9, 1: 1811.0. Samples: 29658962. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:04:56,875][101941] Avg episode reward: [(0, '8.380'), (1, '8.620')] +[2023-10-08 14:04:58,547][102897] Updated weights for policy 0, policy_version 57890 (0.0007) +[2023-10-08 14:04:58,922][102897] Updated weights for policy 0, policy_version 57900 (0.0009) +[2023-10-08 14:04:59,281][102897] Updated weights for policy 0, policy_version 57910 (0.0009) +[2023-10-08 14:04:59,656][102897] Updated weights for policy 0, policy_version 57920 (0.0007) +[2023-10-08 14:05:00,116][102898] Updated weights for policy 1, policy_version 57960 (0.0007) +[2023-10-08 14:05:00,486][102898] Updated weights for policy 1, policy_version 57970 (0.0007) +[2023-10-08 14:05:00,858][102898] Updated weights for policy 1, policy_version 57980 (0.0008) +[2023-10-08 14:05:01,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 118685696. Throughput: 0: 1782.7, 1: 1783.3. Samples: 29680248. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:05:01,876][101941] Avg episode reward: [(0, '7.670'), (1, '8.410')] +[2023-10-08 14:05:03,543][102897] Updated weights for policy 0, policy_version 57930 (0.0009) +[2023-10-08 14:05:03,919][102897] Updated weights for policy 0, policy_version 57940 (0.0009) +[2023-10-08 14:05:04,282][102897] Updated weights for policy 0, policy_version 57950 (0.0008) +[2023-10-08 14:05:04,527][102898] Updated weights for policy 1, policy_version 57990 (0.0007) +[2023-10-08 14:05:04,895][102898] Updated weights for policy 1, policy_version 58000 (0.0008) +[2023-10-08 14:05:05,266][102898] Updated weights for policy 1, policy_version 58010 (0.0009) +[2023-10-08 14:05:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 118751232. Throughput: 0: 1786.7, 1: 1812.7. Samples: 29691542. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:05:06,876][101941] Avg episode reward: [(0, '7.190'), (1, '8.810')] +[2023-10-08 14:05:07,981][102897] Updated weights for policy 0, policy_version 57960 (0.0009) +[2023-10-08 14:05:08,365][102897] Updated weights for policy 0, policy_version 57970 (0.0008) +[2023-10-08 14:05:08,735][102897] Updated weights for policy 0, policy_version 57980 (0.0009) +[2023-10-08 14:05:08,967][102898] Updated weights for policy 1, policy_version 58020 (0.0009) +[2023-10-08 14:05:09,323][102898] Updated weights for policy 1, policy_version 58030 (0.0009) +[2023-10-08 14:05:09,686][102898] Updated weights for policy 1, policy_version 58040 (0.0009) +[2023-10-08 14:05:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 118816768. Throughput: 0: 1792.2, 1: 1792.3. Samples: 29712782. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:11,876][101941] Avg episode reward: [(0, '7.480'), (1, '8.490')] +[2023-10-08 14:05:12,483][102897] Updated weights for policy 0, policy_version 57990 (0.0011) +[2023-10-08 14:05:12,860][102897] Updated weights for policy 0, policy_version 58000 (0.0009) +[2023-10-08 14:05:13,222][102897] Updated weights for policy 0, policy_version 58010 (0.0009) +[2023-10-08 14:05:13,541][102898] Updated weights for policy 1, policy_version 58050 (0.0010) +[2023-10-08 14:05:13,960][102898] Updated weights for policy 1, policy_version 58060 (0.0009) +[2023-10-08 14:05:14,327][102898] Updated weights for policy 1, policy_version 58070 (0.0011) +[2023-10-08 14:05:14,692][102898] Updated weights for policy 1, policy_version 58080 (0.0008) +[2023-10-08 14:05:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 118882304. Throughput: 0: 1794.4, 1: 1792.4. Samples: 29734932. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:16,875][101941] Avg episode reward: [(0, '7.140'), (1, '8.880')] +[2023-10-08 14:05:17,036][102897] Updated weights for policy 0, policy_version 58020 (0.0007) +[2023-10-08 14:05:17,433][102897] Updated weights for policy 0, policy_version 58030 (0.0007) +[2023-10-08 14:05:17,801][102897] Updated weights for policy 0, policy_version 58040 (0.0007) +[2023-10-08 14:05:18,312][102898] Updated weights for policy 1, policy_version 58090 (0.0007) +[2023-10-08 14:05:18,679][102898] Updated weights for policy 1, policy_version 58100 (0.0008) +[2023-10-08 14:05:19,040][102898] Updated weights for policy 1, policy_version 58110 (0.0007) +[2023-10-08 14:05:21,432][102897] Updated weights for policy 0, policy_version 58050 (0.0008) +[2023-10-08 14:05:21,801][102897] Updated weights for policy 0, policy_version 58060 (0.0009) +[2023-10-08 14:05:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 118947840. Throughput: 0: 1786.4, 1: 1796.4. Samples: 29744652. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:21,876][101941] Avg episode reward: [(0, '7.490'), (1, '8.920')] +[2023-10-08 14:05:22,164][102897] Updated weights for policy 0, policy_version 58070 (0.0007) +[2023-10-08 14:05:22,545][102897] Updated weights for policy 0, policy_version 58080 (0.0008) +[2023-10-08 14:05:22,866][102898] Updated weights for policy 1, policy_version 58120 (0.0008) +[2023-10-08 14:05:23,233][102898] Updated weights for policy 1, policy_version 58130 (0.0008) +[2023-10-08 14:05:23,597][102898] Updated weights for policy 1, policy_version 58140 (0.0008) +[2023-10-08 14:05:26,318][102897] Updated weights for policy 0, policy_version 58090 (0.0008) +[2023-10-08 14:05:26,688][102897] Updated weights for policy 0, policy_version 58100 (0.0007) +[2023-10-08 14:05:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 119013376. Throughput: 0: 1790.9, 1: 1792.0. Samples: 29767102. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:26,876][101941] Avg episode reward: [(0, '7.800'), (1, '9.040')] +[2023-10-08 14:05:27,064][102897] Updated weights for policy 0, policy_version 58110 (0.0010) +[2023-10-08 14:05:27,294][102898] Updated weights for policy 1, policy_version 58150 (0.0008) +[2023-10-08 14:05:27,665][102898] Updated weights for policy 1, policy_version 58160 (0.0008) +[2023-10-08 14:05:28,030][102898] Updated weights for policy 1, policy_version 58170 (0.0009) +[2023-10-08 14:05:30,796][102897] Updated weights for policy 0, policy_version 58120 (0.0010) +[2023-10-08 14:05:31,168][102897] Updated weights for policy 0, policy_version 58130 (0.0009) +[2023-10-08 14:05:31,541][102897] Updated weights for policy 0, policy_version 58140 (0.0007) +[2023-10-08 14:05:31,863][102898] Updated weights for policy 1, policy_version 58180 (0.0008) +[2023-10-08 14:05:31,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 119111680. Throughput: 0: 1794.8, 1: 1794.9. Samples: 29788376. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:31,876][101941] Avg episode reward: [(0, '8.300'), (1, '9.380')] +[2023-10-08 14:05:32,239][102898] Updated weights for policy 1, policy_version 58190 (0.0007) +[2023-10-08 14:05:32,599][102898] Updated weights for policy 1, policy_version 58200 (0.0007) +[2023-10-08 14:05:35,092][102897] Updated weights for policy 0, policy_version 58150 (0.0007) +[2023-10-08 14:05:35,470][102897] Updated weights for policy 0, policy_version 58160 (0.0007) +[2023-10-08 14:05:35,838][102897] Updated weights for policy 0, policy_version 58170 (0.0007) +[2023-10-08 14:05:36,460][102898] Updated weights for policy 1, policy_version 58210 (0.0008) +[2023-10-08 14:05:36,823][102898] Updated weights for policy 1, policy_version 58220 (0.0008) +[2023-10-08 14:05:36,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 119177216. Throughput: 0: 1786.1, 1: 1785.4. Samples: 29799078. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:36,876][101941] Avg episode reward: [(0, '8.220'), (1, '8.730')] +[2023-10-08 14:05:37,191][102898] Updated weights for policy 1, policy_version 58230 (0.0009) +[2023-10-08 14:05:37,558][102898] Updated weights for policy 1, policy_version 58240 (0.0008) +[2023-10-08 14:05:39,569][102897] Updated weights for policy 0, policy_version 58180 (0.0008) +[2023-10-08 14:05:39,946][102897] Updated weights for policy 0, policy_version 58190 (0.0007) +[2023-10-08 14:05:40,309][102897] Updated weights for policy 0, policy_version 58200 (0.0007) +[2023-10-08 14:05:41,261][102898] Updated weights for policy 1, policy_version 58250 (0.0009) +[2023-10-08 14:05:41,621][102898] Updated weights for policy 1, policy_version 58260 (0.0009) +[2023-10-08 14:05:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 119242752. Throughput: 0: 1798.8, 1: 1789.4. Samples: 29820432. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:41,875][101941] Avg episode reward: [(0, '8.300'), (1, '8.790')] +[2023-10-08 14:05:41,988][102898] Updated weights for policy 1, policy_version 58270 (0.0007) +[2023-10-08 14:05:43,958][102897] Updated weights for policy 0, policy_version 58210 (0.0007) +[2023-10-08 14:05:44,327][102897] Updated weights for policy 0, policy_version 58220 (0.0008) +[2023-10-08 14:05:44,701][102897] Updated weights for policy 0, policy_version 58230 (0.0008) +[2023-10-08 14:05:45,066][102897] Updated weights for policy 0, policy_version 58240 (0.0011) +[2023-10-08 14:05:45,839][102898] Updated weights for policy 1, policy_version 58280 (0.0010) +[2023-10-08 14:05:46,199][102898] Updated weights for policy 1, policy_version 58290 (0.0008) +[2023-10-08 14:05:46,564][102898] Updated weights for policy 1, policy_version 58300 (0.0009) +[2023-10-08 14:05:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 119341056. Throughput: 0: 1791.9, 1: 1787.2. Samples: 29841304. Policy #0 lag: (min: 23.0, avg: 23.0, max: 23.0) +[2023-10-08 14:05:46,875][101941] Avg episode reward: [(0, '8.110'), (1, '8.420')] +[2023-10-08 14:05:48,849][102897] Updated weights for policy 0, policy_version 58250 (0.0007) +[2023-10-08 14:05:49,222][102897] Updated weights for policy 0, policy_version 58260 (0.0008) +[2023-10-08 14:05:49,595][102897] Updated weights for policy 0, policy_version 58270 (0.0008) +[2023-10-08 14:05:50,395][102898] Updated weights for policy 1, policy_version 58310 (0.0008) +[2023-10-08 14:05:50,761][102898] Updated weights for policy 1, policy_version 58320 (0.0008) +[2023-10-08 14:05:51,126][102898] Updated weights for policy 1, policy_version 58330 (0.0007) +[2023-10-08 14:05:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 119406592. Throughput: 0: 1798.3, 1: 1773.4. Samples: 29852266. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:05:51,876][101941] Avg episode reward: [(0, '8.420'), (1, '9.220')] +[2023-10-08 14:05:53,375][102897] Updated weights for policy 0, policy_version 58280 (0.0009) +[2023-10-08 14:05:53,749][102897] Updated weights for policy 0, policy_version 58290 (0.0008) +[2023-10-08 14:05:54,118][102897] Updated weights for policy 0, policy_version 58300 (0.0007) +[2023-10-08 14:05:54,963][102898] Updated weights for policy 1, policy_version 58340 (0.0007) +[2023-10-08 14:05:55,332][102898] Updated weights for policy 1, policy_version 58350 (0.0008) +[2023-10-08 14:05:55,688][102898] Updated weights for policy 1, policy_version 58360 (0.0009) +[2023-10-08 14:05:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 119472128. Throughput: 0: 1787.1, 1: 1786.2. Samples: 29873580. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:05:56,876][101941] Avg episode reward: [(0, '8.390'), (1, '8.730')] +[2023-10-08 14:05:57,805][102897] Updated weights for policy 0, policy_version 58310 (0.0007) +[2023-10-08 14:05:58,173][102897] Updated weights for policy 0, policy_version 58320 (0.0009) +[2023-10-08 14:05:58,552][102897] Updated weights for policy 0, policy_version 58330 (0.0008) +[2023-10-08 14:05:59,600][102898] Updated weights for policy 1, policy_version 58370 (0.0009) +[2023-10-08 14:06:00,003][102898] Updated weights for policy 1, policy_version 58380 (0.0007) +[2023-10-08 14:06:00,365][102898] Updated weights for policy 1, policy_version 58390 (0.0010) +[2023-10-08 14:06:00,736][102898] Updated weights for policy 1, policy_version 58400 (0.0007) +[2023-10-08 14:06:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 119537664. Throughput: 0: 1788.9, 1: 1770.1. Samples: 29895088. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:06:01,876][101941] Avg episode reward: [(0, '7.950'), (1, '8.580')] +[2023-10-08 14:06:02,554][102897] Updated weights for policy 0, policy_version 58340 (0.0010) +[2023-10-08 14:06:02,926][102897] Updated weights for policy 0, policy_version 58350 (0.0007) +[2023-10-08 14:06:03,292][102897] Updated weights for policy 0, policy_version 58360 (0.0007) +[2023-10-08 14:06:04,265][102898] Updated weights for policy 1, policy_version 58410 (0.0009) +[2023-10-08 14:06:04,629][102898] Updated weights for policy 1, policy_version 58420 (0.0008) +[2023-10-08 14:06:04,987][102898] Updated weights for policy 1, policy_version 58430 (0.0008) +[2023-10-08 14:06:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 119603200. Throughput: 0: 1788.6, 1: 1786.9. Samples: 29905550. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:06:06,875][101941] Avg episode reward: [(0, '8.110'), (1, '9.660')] +[2023-10-08 14:06:07,112][102897] Updated weights for policy 0, policy_version 58370 (0.0008) +[2023-10-08 14:06:07,484][102897] Updated weights for policy 0, policy_version 58380 (0.0008) +[2023-10-08 14:06:07,860][102897] Updated weights for policy 0, policy_version 58390 (0.0009) +[2023-10-08 14:06:08,227][102897] Updated weights for policy 0, policy_version 58400 (0.0011) +[2023-10-08 14:06:08,903][102898] Updated weights for policy 1, policy_version 58440 (0.0007) +[2023-10-08 14:06:09,270][102898] Updated weights for policy 1, policy_version 58450 (0.0008) +[2023-10-08 14:06:09,630][102898] Updated weights for policy 1, policy_version 58460 (0.0008) +[2023-10-08 14:06:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 119668736. Throughput: 0: 1781.2, 1: 1766.1. Samples: 29926730. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:06:11,876][101941] Avg episode reward: [(0, '7.660'), (1, '8.760')] +[2023-10-08 14:06:12,187][102897] Updated weights for policy 0, policy_version 58410 (0.0008) +[2023-10-08 14:06:12,563][102897] Updated weights for policy 0, policy_version 58420 (0.0007) +[2023-10-08 14:06:12,925][102897] Updated weights for policy 0, policy_version 58430 (0.0007) +[2023-10-08 14:06:13,469][102898] Updated weights for policy 1, policy_version 58470 (0.0009) +[2023-10-08 14:06:13,833][102898] Updated weights for policy 1, policy_version 58480 (0.0010) +[2023-10-08 14:06:14,208][102898] Updated weights for policy 1, policy_version 58490 (0.0012) +[2023-10-08 14:06:16,728][102897] Updated weights for policy 0, policy_version 58440 (0.0007) +[2023-10-08 14:06:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 119734272. Throughput: 0: 1803.9, 1: 1769.6. Samples: 29949184. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:06:16,875][101941] Avg episode reward: [(0, '7.490'), (1, '8.700')] +[2023-10-08 14:06:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000058496_59899904.pth... +[2023-10-08 14:06:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000056832_58195968.pth +[2023-10-08 14:06:16,928][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000058496_59899904.pth +[2023-10-08 14:06:17,098][102897] Updated weights for policy 0, policy_version 58450 (0.0008) +[2023-10-08 14:06:17,471][102897] Updated weights for policy 0, policy_version 58460 (0.0009) +[2023-10-08 14:06:17,621][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000058464_59867136.pth... +[2023-10-08 14:06:17,653][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000056768_58130432.pth +[2023-10-08 14:06:17,657][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000058464_59867136.pth +[2023-10-08 14:06:17,849][102898] Updated weights for policy 1, policy_version 58500 (0.0008) +[2023-10-08 14:06:18,213][102898] Updated weights for policy 1, policy_version 58510 (0.0010) +[2023-10-08 14:06:18,593][102898] Updated weights for policy 1, policy_version 58520 (0.0009) +[2023-10-08 14:06:21,091][102897] Updated weights for policy 0, policy_version 58470 (0.0008) +[2023-10-08 14:06:21,465][102897] Updated weights for policy 0, policy_version 58480 (0.0009) +[2023-10-08 14:06:21,829][102897] Updated weights for policy 0, policy_version 58490 (0.0009) +[2023-10-08 14:06:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 119799808. Throughput: 0: 1778.8, 1: 1773.1. Samples: 29958912. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:06:21,876][101941] Avg episode reward: [(0, '7.950'), (1, '8.340')] +[2023-10-08 14:06:22,482][102898] Updated weights for policy 1, policy_version 58530 (0.0009) +[2023-10-08 14:06:22,855][102898] Updated weights for policy 1, policy_version 58540 (0.0007) +[2023-10-08 14:06:23,210][102898] Updated weights for policy 1, policy_version 58550 (0.0007) +[2023-10-08 14:06:23,578][102898] Updated weights for policy 1, policy_version 58560 (0.0007) +[2023-10-08 14:06:25,504][102897] Updated weights for policy 0, policy_version 58500 (0.0010) +[2023-10-08 14:06:25,874][102897] Updated weights for policy 0, policy_version 58510 (0.0010) +[2023-10-08 14:06:26,247][102897] Updated weights for policy 0, policy_version 58520 (0.0009) +[2023-10-08 14:06:26,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 119898112. Throughput: 0: 1809.0, 1: 1766.0. Samples: 29981310. Policy #0 lag: (min: 31.0, avg: 47.8, max: 63.0) +[2023-10-08 14:06:26,876][101941] Avg episode reward: [(0, '8.340'), (1, '8.940')] +[2023-10-08 14:06:27,431][102898] Updated weights for policy 1, policy_version 58570 (0.0009) +[2023-10-08 14:06:27,799][102898] Updated weights for policy 1, policy_version 58580 (0.0009) +[2023-10-08 14:06:28,169][102898] Updated weights for policy 1, policy_version 58590 (0.0008) +[2023-10-08 14:06:30,052][102897] Updated weights for policy 0, policy_version 58530 (0.0008) +[2023-10-08 14:06:30,424][102897] Updated weights for policy 0, policy_version 58540 (0.0008) +[2023-10-08 14:06:30,789][102897] Updated weights for policy 0, policy_version 58550 (0.0007) +[2023-10-08 14:06:31,162][102897] Updated weights for policy 0, policy_version 58560 (0.0008) +[2023-10-08 14:06:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 119963648. Throughput: 0: 1784.5, 1: 1797.1. Samples: 30002476. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:06:31,876][101941] Avg episode reward: [(0, '7.770'), (1, '9.080')] +[2023-10-08 14:06:31,878][102898] Updated weights for policy 1, policy_version 58600 (0.0007) +[2023-10-08 14:06:32,247][102898] Updated weights for policy 1, policy_version 58610 (0.0009) +[2023-10-08 14:06:32,617][102898] Updated weights for policy 1, policy_version 58620 (0.0008) +[2023-10-08 14:06:34,988][102897] Updated weights for policy 0, policy_version 58570 (0.0010) +[2023-10-08 14:06:35,361][102897] Updated weights for policy 0, policy_version 58580 (0.0008) +[2023-10-08 14:06:35,728][102897] Updated weights for policy 0, policy_version 58590 (0.0008) +[2023-10-08 14:06:36,341][102898] Updated weights for policy 1, policy_version 58630 (0.0008) +[2023-10-08 14:06:36,709][102898] Updated weights for policy 1, policy_version 58640 (0.0008) +[2023-10-08 14:06:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 120029184. Throughput: 0: 1807.5, 1: 1778.3. Samples: 30013626. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:06:36,875][101941] Avg episode reward: [(0, '7.410'), (1, '9.210')] +[2023-10-08 14:06:37,072][102898] Updated weights for policy 1, policy_version 58650 (0.0008) +[2023-10-08 14:06:39,374][102897] Updated weights for policy 0, policy_version 58600 (0.0008) +[2023-10-08 14:06:39,746][102897] Updated weights for policy 0, policy_version 58610 (0.0007) +[2023-10-08 14:06:40,120][102897] Updated weights for policy 0, policy_version 58620 (0.0009) +[2023-10-08 14:06:40,749][102898] Updated weights for policy 1, policy_version 58660 (0.0007) +[2023-10-08 14:06:41,113][102898] Updated weights for policy 1, policy_version 58670 (0.0009) +[2023-10-08 14:06:41,491][102898] Updated weights for policy 1, policy_version 58680 (0.0009) +[2023-10-08 14:06:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 120127488. Throughput: 0: 1783.7, 1: 1797.6. Samples: 30034740. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:06:41,875][101941] Avg episode reward: [(0, '7.730'), (1, '9.610')] +[2023-10-08 14:06:43,930][102897] Updated weights for policy 0, policy_version 58630 (0.0008) +[2023-10-08 14:06:44,305][102897] Updated weights for policy 0, policy_version 58640 (0.0007) +[2023-10-08 14:06:44,676][102897] Updated weights for policy 0, policy_version 58650 (0.0009) +[2023-10-08 14:06:45,370][102898] Updated weights for policy 1, policy_version 58690 (0.0008) +[2023-10-08 14:06:45,759][102898] Updated weights for policy 1, policy_version 58700 (0.0009) +[2023-10-08 14:06:46,119][102898] Updated weights for policy 1, policy_version 58710 (0.0010) +[2023-10-08 14:06:46,482][102898] Updated weights for policy 1, policy_version 58720 (0.0008) +[2023-10-08 14:06:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 120193024. Throughput: 0: 1785.6, 1: 1784.3. Samples: 30055732. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:06:46,876][101941] Avg episode reward: [(0, '7.640'), (1, '9.150')] +[2023-10-08 14:06:48,471][102897] Updated weights for policy 0, policy_version 58660 (0.0008) +[2023-10-08 14:06:48,851][102897] Updated weights for policy 0, policy_version 58670 (0.0008) +[2023-10-08 14:06:49,225][102897] Updated weights for policy 0, policy_version 58680 (0.0007) +[2023-10-08 14:06:50,156][102898] Updated weights for policy 1, policy_version 58730 (0.0009) +[2023-10-08 14:06:50,517][102898] Updated weights for policy 1, policy_version 58740 (0.0010) +[2023-10-08 14:06:50,870][102898] Updated weights for policy 1, policy_version 58750 (0.0010) +[2023-10-08 14:06:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 120258560. Throughput: 0: 1787.5, 1: 1798.7. Samples: 30066930. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:06:51,876][101941] Avg episode reward: [(0, '7.460'), (1, '7.730')] +[2023-10-08 14:06:52,891][102897] Updated weights for policy 0, policy_version 58690 (0.0007) +[2023-10-08 14:06:53,261][102897] Updated weights for policy 0, policy_version 58700 (0.0009) +[2023-10-08 14:06:53,639][102897] Updated weights for policy 0, policy_version 58710 (0.0007) +[2023-10-08 14:06:54,011][102897] Updated weights for policy 0, policy_version 58720 (0.0010) +[2023-10-08 14:06:54,665][102898] Updated weights for policy 1, policy_version 58760 (0.0009) +[2023-10-08 14:06:55,035][102898] Updated weights for policy 1, policy_version 58770 (0.0008) +[2023-10-08 14:06:55,400][102898] Updated weights for policy 1, policy_version 58780 (0.0008) +[2023-10-08 14:06:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 120324096. Throughput: 0: 1790.8, 1: 1790.8. Samples: 30087904. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:06:56,876][101941] Avg episode reward: [(0, '8.110'), (1, '8.300')] +[2023-10-08 14:06:57,709][102897] Updated weights for policy 0, policy_version 58730 (0.0008) +[2023-10-08 14:06:58,085][102897] Updated weights for policy 0, policy_version 58740 (0.0008) +[2023-10-08 14:06:58,454][102897] Updated weights for policy 0, policy_version 58750 (0.0010) +[2023-10-08 14:06:59,236][102898] Updated weights for policy 1, policy_version 58790 (0.0011) +[2023-10-08 14:06:59,594][102898] Updated weights for policy 1, policy_version 58800 (0.0010) +[2023-10-08 14:06:59,956][102898] Updated weights for policy 1, policy_version 58810 (0.0009) +[2023-10-08 14:07:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 120389632. Throughput: 0: 1792.6, 1: 1784.7. Samples: 30110160. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:07:01,876][101941] Avg episode reward: [(0, '7.670'), (1, '9.240')] +[2023-10-08 14:07:02,218][102897] Updated weights for policy 0, policy_version 58760 (0.0009) +[2023-10-08 14:07:02,594][102897] Updated weights for policy 0, policy_version 58770 (0.0009) +[2023-10-08 14:07:02,966][102897] Updated weights for policy 0, policy_version 58780 (0.0007) +[2023-10-08 14:07:03,703][102898] Updated weights for policy 1, policy_version 58820 (0.0008) +[2023-10-08 14:07:04,069][102898] Updated weights for policy 1, policy_version 58830 (0.0008) +[2023-10-08 14:07:04,442][102898] Updated weights for policy 1, policy_version 58840 (0.0007) +[2023-10-08 14:07:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 120455168. Throughput: 0: 1792.0, 1: 1792.5. Samples: 30120214. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:07:06,875][101941] Avg episode reward: [(0, '7.510'), (1, '9.350')] +[2023-10-08 14:07:06,888][102897] Updated weights for policy 0, policy_version 58790 (0.0011) +[2023-10-08 14:07:07,253][102897] Updated weights for policy 0, policy_version 58800 (0.0007) +[2023-10-08 14:07:07,628][102897] Updated weights for policy 0, policy_version 58810 (0.0008) +[2023-10-08 14:07:08,185][102898] Updated weights for policy 1, policy_version 58850 (0.0008) +[2023-10-08 14:07:08,548][102898] Updated weights for policy 1, policy_version 58860 (0.0010) +[2023-10-08 14:07:08,917][102898] Updated weights for policy 1, policy_version 58870 (0.0009) +[2023-10-08 14:07:09,273][102898] Updated weights for policy 1, policy_version 58880 (0.0009) +[2023-10-08 14:07:11,485][102897] Updated weights for policy 0, policy_version 58820 (0.0009) +[2023-10-08 14:07:11,859][102897] Updated weights for policy 0, policy_version 58830 (0.0009) +[2023-10-08 14:07:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 120520704. Throughput: 0: 1779.1, 1: 1791.5. Samples: 30141988. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 14:07:11,875][101941] Avg episode reward: [(0, '8.210'), (1, '9.170')] +[2023-10-08 14:07:12,228][102897] Updated weights for policy 0, policy_version 58840 (0.0007) +[2023-10-08 14:07:13,048][102898] Updated weights for policy 1, policy_version 58890 (0.0009) +[2023-10-08 14:07:13,424][102898] Updated weights for policy 1, policy_version 58900 (0.0008) +[2023-10-08 14:07:13,778][102898] Updated weights for policy 1, policy_version 58910 (0.0008) +[2023-10-08 14:07:15,954][102897] Updated weights for policy 0, policy_version 58850 (0.0008) +[2023-10-08 14:07:16,324][102897] Updated weights for policy 0, policy_version 58860 (0.0009) +[2023-10-08 14:07:16,697][102897] Updated weights for policy 0, policy_version 58870 (0.0007) +[2023-10-08 14:07:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 120586240. Throughput: 0: 1795.0, 1: 1789.9. Samples: 30163798. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:16,876][101941] Avg episode reward: [(0, '8.270'), (1, '9.410')] +[2023-10-08 14:07:17,059][102897] Updated weights for policy 0, policy_version 58880 (0.0010) +[2023-10-08 14:07:17,451][102898] Updated weights for policy 1, policy_version 58920 (0.0007) +[2023-10-08 14:07:17,822][102898] Updated weights for policy 1, policy_version 58930 (0.0009) +[2023-10-08 14:07:18,191][102898] Updated weights for policy 1, policy_version 58940 (0.0007) +[2023-10-08 14:07:20,768][102897] Updated weights for policy 0, policy_version 58890 (0.0008) +[2023-10-08 14:07:21,143][102897] Updated weights for policy 0, policy_version 58900 (0.0010) +[2023-10-08 14:07:21,512][102897] Updated weights for policy 0, policy_version 58910 (0.0008) +[2023-10-08 14:07:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 120684544. Throughput: 0: 1779.9, 1: 1793.1. Samples: 30174408. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:21,876][101941] Avg episode reward: [(0, '8.630'), (1, '9.630')] +[2023-10-08 14:07:21,948][102898] Updated weights for policy 1, policy_version 58950 (0.0010) +[2023-10-08 14:07:22,314][102898] Updated weights for policy 1, policy_version 58960 (0.0008) +[2023-10-08 14:07:22,681][102898] Updated weights for policy 1, policy_version 58970 (0.0008) +[2023-10-08 14:07:25,260][102897] Updated weights for policy 0, policy_version 58920 (0.0010) +[2023-10-08 14:07:25,635][102897] Updated weights for policy 0, policy_version 58930 (0.0010) +[2023-10-08 14:07:25,996][102897] Updated weights for policy 0, policy_version 58940 (0.0007) +[2023-10-08 14:07:26,523][102898] Updated weights for policy 1, policy_version 58980 (0.0008) +[2023-10-08 14:07:26,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 120750080. Throughput: 0: 1796.3, 1: 1789.1. Samples: 30196082. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:26,875][101941] Avg episode reward: [(0, '7.870'), (1, '9.510')] +[2023-10-08 14:07:26,893][102898] Updated weights for policy 1, policy_version 58990 (0.0007) +[2023-10-08 14:07:27,250][102898] Updated weights for policy 1, policy_version 59000 (0.0007) +[2023-10-08 14:07:29,880][102897] Updated weights for policy 0, policy_version 58950 (0.0008) +[2023-10-08 14:07:30,249][102897] Updated weights for policy 0, policy_version 58960 (0.0008) +[2023-10-08 14:07:30,616][102897] Updated weights for policy 0, policy_version 58970 (0.0010) +[2023-10-08 14:07:31,149][102898] Updated weights for policy 1, policy_version 59010 (0.0007) +[2023-10-08 14:07:31,556][102898] Updated weights for policy 1, policy_version 59020 (0.0009) +[2023-10-08 14:07:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 120815616. Throughput: 0: 1773.2, 1: 1814.0. Samples: 30217156. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:31,876][101941] Avg episode reward: [(0, '7.760'), (1, '8.900')] +[2023-10-08 14:07:31,920][102898] Updated weights for policy 1, policy_version 59030 (0.0010) +[2023-10-08 14:07:32,285][102898] Updated weights for policy 1, policy_version 59040 (0.0009) +[2023-10-08 14:07:34,363][102897] Updated weights for policy 0, policy_version 58980 (0.0009) +[2023-10-08 14:07:34,736][102897] Updated weights for policy 0, policy_version 58990 (0.0010) +[2023-10-08 14:07:35,105][102897] Updated weights for policy 0, policy_version 59000 (0.0009) +[2023-10-08 14:07:36,047][102898] Updated weights for policy 1, policy_version 59050 (0.0010) +[2023-10-08 14:07:36,416][102898] Updated weights for policy 1, policy_version 59060 (0.0008) +[2023-10-08 14:07:36,781][102898] Updated weights for policy 1, policy_version 59070 (0.0011) +[2023-10-08 14:07:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 120913920. Throughput: 0: 1801.7, 1: 1787.9. Samples: 30228462. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:36,876][101941] Avg episode reward: [(0, '7.570'), (1, '8.380')] +[2023-10-08 14:07:38,792][102897] Updated weights for policy 0, policy_version 59010 (0.0011) +[2023-10-08 14:07:39,150][102897] Updated weights for policy 0, policy_version 59020 (0.0009) +[2023-10-08 14:07:39,529][102897] Updated weights for policy 0, policy_version 59030 (0.0009) +[2023-10-08 14:07:39,893][102897] Updated weights for policy 0, policy_version 59040 (0.0011) +[2023-10-08 14:07:40,473][102898] Updated weights for policy 1, policy_version 59080 (0.0010) +[2023-10-08 14:07:40,825][102898] Updated weights for policy 1, policy_version 59090 (0.0010) +[2023-10-08 14:07:41,187][102898] Updated weights for policy 1, policy_version 59100 (0.0010) +[2023-10-08 14:07:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 120979456. Throughput: 0: 1774.6, 1: 1811.3. Samples: 30249270. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:41,876][101941] Avg episode reward: [(0, '7.950'), (1, '9.430')] +[2023-10-08 14:07:43,681][102897] Updated weights for policy 0, policy_version 59050 (0.0008) +[2023-10-08 14:07:44,050][102897] Updated weights for policy 0, policy_version 59060 (0.0008) +[2023-10-08 14:07:44,417][102897] Updated weights for policy 0, policy_version 59070 (0.0007) +[2023-10-08 14:07:44,820][102898] Updated weights for policy 1, policy_version 59110 (0.0009) +[2023-10-08 14:07:45,183][102898] Updated weights for policy 1, policy_version 59120 (0.0008) +[2023-10-08 14:07:45,548][102898] Updated weights for policy 1, policy_version 59130 (0.0009) +[2023-10-08 14:07:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 121044992. Throughput: 0: 1770.1, 1: 1797.1. Samples: 30270686. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:46,876][101941] Avg episode reward: [(0, '8.650'), (1, '9.650')] +[2023-10-08 14:07:48,166][102897] Updated weights for policy 0, policy_version 59080 (0.0008) +[2023-10-08 14:07:48,540][102897] Updated weights for policy 0, policy_version 59090 (0.0008) +[2023-10-08 14:07:48,904][102897] Updated weights for policy 0, policy_version 59100 (0.0008) +[2023-10-08 14:07:49,293][102898] Updated weights for policy 1, policy_version 59140 (0.0007) +[2023-10-08 14:07:49,661][102898] Updated weights for policy 1, policy_version 59150 (0.0008) +[2023-10-08 14:07:50,019][102898] Updated weights for policy 1, policy_version 59160 (0.0008) +[2023-10-08 14:07:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 121110528. Throughput: 0: 1770.3, 1: 1813.1. Samples: 30281468. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:07:51,876][101941] Avg episode reward: [(0, '8.070'), (1, '8.540')] +[2023-10-08 14:07:52,736][102897] Updated weights for policy 0, policy_version 59110 (0.0007) +[2023-10-08 14:07:53,100][102897] Updated weights for policy 0, policy_version 59120 (0.0007) +[2023-10-08 14:07:53,470][102897] Updated weights for policy 0, policy_version 59130 (0.0008) +[2023-10-08 14:07:53,770][102898] Updated weights for policy 1, policy_version 59170 (0.0009) +[2023-10-08 14:07:54,136][102898] Updated weights for policy 1, policy_version 59180 (0.0009) +[2023-10-08 14:07:54,494][102898] Updated weights for policy 1, policy_version 59190 (0.0008) +[2023-10-08 14:07:54,859][102898] Updated weights for policy 1, policy_version 59200 (0.0009) +[2023-10-08 14:07:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 121176064. Throughput: 0: 1777.7, 1: 1793.3. Samples: 30302686. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:07:56,876][101941] Avg episode reward: [(0, '7.150'), (1, '8.760')] +[2023-10-08 14:07:57,301][102897] Updated weights for policy 0, policy_version 59140 (0.0010) +[2023-10-08 14:07:57,667][102897] Updated weights for policy 0, policy_version 59150 (0.0010) +[2023-10-08 14:07:58,037][102897] Updated weights for policy 0, policy_version 59160 (0.0007) +[2023-10-08 14:07:58,713][102898] Updated weights for policy 1, policy_version 59210 (0.0007) +[2023-10-08 14:07:59,083][102898] Updated weights for policy 1, policy_version 59220 (0.0008) +[2023-10-08 14:07:59,449][102898] Updated weights for policy 1, policy_version 59230 (0.0007) +[2023-10-08 14:08:01,855][102897] Updated weights for policy 0, policy_version 59170 (0.0010) +[2023-10-08 14:08:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 121241600. Throughput: 0: 1792.1, 1: 1792.1. Samples: 30325088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:01,876][101941] Avg episode reward: [(0, '7.650'), (1, '9.550')] +[2023-10-08 14:08:02,222][102897] Updated weights for policy 0, policy_version 59180 (0.0008) +[2023-10-08 14:08:02,582][102897] Updated weights for policy 0, policy_version 59190 (0.0010) +[2023-10-08 14:08:02,953][102897] Updated weights for policy 0, policy_version 59200 (0.0010) +[2023-10-08 14:08:03,016][102898] Updated weights for policy 1, policy_version 59240 (0.0008) +[2023-10-08 14:08:03,385][102898] Updated weights for policy 1, policy_version 59250 (0.0009) +[2023-10-08 14:08:03,755][102898] Updated weights for policy 1, policy_version 59260 (0.0007) +[2023-10-08 14:08:06,796][102897] Updated weights for policy 0, policy_version 59210 (0.0007) +[2023-10-08 14:08:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 121307136. Throughput: 0: 1775.7, 1: 1789.9. Samples: 30334858. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:06,876][101941] Avg episode reward: [(0, '8.090'), (1, '9.110')] +[2023-10-08 14:08:07,163][102897] Updated weights for policy 0, policy_version 59220 (0.0008) +[2023-10-08 14:08:07,530][102897] Updated weights for policy 0, policy_version 59230 (0.0007) +[2023-10-08 14:08:07,551][102898] Updated weights for policy 1, policy_version 59270 (0.0009) +[2023-10-08 14:08:07,917][102898] Updated weights for policy 1, policy_version 59280 (0.0010) +[2023-10-08 14:08:08,287][102898] Updated weights for policy 1, policy_version 59290 (0.0010) +[2023-10-08 14:08:11,335][102897] Updated weights for policy 0, policy_version 59240 (0.0008) +[2023-10-08 14:08:11,708][102897] Updated weights for policy 0, policy_version 59250 (0.0008) +[2023-10-08 14:08:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 121372672. Throughput: 0: 1785.9, 1: 1790.0. Samples: 30357000. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:11,876][101941] Avg episode reward: [(0, '8.080'), (1, '8.320')] +[2023-10-08 14:08:12,083][102897] Updated weights for policy 0, policy_version 59260 (0.0008) +[2023-10-08 14:08:12,220][102898] Updated weights for policy 1, policy_version 59300 (0.0008) +[2023-10-08 14:08:12,590][102898] Updated weights for policy 1, policy_version 59310 (0.0008) +[2023-10-08 14:08:12,961][102898] Updated weights for policy 1, policy_version 59320 (0.0007) +[2023-10-08 14:08:15,846][102897] Updated weights for policy 0, policy_version 59270 (0.0009) +[2023-10-08 14:08:16,214][102897] Updated weights for policy 0, policy_version 59280 (0.0008) +[2023-10-08 14:08:16,596][102897] Updated weights for policy 0, policy_version 59290 (0.0008) +[2023-10-08 14:08:16,755][102898] Updated weights for policy 1, policy_version 59330 (0.0007) +[2023-10-08 14:08:16,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 121470976. Throughput: 0: 1786.0, 1: 1799.6. Samples: 30378504. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:16,875][101941] Avg episode reward: [(0, '8.060'), (1, '8.370')] +[2023-10-08 14:08:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000059296_60719104.pth... +[2023-10-08 14:08:16,918][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000057600_58982400.pth +[2023-10-08 14:08:17,152][102898] Updated weights for policy 1, policy_version 59340 (0.0007) +[2023-10-08 14:08:17,521][102898] Updated weights for policy 1, policy_version 59350 (0.0008) +[2023-10-08 14:08:17,879][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000059360_60784640.pth... +[2023-10-08 14:08:17,884][102898] Updated weights for policy 1, policy_version 59360 (0.0007) +[2023-10-08 14:08:17,909][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000057664_59047936.pth +[2023-10-08 14:08:20,312][102897] Updated weights for policy 0, policy_version 59300 (0.0010) +[2023-10-08 14:08:20,706][102897] Updated weights for policy 0, policy_version 59310 (0.0010) +[2023-10-08 14:08:21,076][102897] Updated weights for policy 0, policy_version 59320 (0.0009) +[2023-10-08 14:08:21,694][102898] Updated weights for policy 1, policy_version 59370 (0.0009) +[2023-10-08 14:08:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 121536512. Throughput: 0: 1778.4, 1: 1785.9. Samples: 30388854. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:21,876][101941] Avg episode reward: [(0, '7.860'), (1, '9.020')] +[2023-10-08 14:08:22,071][102898] Updated weights for policy 1, policy_version 59380 (0.0011) +[2023-10-08 14:08:22,441][102898] Updated weights for policy 1, policy_version 59390 (0.0008) +[2023-10-08 14:08:24,950][102897] Updated weights for policy 0, policy_version 59330 (0.0008) +[2023-10-08 14:08:25,326][102897] Updated weights for policy 0, policy_version 59340 (0.0007) +[2023-10-08 14:08:25,693][102897] Updated weights for policy 0, policy_version 59350 (0.0007) +[2023-10-08 14:08:26,069][102897] Updated weights for policy 0, policy_version 59360 (0.0009) +[2023-10-08 14:08:26,290][102898] Updated weights for policy 1, policy_version 59400 (0.0009) +[2023-10-08 14:08:26,646][102898] Updated weights for policy 1, policy_version 59410 (0.0008) +[2023-10-08 14:08:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 121602048. Throughput: 0: 1786.8, 1: 1792.5. Samples: 30410340. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:26,875][101941] Avg episode reward: [(0, '7.830'), (1, '9.790')] +[2023-10-08 14:08:27,014][102898] Updated weights for policy 1, policy_version 59420 (0.0009) +[2023-10-08 14:08:29,766][102897] Updated weights for policy 0, policy_version 59370 (0.0007) +[2023-10-08 14:08:30,132][102897] Updated weights for policy 0, policy_version 59380 (0.0007) +[2023-10-08 14:08:30,502][102897] Updated weights for policy 0, policy_version 59390 (0.0008) +[2023-10-08 14:08:30,841][102898] Updated weights for policy 1, policy_version 59430 (0.0007) +[2023-10-08 14:08:31,213][102898] Updated weights for policy 1, policy_version 59440 (0.0010) +[2023-10-08 14:08:31,583][102898] Updated weights for policy 1, policy_version 59450 (0.0007) +[2023-10-08 14:08:31,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 121700352. Throughput: 0: 1774.4, 1: 1785.2. Samples: 30430866. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:31,875][101941] Avg episode reward: [(0, '7.640'), (1, '9.390')] +[2023-10-08 14:08:34,352][102897] Updated weights for policy 0, policy_version 59400 (0.0007) +[2023-10-08 14:08:34,734][102897] Updated weights for policy 0, policy_version 59410 (0.0007) +[2023-10-08 14:08:35,102][102897] Updated weights for policy 0, policy_version 59420 (0.0009) +[2023-10-08 14:08:35,293][102898] Updated weights for policy 1, policy_version 59460 (0.0008) +[2023-10-08 14:08:35,647][102898] Updated weights for policy 1, policy_version 59470 (0.0008) +[2023-10-08 14:08:36,019][102898] Updated weights for policy 1, policy_version 59480 (0.0009) +[2023-10-08 14:08:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 121765888. Throughput: 0: 1797.8, 1: 1784.0. Samples: 30442646. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:36,875][101941] Avg episode reward: [(0, '7.510'), (1, '9.320')] +[2023-10-08 14:08:38,741][102897] Updated weights for policy 0, policy_version 59430 (0.0009) +[2023-10-08 14:08:39,110][102897] Updated weights for policy 0, policy_version 59440 (0.0007) +[2023-10-08 14:08:39,479][102897] Updated weights for policy 0, policy_version 59450 (0.0007) +[2023-10-08 14:08:39,674][102898] Updated weights for policy 1, policy_version 59490 (0.0008) +[2023-10-08 14:08:40,031][102898] Updated weights for policy 1, policy_version 59500 (0.0007) +[2023-10-08 14:08:40,412][102898] Updated weights for policy 1, policy_version 59510 (0.0009) +[2023-10-08 14:08:40,773][102898] Updated weights for policy 1, policy_version 59520 (0.0010) +[2023-10-08 14:08:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 121831424. Throughput: 0: 1779.9, 1: 1792.4. Samples: 30463440. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:41,876][101941] Avg episode reward: [(0, '8.080'), (1, '9.350')] +[2023-10-08 14:08:43,148][102897] Updated weights for policy 0, policy_version 59460 (0.0007) +[2023-10-08 14:08:43,515][102897] Updated weights for policy 0, policy_version 59470 (0.0007) +[2023-10-08 14:08:43,879][102897] Updated weights for policy 0, policy_version 59480 (0.0009) +[2023-10-08 14:08:44,414][102898] Updated weights for policy 1, policy_version 59530 (0.0008) +[2023-10-08 14:08:44,786][102898] Updated weights for policy 1, policy_version 59540 (0.0011) +[2023-10-08 14:08:45,157][102898] Updated weights for policy 1, policy_version 59550 (0.0008) +[2023-10-08 14:08:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 121896960. Throughput: 0: 1777.8, 1: 1784.6. Samples: 30485394. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:46,876][101941] Avg episode reward: [(0, '8.250'), (1, '8.500')] +[2023-10-08 14:08:47,545][102897] Updated weights for policy 0, policy_version 59490 (0.0008) +[2023-10-08 14:08:47,916][102897] Updated weights for policy 0, policy_version 59500 (0.0008) +[2023-10-08 14:08:48,295][102897] Updated weights for policy 0, policy_version 59510 (0.0008) +[2023-10-08 14:08:48,666][102897] Updated weights for policy 0, policy_version 59520 (0.0008) +[2023-10-08 14:08:48,916][102898] Updated weights for policy 1, policy_version 59560 (0.0009) +[2023-10-08 14:08:49,280][102898] Updated weights for policy 1, policy_version 59570 (0.0008) +[2023-10-08 14:08:49,650][102898] Updated weights for policy 1, policy_version 59580 (0.0007) +[2023-10-08 14:08:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 121962496. Throughput: 0: 1779.5, 1: 1794.5. Samples: 30495688. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:51,875][101941] Avg episode reward: [(0, '8.330'), (1, '8.540')] +[2023-10-08 14:08:52,630][102897] Updated weights for policy 0, policy_version 59530 (0.0010) +[2023-10-08 14:08:52,997][102897] Updated weights for policy 0, policy_version 59540 (0.0008) +[2023-10-08 14:08:53,289][102898] Updated weights for policy 1, policy_version 59590 (0.0007) +[2023-10-08 14:08:53,368][102897] Updated weights for policy 0, policy_version 59550 (0.0008) +[2023-10-08 14:08:53,658][102898] Updated weights for policy 1, policy_version 59600 (0.0007) +[2023-10-08 14:08:54,021][102898] Updated weights for policy 1, policy_version 59610 (0.0007) +[2023-10-08 14:08:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 122028032. Throughput: 0: 1779.5, 1: 1789.7. Samples: 30517614. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:08:56,876][101941] Avg episode reward: [(0, '7.750'), (1, '8.460')] +[2023-10-08 14:08:57,075][102897] Updated weights for policy 0, policy_version 59560 (0.0009) +[2023-10-08 14:08:57,445][102897] Updated weights for policy 0, policy_version 59570 (0.0009) +[2023-10-08 14:08:57,751][102898] Updated weights for policy 1, policy_version 59620 (0.0008) +[2023-10-08 14:08:57,822][102897] Updated weights for policy 0, policy_version 59580 (0.0008) +[2023-10-08 14:08:58,116][102898] Updated weights for policy 1, policy_version 59630 (0.0009) +[2023-10-08 14:08:58,489][102898] Updated weights for policy 1, policy_version 59640 (0.0009) +[2023-10-08 14:09:01,571][102897] Updated weights for policy 0, policy_version 59590 (0.0008) +[2023-10-08 14:09:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 122093568. Throughput: 0: 1795.5, 1: 1787.2. Samples: 30539728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:01,875][101941] Avg episode reward: [(0, '8.110'), (1, '8.500')] +[2023-10-08 14:09:01,933][102897] Updated weights for policy 0, policy_version 59600 (0.0010) +[2023-10-08 14:09:02,308][102897] Updated weights for policy 0, policy_version 59610 (0.0008) +[2023-10-08 14:09:02,405][102898] Updated weights for policy 1, policy_version 59650 (0.0007) +[2023-10-08 14:09:02,813][102898] Updated weights for policy 1, policy_version 59660 (0.0007) +[2023-10-08 14:09:03,189][102898] Updated weights for policy 1, policy_version 59670 (0.0007) +[2023-10-08 14:09:03,550][102898] Updated weights for policy 1, policy_version 59680 (0.0008) +[2023-10-08 14:09:06,281][102897] Updated weights for policy 0, policy_version 59620 (0.0008) +[2023-10-08 14:09:06,665][102897] Updated weights for policy 0, policy_version 59630 (0.0007) +[2023-10-08 14:09:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 122159104. Throughput: 0: 1775.1, 1: 1790.4. Samples: 30549302. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:06,875][101941] Avg episode reward: [(0, '7.890'), (1, '8.970')] +[2023-10-08 14:09:07,042][102897] Updated weights for policy 0, policy_version 59640 (0.0007) +[2023-10-08 14:09:07,293][102898] Updated weights for policy 1, policy_version 59690 (0.0008) +[2023-10-08 14:09:07,657][102898] Updated weights for policy 1, policy_version 59700 (0.0008) +[2023-10-08 14:09:08,023][102898] Updated weights for policy 1, policy_version 59710 (0.0008) +[2023-10-08 14:09:10,887][102897] Updated weights for policy 0, policy_version 59650 (0.0008) +[2023-10-08 14:09:11,254][102897] Updated weights for policy 0, policy_version 59660 (0.0010) +[2023-10-08 14:09:11,587][102898] Updated weights for policy 1, policy_version 59720 (0.0009) +[2023-10-08 14:09:11,620][102897] Updated weights for policy 0, policy_version 59670 (0.0008) +[2023-10-08 14:09:11,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 122224640. Throughput: 0: 1787.7, 1: 1791.4. Samples: 30571400. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:11,876][101941] Avg episode reward: [(0, '8.280'), (1, '9.170')] +[2023-10-08 14:09:11,955][102898] Updated weights for policy 1, policy_version 59730 (0.0008) +[2023-10-08 14:09:11,993][102897] Updated weights for policy 0, policy_version 59680 (0.0007) +[2023-10-08 14:09:12,325][102898] Updated weights for policy 1, policy_version 59740 (0.0009) +[2023-10-08 14:09:15,813][102897] Updated weights for policy 0, policy_version 59690 (0.0010) +[2023-10-08 14:09:16,181][102897] Updated weights for policy 0, policy_version 59700 (0.0007) +[2023-10-08 14:09:16,185][102898] Updated weights for policy 1, policy_version 59750 (0.0010) +[2023-10-08 14:09:16,543][102897] Updated weights for policy 0, policy_version 59710 (0.0009) +[2023-10-08 14:09:16,548][102898] Updated weights for policy 1, policy_version 59760 (0.0008) +[2023-10-08 14:09:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 122322944. Throughput: 0: 1773.2, 1: 1805.7. Samples: 30591918. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:16,875][101941] Avg episode reward: [(0, '8.280'), (1, '9.210')] +[2023-10-08 14:09:16,923][102898] Updated weights for policy 1, policy_version 59770 (0.0009) +[2023-10-08 14:09:20,371][102897] Updated weights for policy 0, policy_version 59720 (0.0011) +[2023-10-08 14:09:20,734][102897] Updated weights for policy 0, policy_version 59730 (0.0008) +[2023-10-08 14:09:20,911][102898] Updated weights for policy 1, policy_version 59780 (0.0010) +[2023-10-08 14:09:21,110][102897] Updated weights for policy 0, policy_version 59740 (0.0007) +[2023-10-08 14:09:21,273][102898] Updated weights for policy 1, policy_version 59790 (0.0009) +[2023-10-08 14:09:21,645][102898] Updated weights for policy 1, policy_version 59800 (0.0009) +[2023-10-08 14:09:21,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 122388480. Throughput: 0: 1774.3, 1: 1793.5. Samples: 30603194. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:21,875][101941] Avg episode reward: [(0, '7.900'), (1, '8.960')] +[2023-10-08 14:09:24,847][102897] Updated weights for policy 0, policy_version 59750 (0.0007) +[2023-10-08 14:09:25,225][102897] Updated weights for policy 0, policy_version 59760 (0.0009) +[2023-10-08 14:09:25,400][102898] Updated weights for policy 1, policy_version 59810 (0.0008) +[2023-10-08 14:09:25,595][102897] Updated weights for policy 0, policy_version 59770 (0.0007) +[2023-10-08 14:09:25,763][102898] Updated weights for policy 1, policy_version 59820 (0.0008) +[2023-10-08 14:09:26,133][102898] Updated weights for policy 1, policy_version 59830 (0.0008) +[2023-10-08 14:09:26,506][102898] Updated weights for policy 1, policy_version 59840 (0.0009) +[2023-10-08 14:09:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 122486784. Throughput: 0: 1776.9, 1: 1807.6. Samples: 30624744. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:26,876][101941] Avg episode reward: [(0, '7.970'), (1, '8.800')] +[2023-10-08 14:09:29,544][102897] Updated weights for policy 0, policy_version 59780 (0.0007) +[2023-10-08 14:09:29,911][102897] Updated weights for policy 0, policy_version 59790 (0.0009) +[2023-10-08 14:09:30,162][102898] Updated weights for policy 1, policy_version 59850 (0.0008) +[2023-10-08 14:09:30,284][102897] Updated weights for policy 0, policy_version 59800 (0.0008) +[2023-10-08 14:09:30,534][102898] Updated weights for policy 1, policy_version 59860 (0.0007) +[2023-10-08 14:09:30,901][102898] Updated weights for policy 1, policy_version 59870 (0.0008) +[2023-10-08 14:09:31,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 122552320. Throughput: 0: 1761.9, 1: 1786.9. Samples: 30645088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:31,876][101941] Avg episode reward: [(0, '9.130'), (1, '8.580')] +[2023-10-08 14:09:31,883][102634] Saving new best policy, reward=9.130! +[2023-10-08 14:09:34,206][102897] Updated weights for policy 0, policy_version 59810 (0.0009) +[2023-10-08 14:09:34,582][102897] Updated weights for policy 0, policy_version 59820 (0.0008) +[2023-10-08 14:09:34,645][102898] Updated weights for policy 1, policy_version 59880 (0.0008) +[2023-10-08 14:09:34,940][102897] Updated weights for policy 0, policy_version 59830 (0.0007) +[2023-10-08 14:09:35,010][102898] Updated weights for policy 1, policy_version 59890 (0.0009) +[2023-10-08 14:09:35,305][102897] Updated weights for policy 0, policy_version 59840 (0.0007) +[2023-10-08 14:09:35,367][102898] Updated weights for policy 1, policy_version 59900 (0.0008) +[2023-10-08 14:09:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 122617856. Throughput: 0: 1782.5, 1: 1805.5. Samples: 30657152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:36,876][101941] Avg episode reward: [(0, '8.720'), (1, '9.450')] +[2023-10-08 14:09:39,165][102897] Updated weights for policy 0, policy_version 59850 (0.0008) +[2023-10-08 14:09:39,184][102898] Updated weights for policy 1, policy_version 59910 (0.0009) +[2023-10-08 14:09:39,540][102897] Updated weights for policy 0, policy_version 59860 (0.0007) +[2023-10-08 14:09:39,551][102898] Updated weights for policy 1, policy_version 59920 (0.0008) +[2023-10-08 14:09:39,914][102897] Updated weights for policy 0, policy_version 59870 (0.0007) +[2023-10-08 14:09:39,914][102898] Updated weights for policy 1, policy_version 59930 (0.0008) +[2023-10-08 14:09:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 122683392. Throughput: 0: 1761.8, 1: 1781.1. Samples: 30677044. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:41,876][101941] Avg episode reward: [(0, '7.410'), (1, '9.970')] +[2023-10-08 14:09:43,734][102897] Updated weights for policy 0, policy_version 59880 (0.0009) +[2023-10-08 14:09:43,823][102898] Updated weights for policy 1, policy_version 59940 (0.0009) +[2023-10-08 14:09:44,098][102897] Updated weights for policy 0, policy_version 59890 (0.0009) +[2023-10-08 14:09:44,200][102898] Updated weights for policy 1, policy_version 59950 (0.0008) +[2023-10-08 14:09:44,469][102897] Updated weights for policy 0, policy_version 59900 (0.0009) +[2023-10-08 14:09:44,560][102898] Updated weights for policy 1, policy_version 59960 (0.0007) +[2023-10-08 14:09:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 122748928. Throughput: 0: 1762.5, 1: 1777.7. Samples: 30699038. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:46,876][101941] Avg episode reward: [(0, '7.930'), (1, '9.300')] +[2023-10-08 14:09:48,164][102897] Updated weights for policy 0, policy_version 59910 (0.0008) +[2023-10-08 14:09:48,528][102898] Updated weights for policy 1, policy_version 59970 (0.0008) +[2023-10-08 14:09:48,542][102897] Updated weights for policy 0, policy_version 59920 (0.0007) +[2023-10-08 14:09:48,906][102897] Updated weights for policy 0, policy_version 59930 (0.0007) +[2023-10-08 14:09:48,920][102898] Updated weights for policy 1, policy_version 59980 (0.0009) +[2023-10-08 14:09:49,290][102898] Updated weights for policy 1, policy_version 59990 (0.0009) +[2023-10-08 14:09:49,671][102898] Updated weights for policy 1, policy_version 60000 (0.0011) +[2023-10-08 14:09:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 122814464. Throughput: 0: 1760.5, 1: 1781.7. Samples: 30708702. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:51,876][101941] Avg episode reward: [(0, '7.990'), (1, '9.510')] +[2023-10-08 14:09:52,648][102897] Updated weights for policy 0, policy_version 59940 (0.0008) +[2023-10-08 14:09:53,013][102897] Updated weights for policy 0, policy_version 59950 (0.0007) +[2023-10-08 14:09:53,343][102898] Updated weights for policy 1, policy_version 60010 (0.0007) +[2023-10-08 14:09:53,381][102897] Updated weights for policy 0, policy_version 59960 (0.0008) +[2023-10-08 14:09:53,705][102898] Updated weights for policy 1, policy_version 60020 (0.0009) +[2023-10-08 14:09:54,073][102898] Updated weights for policy 1, policy_version 60030 (0.0007) +[2023-10-08 14:09:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 122880000. Throughput: 0: 1766.4, 1: 1769.8. Samples: 30730530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:09:56,876][101941] Avg episode reward: [(0, '7.960'), (1, '10.520')] +[2023-10-08 14:09:56,878][102760] Saving new best policy, reward=10.520! +[2023-10-08 14:09:57,265][102897] Updated weights for policy 0, policy_version 59970 (0.0009) +[2023-10-08 14:09:57,656][102897] Updated weights for policy 0, policy_version 59980 (0.0009) +[2023-10-08 14:09:57,981][102898] Updated weights for policy 1, policy_version 60040 (0.0008) +[2023-10-08 14:09:58,031][102897] Updated weights for policy 0, policy_version 59990 (0.0007) +[2023-10-08 14:09:58,342][102898] Updated weights for policy 1, policy_version 60050 (0.0007) +[2023-10-08 14:09:58,399][102897] Updated weights for policy 0, policy_version 60000 (0.0008) +[2023-10-08 14:09:58,705][102898] Updated weights for policy 1, policy_version 60060 (0.0007) +[2023-10-08 14:10:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 122945536. Throughput: 0: 1790.8, 1: 1780.0. Samples: 30752606. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:01,875][101941] Avg episode reward: [(0, '8.000'), (1, '10.080')] +[2023-10-08 14:10:02,115][102897] Updated weights for policy 0, policy_version 60010 (0.0007) +[2023-10-08 14:10:02,480][102897] Updated weights for policy 0, policy_version 60020 (0.0009) +[2023-10-08 14:10:02,519][102898] Updated weights for policy 1, policy_version 60070 (0.0007) +[2023-10-08 14:10:02,848][102897] Updated weights for policy 0, policy_version 60030 (0.0008) +[2023-10-08 14:10:02,889][102898] Updated weights for policy 1, policy_version 60080 (0.0007) +[2023-10-08 14:10:03,256][102898] Updated weights for policy 1, policy_version 60090 (0.0007) +[2023-10-08 14:10:06,663][102897] Updated weights for policy 0, policy_version 60040 (0.0010) +[2023-10-08 14:10:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 123011072. Throughput: 0: 1767.7, 1: 1767.7. Samples: 30762288. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:06,876][101941] Avg episode reward: [(0, '7.530'), (1, '9.510')] +[2023-10-08 14:10:07,026][102898] Updated weights for policy 1, policy_version 60100 (0.0008) +[2023-10-08 14:10:07,041][102897] Updated weights for policy 0, policy_version 60050 (0.0009) +[2023-10-08 14:10:07,395][102898] Updated weights for policy 1, policy_version 60110 (0.0008) +[2023-10-08 14:10:07,424][102897] Updated weights for policy 0, policy_version 60060 (0.0007) +[2023-10-08 14:10:07,758][102898] Updated weights for policy 1, policy_version 60120 (0.0007) +[2023-10-08 14:10:11,256][102897] Updated weights for policy 0, policy_version 60070 (0.0009) +[2023-10-08 14:10:11,551][102898] Updated weights for policy 1, policy_version 60130 (0.0009) +[2023-10-08 14:10:11,620][102897] Updated weights for policy 0, policy_version 60080 (0.0008) +[2023-10-08 14:10:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 123076608. Throughput: 0: 1780.6, 1: 1769.8. Samples: 30784514. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:11,876][101941] Avg episode reward: [(0, '7.500'), (1, '8.840')] +[2023-10-08 14:10:11,920][102898] Updated weights for policy 1, policy_version 60140 (0.0008) +[2023-10-08 14:10:11,994][102897] Updated weights for policy 0, policy_version 60090 (0.0008) +[2023-10-08 14:10:12,280][102898] Updated weights for policy 1, policy_version 60150 (0.0008) +[2023-10-08 14:10:12,641][102898] Updated weights for policy 1, policy_version 60160 (0.0007) +[2023-10-08 14:10:15,821][102897] Updated weights for policy 0, policy_version 60100 (0.0008) +[2023-10-08 14:10:16,192][102897] Updated weights for policy 0, policy_version 60110 (0.0008) +[2023-10-08 14:10:16,275][102898] Updated weights for policy 1, policy_version 60170 (0.0007) +[2023-10-08 14:10:16,560][102897] Updated weights for policy 0, policy_version 60120 (0.0007) +[2023-10-08 14:10:16,634][102898] Updated weights for policy 1, policy_version 60180 (0.0008) +[2023-10-08 14:10:16,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 123174912. Throughput: 0: 1775.5, 1: 1784.7. Samples: 30805302. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:16,876][101941] Avg episode reward: [(0, '8.210'), (1, '8.960')] +[2023-10-08 14:10:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000060128_61571072.pth... +[2023-10-08 14:10:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000058464_59867136.pth +[2023-10-08 14:10:16,999][102898] Updated weights for policy 1, policy_version 60190 (0.0009) +[2023-10-08 14:10:17,072][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000060192_61636608.pth... +[2023-10-08 14:10:17,100][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000058496_59899904.pth +[2023-10-08 14:10:20,272][102897] Updated weights for policy 0, policy_version 60130 (0.0007) +[2023-10-08 14:10:20,652][102897] Updated weights for policy 0, policy_version 60140 (0.0007) +[2023-10-08 14:10:20,682][102898] Updated weights for policy 1, policy_version 60200 (0.0008) +[2023-10-08 14:10:21,023][102897] Updated weights for policy 0, policy_version 60150 (0.0008) +[2023-10-08 14:10:21,041][102898] Updated weights for policy 1, policy_version 60210 (0.0009) +[2023-10-08 14:10:21,396][102897] Updated weights for policy 0, policy_version 60160 (0.0007) +[2023-10-08 14:10:21,413][102898] Updated weights for policy 1, policy_version 60220 (0.0007) +[2023-10-08 14:10:21,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 123273216. Throughput: 0: 1772.7, 1: 1766.8. Samples: 30816428. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:21,875][101941] Avg episode reward: [(0, '7.990'), (1, '8.670')] +[2023-10-08 14:10:25,268][102897] Updated weights for policy 0, policy_version 60170 (0.0007) +[2023-10-08 14:10:25,319][102898] Updated weights for policy 1, policy_version 60230 (0.0008) +[2023-10-08 14:10:25,638][102897] Updated weights for policy 0, policy_version 60180 (0.0008) +[2023-10-08 14:10:25,682][102898] Updated weights for policy 1, policy_version 60240 (0.0008) +[2023-10-08 14:10:26,008][102897] Updated weights for policy 0, policy_version 60190 (0.0008) +[2023-10-08 14:10:26,059][102898] Updated weights for policy 1, policy_version 60250 (0.0010) +[2023-10-08 14:10:26,875][101941] Fps is (10 sec: 16384.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 123338752. Throughput: 0: 1781.7, 1: 1786.1. Samples: 30837594. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:26,876][101941] Avg episode reward: [(0, '8.950'), (1, '9.400')] +[2023-10-08 14:10:29,812][102897] Updated weights for policy 0, policy_version 60200 (0.0010) +[2023-10-08 14:10:29,940][102898] Updated weights for policy 1, policy_version 60260 (0.0009) +[2023-10-08 14:10:30,172][102897] Updated weights for policy 0, policy_version 60210 (0.0010) +[2023-10-08 14:10:30,302][102898] Updated weights for policy 1, policy_version 60270 (0.0008) +[2023-10-08 14:10:30,544][102897] Updated weights for policy 0, policy_version 60220 (0.0008) +[2023-10-08 14:10:30,673][102898] Updated weights for policy 1, policy_version 60280 (0.0008) +[2023-10-08 14:10:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 123404288. Throughput: 0: 1761.2, 1: 1763.8. Samples: 30857662. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:31,876][101941] Avg episode reward: [(0, '8.920'), (1, '8.740')] +[2023-10-08 14:10:34,379][102897] Updated weights for policy 0, policy_version 60230 (0.0009) +[2023-10-08 14:10:34,547][102898] Updated weights for policy 1, policy_version 60290 (0.0008) +[2023-10-08 14:10:34,748][102897] Updated weights for policy 0, policy_version 60240 (0.0007) +[2023-10-08 14:10:34,943][102898] Updated weights for policy 1, policy_version 60300 (0.0009) +[2023-10-08 14:10:35,120][102897] Updated weights for policy 0, policy_version 60250 (0.0008) +[2023-10-08 14:10:35,309][102898] Updated weights for policy 1, policy_version 60310 (0.0009) +[2023-10-08 14:10:35,678][102898] Updated weights for policy 1, policy_version 60320 (0.0010) +[2023-10-08 14:10:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 123469824. Throughput: 0: 1786.8, 1: 1790.4. Samples: 30869674. Policy #0 lag: (min: 31.0, avg: 31.2, max: 42.0) +[2023-10-08 14:10:36,875][101941] Avg episode reward: [(0, '8.470'), (1, '8.860')] +[2023-10-08 14:10:38,850][102897] Updated weights for policy 0, policy_version 60260 (0.0009) +[2023-10-08 14:10:39,214][102897] Updated weights for policy 0, policy_version 60270 (0.0009) +[2023-10-08 14:10:39,454][102898] Updated weights for policy 1, policy_version 60330 (0.0007) +[2023-10-08 14:10:39,582][102897] Updated weights for policy 0, policy_version 60280 (0.0009) +[2023-10-08 14:10:39,818][102898] Updated weights for policy 1, policy_version 60340 (0.0008) +[2023-10-08 14:10:40,187][102898] Updated weights for policy 1, policy_version 60350 (0.0009) +[2023-10-08 14:10:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 123535360. Throughput: 0: 1763.6, 1: 1770.0. Samples: 30889538. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:10:41,876][101941] Avg episode reward: [(0, '7.620'), (1, '9.020')] +[2023-10-08 14:10:43,321][102897] Updated weights for policy 0, policy_version 60290 (0.0009) +[2023-10-08 14:10:43,713][102897] Updated weights for policy 0, policy_version 60300 (0.0009) +[2023-10-08 14:10:43,822][102898] Updated weights for policy 1, policy_version 60360 (0.0008) +[2023-10-08 14:10:44,082][102897] Updated weights for policy 0, policy_version 60310 (0.0008) +[2023-10-08 14:10:44,183][102898] Updated weights for policy 1, policy_version 60370 (0.0008) +[2023-10-08 14:10:44,450][102897] Updated weights for policy 0, policy_version 60320 (0.0008) +[2023-10-08 14:10:44,552][102898] Updated weights for policy 1, policy_version 60380 (0.0007) +[2023-10-08 14:10:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 123600896. Throughput: 0: 1765.7, 1: 1770.9. Samples: 30911756. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:10:46,876][101941] Avg episode reward: [(0, '7.730'), (1, '8.640')] +[2023-10-08 14:10:48,189][102897] Updated weights for policy 0, policy_version 60330 (0.0009) +[2023-10-08 14:10:48,437][102898] Updated weights for policy 1, policy_version 60390 (0.0007) +[2023-10-08 14:10:48,572][102897] Updated weights for policy 0, policy_version 60340 (0.0009) +[2023-10-08 14:10:48,808][102898] Updated weights for policy 1, policy_version 60400 (0.0008) +[2023-10-08 14:10:48,937][102897] Updated weights for policy 0, policy_version 60350 (0.0007) +[2023-10-08 14:10:49,166][102898] Updated weights for policy 1, policy_version 60410 (0.0008) +[2023-10-08 14:10:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 123666432. Throughput: 0: 1767.5, 1: 1771.6. Samples: 30921550. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:10:51,876][101941] Avg episode reward: [(0, '7.930'), (1, '8.510')] +[2023-10-08 14:10:52,690][102897] Updated weights for policy 0, policy_version 60360 (0.0008) +[2023-10-08 14:10:52,983][102898] Updated weights for policy 1, policy_version 60420 (0.0008) +[2023-10-08 14:10:53,057][102897] Updated weights for policy 0, policy_version 60370 (0.0008) +[2023-10-08 14:10:53,338][102898] Updated weights for policy 1, policy_version 60430 (0.0007) +[2023-10-08 14:10:53,427][102897] Updated weights for policy 0, policy_version 60380 (0.0007) +[2023-10-08 14:10:53,701][102898] Updated weights for policy 1, policy_version 60440 (0.0007) +[2023-10-08 14:10:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 123731968. Throughput: 0: 1770.6, 1: 1771.1. Samples: 30943890. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:10:56,876][101941] Avg episode reward: [(0, '8.620'), (1, '8.960')] +[2023-10-08 14:10:57,253][102897] Updated weights for policy 0, policy_version 60390 (0.0008) +[2023-10-08 14:10:57,560][102898] Updated weights for policy 1, policy_version 60450 (0.0007) +[2023-10-08 14:10:57,630][102897] Updated weights for policy 0, policy_version 60400 (0.0007) +[2023-10-08 14:10:57,933][102898] Updated weights for policy 1, policy_version 60460 (0.0009) +[2023-10-08 14:10:57,997][102897] Updated weights for policy 0, policy_version 60410 (0.0007) +[2023-10-08 14:10:58,295][102898] Updated weights for policy 1, policy_version 60470 (0.0007) +[2023-10-08 14:10:58,656][102898] Updated weights for policy 1, policy_version 60480 (0.0007) +[2023-10-08 14:11:01,851][102897] Updated weights for policy 0, policy_version 60420 (0.0008) +[2023-10-08 14:11:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 123797504. Throughput: 0: 1787.4, 1: 1784.4. Samples: 30966032. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:11:01,875][101941] Avg episode reward: [(0, '7.760'), (1, '8.750')] +[2023-10-08 14:11:02,225][102897] Updated weights for policy 0, policy_version 60430 (0.0009) +[2023-10-08 14:11:02,338][102898] Updated weights for policy 1, policy_version 60490 (0.0007) +[2023-10-08 14:11:02,598][102897] Updated weights for policy 0, policy_version 60440 (0.0008) +[2023-10-08 14:11:02,708][102898] Updated weights for policy 1, policy_version 60500 (0.0010) +[2023-10-08 14:11:03,072][102898] Updated weights for policy 1, policy_version 60510 (0.0007) +[2023-10-08 14:11:06,347][102897] Updated weights for policy 0, policy_version 60450 (0.0008) +[2023-10-08 14:11:06,717][102897] Updated weights for policy 0, policy_version 60460 (0.0009) +[2023-10-08 14:11:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 123863040. Throughput: 0: 1765.0, 1: 1773.6. Samples: 30975666. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:11:06,876][101941] Avg episode reward: [(0, '8.280'), (1, '9.500')] +[2023-10-08 14:11:06,878][102898] Updated weights for policy 1, policy_version 60520 (0.0007) +[2023-10-08 14:11:07,079][102897] Updated weights for policy 0, policy_version 60470 (0.0007) +[2023-10-08 14:11:07,245][102898] Updated weights for policy 1, policy_version 60530 (0.0009) +[2023-10-08 14:11:07,447][102897] Updated weights for policy 0, policy_version 60480 (0.0007) +[2023-10-08 14:11:07,601][102898] Updated weights for policy 1, policy_version 60540 (0.0009) +[2023-10-08 14:11:11,441][102898] Updated weights for policy 1, policy_version 60550 (0.0008) +[2023-10-08 14:11:11,495][102897] Updated weights for policy 0, policy_version 60490 (0.0007) +[2023-10-08 14:11:11,806][102898] Updated weights for policy 1, policy_version 60560 (0.0008) +[2023-10-08 14:11:11,855][102897] Updated weights for policy 0, policy_version 60500 (0.0009) +[2023-10-08 14:11:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 123928576. Throughput: 0: 1773.9, 1: 1780.9. Samples: 30997562. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:11:11,876][101941] Avg episode reward: [(0, '8.410'), (1, '8.360')] +[2023-10-08 14:11:12,165][102898] Updated weights for policy 1, policy_version 60570 (0.0008) +[2023-10-08 14:11:12,230][102897] Updated weights for policy 0, policy_version 60510 (0.0007) +[2023-10-08 14:11:15,970][102898] Updated weights for policy 1, policy_version 60580 (0.0009) +[2023-10-08 14:11:15,975][102897] Updated weights for policy 0, policy_version 60520 (0.0007) +[2023-10-08 14:11:16,333][102897] Updated weights for policy 0, policy_version 60530 (0.0008) +[2023-10-08 14:11:16,336][102898] Updated weights for policy 1, policy_version 60590 (0.0008) +[2023-10-08 14:11:16,704][102897] Updated weights for policy 0, policy_version 60540 (0.0009) +[2023-10-08 14:11:16,707][102898] Updated weights for policy 1, policy_version 60600 (0.0008) +[2023-10-08 14:11:16,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 124026880. Throughput: 0: 1774.4, 1: 1787.3. Samples: 31017936. Policy #0 lag: (min: 28.0, avg: 35.5, max: 60.0) +[2023-10-08 14:11:16,875][101941] Avg episode reward: [(0, '6.950'), (1, '7.930')] +[2023-10-08 14:11:20,493][102897] Updated weights for policy 0, policy_version 60550 (0.0008) +[2023-10-08 14:11:20,536][102898] Updated weights for policy 1, policy_version 60610 (0.0009) +[2023-10-08 14:11:20,865][102897] Updated weights for policy 0, policy_version 60560 (0.0008) +[2023-10-08 14:11:20,943][102898] Updated weights for policy 1, policy_version 60620 (0.0007) +[2023-10-08 14:11:21,239][102897] Updated weights for policy 0, policy_version 60570 (0.0007) +[2023-10-08 14:11:21,307][102898] Updated weights for policy 1, policy_version 60630 (0.0008) +[2023-10-08 14:11:21,673][102898] Updated weights for policy 1, policy_version 60640 (0.0007) +[2023-10-08 14:11:21,875][101941] Fps is (10 sec: 19660.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 124125184. Throughput: 0: 1768.3, 1: 1776.3. Samples: 31029180. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:21,876][101941] Avg episode reward: [(0, '7.500'), (1, '9.610')] +[2023-10-08 14:11:24,993][102897] Updated weights for policy 0, policy_version 60580 (0.0007) +[2023-10-08 14:11:25,361][102897] Updated weights for policy 0, policy_version 60590 (0.0010) +[2023-10-08 14:11:25,394][102898] Updated weights for policy 1, policy_version 60650 (0.0008) +[2023-10-08 14:11:25,735][102897] Updated weights for policy 0, policy_version 60600 (0.0010) +[2023-10-08 14:11:25,757][102898] Updated weights for policy 1, policy_version 60660 (0.0008) +[2023-10-08 14:11:26,131][102898] Updated weights for policy 1, policy_version 60670 (0.0009) +[2023-10-08 14:11:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 124190720. Throughput: 0: 1778.4, 1: 1791.4. Samples: 31050176. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:26,876][101941] Avg episode reward: [(0, '8.220'), (1, '10.620')] +[2023-10-08 14:11:26,877][102760] Saving new best policy, reward=10.620! +[2023-10-08 14:11:29,629][102897] Updated weights for policy 0, policy_version 60610 (0.0009) +[2023-10-08 14:11:29,732][102898] Updated weights for policy 1, policy_version 60680 (0.0009) +[2023-10-08 14:11:30,034][102897] Updated weights for policy 0, policy_version 60620 (0.0010) +[2023-10-08 14:11:30,098][102898] Updated weights for policy 1, policy_version 60690 (0.0009) +[2023-10-08 14:11:30,401][102897] Updated weights for policy 0, policy_version 60630 (0.0007) +[2023-10-08 14:11:30,473][102898] Updated weights for policy 1, policy_version 60700 (0.0010) +[2023-10-08 14:11:30,772][102897] Updated weights for policy 0, policy_version 60640 (0.0008) +[2023-10-08 14:11:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 124256256. Throughput: 0: 1756.9, 1: 1774.1. Samples: 31070650. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:31,875][101941] Avg episode reward: [(0, '8.070'), (1, '9.770')] +[2023-10-08 14:11:34,264][102898] Updated weights for policy 1, policy_version 60710 (0.0008) +[2023-10-08 14:11:34,444][102897] Updated weights for policy 0, policy_version 60650 (0.0009) +[2023-10-08 14:11:34,624][102898] Updated weights for policy 1, policy_version 60720 (0.0009) +[2023-10-08 14:11:34,817][102897] Updated weights for policy 0, policy_version 60660 (0.0009) +[2023-10-08 14:11:34,989][102898] Updated weights for policy 1, policy_version 60730 (0.0009) +[2023-10-08 14:11:35,186][102897] Updated weights for policy 0, policy_version 60670 (0.0009) +[2023-10-08 14:11:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 124321792. Throughput: 0: 1785.7, 1: 1793.3. Samples: 31082604. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:36,876][101941] Avg episode reward: [(0, '8.650'), (1, '10.000')] +[2023-10-08 14:11:38,866][102898] Updated weights for policy 1, policy_version 60740 (0.0008) +[2023-10-08 14:11:39,087][102897] Updated weights for policy 0, policy_version 60680 (0.0008) +[2023-10-08 14:11:39,229][102898] Updated weights for policy 1, policy_version 60750 (0.0007) +[2023-10-08 14:11:39,445][102897] Updated weights for policy 0, policy_version 60690 (0.0007) +[2023-10-08 14:11:39,597][102898] Updated weights for policy 1, policy_version 60760 (0.0007) +[2023-10-08 14:11:39,812][102897] Updated weights for policy 0, policy_version 60700 (0.0007) +[2023-10-08 14:11:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 124387328. Throughput: 0: 1754.8, 1: 1774.7. Samples: 31102714. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:41,875][101941] Avg episode reward: [(0, '8.310'), (1, '9.550')] +[2023-10-08 14:11:43,437][102898] Updated weights for policy 1, policy_version 60770 (0.0008) +[2023-10-08 14:11:43,639][102897] Updated weights for policy 0, policy_version 60710 (0.0007) +[2023-10-08 14:11:43,805][102898] Updated weights for policy 1, policy_version 60780 (0.0008) +[2023-10-08 14:11:44,005][102897] Updated weights for policy 0, policy_version 60720 (0.0008) +[2023-10-08 14:11:44,177][102898] Updated weights for policy 1, policy_version 60790 (0.0009) +[2023-10-08 14:11:44,370][102897] Updated weights for policy 0, policy_version 60730 (0.0008) +[2023-10-08 14:11:44,544][102898] Updated weights for policy 1, policy_version 60800 (0.0008) +[2023-10-08 14:11:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 124452864. Throughput: 0: 1758.1, 1: 1774.9. Samples: 31125020. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:46,875][101941] Avg episode reward: [(0, '8.540'), (1, '9.800')] +[2023-10-08 14:11:48,222][102897] Updated weights for policy 0, policy_version 60740 (0.0009) +[2023-10-08 14:11:48,407][102898] Updated weights for policy 1, policy_version 60810 (0.0009) +[2023-10-08 14:11:48,587][102897] Updated weights for policy 0, policy_version 60750 (0.0008) +[2023-10-08 14:11:48,773][102898] Updated weights for policy 1, policy_version 60820 (0.0007) +[2023-10-08 14:11:48,954][102897] Updated weights for policy 0, policy_version 60760 (0.0009) +[2023-10-08 14:11:49,143][102898] Updated weights for policy 1, policy_version 60830 (0.0009) +[2023-10-08 14:11:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 124518400. Throughput: 0: 1760.6, 1: 1771.8. Samples: 31134624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:51,876][101941] Avg episode reward: [(0, '8.570'), (1, '9.780')] +[2023-10-08 14:11:52,619][102897] Updated weights for policy 0, policy_version 60770 (0.0009) +[2023-10-08 14:11:52,993][102897] Updated weights for policy 0, policy_version 60780 (0.0007) +[2023-10-08 14:11:53,071][102898] Updated weights for policy 1, policy_version 60840 (0.0008) +[2023-10-08 14:11:53,372][102897] Updated weights for policy 0, policy_version 60790 (0.0008) +[2023-10-08 14:11:53,443][102898] Updated weights for policy 1, policy_version 60850 (0.0008) +[2023-10-08 14:11:53,738][102897] Updated weights for policy 0, policy_version 60800 (0.0009) +[2023-10-08 14:11:53,803][102898] Updated weights for policy 1, policy_version 60860 (0.0008) +[2023-10-08 14:11:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 124583936. Throughput: 0: 1765.3, 1: 1767.7. Samples: 31156548. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:11:56,876][101941] Avg episode reward: [(0, '7.510'), (1, '9.920')] +[2023-10-08 14:11:57,528][102898] Updated weights for policy 1, policy_version 60870 (0.0007) +[2023-10-08 14:11:57,533][102897] Updated weights for policy 0, policy_version 60810 (0.0009) +[2023-10-08 14:11:57,896][102898] Updated weights for policy 1, policy_version 60880 (0.0007) +[2023-10-08 14:11:57,898][102897] Updated weights for policy 0, policy_version 60820 (0.0009) +[2023-10-08 14:11:58,263][102898] Updated weights for policy 1, policy_version 60890 (0.0007) +[2023-10-08 14:11:58,269][102897] Updated weights for policy 0, policy_version 60830 (0.0010) +[2023-10-08 14:12:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 124649472. Throughput: 0: 1784.1, 1: 1787.3. Samples: 31178650. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:01,876][101941] Avg episode reward: [(0, '7.680'), (1, '10.520')] +[2023-10-08 14:12:01,950][102898] Updated weights for policy 1, policy_version 60900 (0.0008) +[2023-10-08 14:12:02,153][102897] Updated weights for policy 0, policy_version 60840 (0.0008) +[2023-10-08 14:12:02,321][102898] Updated weights for policy 1, policy_version 60910 (0.0008) +[2023-10-08 14:12:02,528][102897] Updated weights for policy 0, policy_version 60850 (0.0007) +[2023-10-08 14:12:02,693][102898] Updated weights for policy 1, policy_version 60920 (0.0008) +[2023-10-08 14:12:02,906][102897] Updated weights for policy 0, policy_version 60860 (0.0007) +[2023-10-08 14:12:06,630][102898] Updated weights for policy 1, policy_version 60930 (0.0008) +[2023-10-08 14:12:06,748][102897] Updated weights for policy 0, policy_version 60870 (0.0008) +[2023-10-08 14:12:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 124715008. Throughput: 0: 1763.7, 1: 1771.8. Samples: 31188280. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:06,876][101941] Avg episode reward: [(0, '7.700'), (1, '9.450')] +[2023-10-08 14:12:07,039][102898] Updated weights for policy 1, policy_version 60940 (0.0007) +[2023-10-08 14:12:07,110][102897] Updated weights for policy 0, policy_version 60880 (0.0008) +[2023-10-08 14:12:07,402][102898] Updated weights for policy 1, policy_version 60950 (0.0007) +[2023-10-08 14:12:07,490][102897] Updated weights for policy 0, policy_version 60890 (0.0008) +[2023-10-08 14:12:07,774][102898] Updated weights for policy 1, policy_version 60960 (0.0009) +[2023-10-08 14:12:11,312][102897] Updated weights for policy 0, policy_version 60900 (0.0008) +[2023-10-08 14:12:11,456][102898] Updated weights for policy 1, policy_version 60970 (0.0009) +[2023-10-08 14:12:11,693][102897] Updated weights for policy 0, policy_version 60910 (0.0009) +[2023-10-08 14:12:11,820][102898] Updated weights for policy 1, policy_version 60980 (0.0007) +[2023-10-08 14:12:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 124780544. Throughput: 0: 1772.6, 1: 1780.6. Samples: 31210068. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:11,876][101941] Avg episode reward: [(0, '7.500'), (1, '9.180')] +[2023-10-08 14:12:12,054][102897] Updated weights for policy 0, policy_version 60920 (0.0010) +[2023-10-08 14:12:12,187][102898] Updated weights for policy 1, policy_version 60990 (0.0007) +[2023-10-08 14:12:15,859][102897] Updated weights for policy 0, policy_version 60930 (0.0009) +[2023-10-08 14:12:16,154][102898] Updated weights for policy 1, policy_version 61000 (0.0008) +[2023-10-08 14:12:16,266][102897] Updated weights for policy 0, policy_version 60940 (0.0007) +[2023-10-08 14:12:16,517][102898] Updated weights for policy 1, policy_version 61010 (0.0008) +[2023-10-08 14:12:16,628][102897] Updated weights for policy 0, policy_version 60950 (0.0007) +[2023-10-08 14:12:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 14106.9). Total num frames: 124846080. Throughput: 0: 1779.4, 1: 1780.4. Samples: 31230842. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:16,875][101941] Avg episode reward: [(0, '7.520'), (1, '8.610')] +[2023-10-08 14:12:16,880][102898] Updated weights for policy 1, policy_version 61020 (0.0009) +[2023-10-08 14:12:16,997][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000060960_62423040.pth... +[2023-10-08 14:12:17,000][102897] Updated weights for policy 0, policy_version 60960 (0.0007) +[2023-10-08 14:12:17,026][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000059296_60719104.pth +[2023-10-08 14:12:17,027][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000061024_62488576.pth... +[2023-10-08 14:12:17,055][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000059360_60784640.pth +[2023-10-08 14:12:20,770][102898] Updated weights for policy 1, policy_version 61030 (0.0008) +[2023-10-08 14:12:20,780][102897] Updated weights for policy 0, policy_version 60970 (0.0010) +[2023-10-08 14:12:21,131][102898] Updated weights for policy 1, policy_version 61040 (0.0008) +[2023-10-08 14:12:21,148][102897] Updated weights for policy 0, policy_version 60980 (0.0008) +[2023-10-08 14:12:21,497][102898] Updated weights for policy 1, policy_version 61050 (0.0007) +[2023-10-08 14:12:21,527][102897] Updated weights for policy 0, policy_version 60990 (0.0008) +[2023-10-08 14:12:21,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 124977152. Throughput: 0: 1767.1, 1: 1774.2. Samples: 31241964. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:21,876][101941] Avg episode reward: [(0, '8.540'), (1, '7.880')] +[2023-10-08 14:12:25,321][102898] Updated weights for policy 1, policy_version 61060 (0.0008) +[2023-10-08 14:12:25,326][102897] Updated weights for policy 0, policy_version 61000 (0.0009) +[2023-10-08 14:12:25,683][102898] Updated weights for policy 1, policy_version 61070 (0.0008) +[2023-10-08 14:12:25,693][102897] Updated weights for policy 0, policy_version 61010 (0.0008) +[2023-10-08 14:12:26,044][102898] Updated weights for policy 1, policy_version 61080 (0.0007) +[2023-10-08 14:12:26,071][102897] Updated weights for policy 0, policy_version 61020 (0.0008) +[2023-10-08 14:12:26,875][101941] Fps is (10 sec: 19660.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 125042688. Throughput: 0: 1784.3, 1: 1783.5. Samples: 31263264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:26,876][101941] Avg episode reward: [(0, '8.210'), (1, '7.870')] +[2023-10-08 14:12:29,682][102898] Updated weights for policy 1, policy_version 61090 (0.0007) +[2023-10-08 14:12:29,899][102897] Updated weights for policy 0, policy_version 61030 (0.0007) +[2023-10-08 14:12:30,050][102898] Updated weights for policy 1, policy_version 61100 (0.0007) +[2023-10-08 14:12:30,272][102897] Updated weights for policy 0, policy_version 61040 (0.0009) +[2023-10-08 14:12:30,414][102898] Updated weights for policy 1, policy_version 61110 (0.0008) +[2023-10-08 14:12:30,631][102897] Updated weights for policy 0, policy_version 61050 (0.0008) +[2023-10-08 14:12:30,772][102898] Updated weights for policy 1, policy_version 61120 (0.0010) +[2023-10-08 14:12:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 125108224. Throughput: 0: 1760.4, 1: 1757.1. Samples: 31283310. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:31,876][101941] Avg episode reward: [(0, '8.110'), (1, '8.210')] +[2023-10-08 14:12:34,576][102897] Updated weights for policy 0, policy_version 61060 (0.0008) +[2023-10-08 14:12:34,689][102898] Updated weights for policy 1, policy_version 61130 (0.0009) +[2023-10-08 14:12:34,934][102897] Updated weights for policy 0, policy_version 61070 (0.0008) +[2023-10-08 14:12:35,055][102898] Updated weights for policy 1, policy_version 61140 (0.0009) +[2023-10-08 14:12:35,300][102897] Updated weights for policy 0, policy_version 61080 (0.0008) +[2023-10-08 14:12:35,418][102898] Updated weights for policy 1, policy_version 61150 (0.0008) +[2023-10-08 14:12:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125173760. Throughput: 0: 1791.1, 1: 1781.3. Samples: 31295384. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:36,876][101941] Avg episode reward: [(0, '8.240'), (1, '9.270')] +[2023-10-08 14:12:39,240][102897] Updated weights for policy 0, policy_version 61090 (0.0008) +[2023-10-08 14:12:39,412][102898] Updated weights for policy 1, policy_version 61160 (0.0007) +[2023-10-08 14:12:39,606][102897] Updated weights for policy 0, policy_version 61100 (0.0008) +[2023-10-08 14:12:39,777][102898] Updated weights for policy 1, policy_version 61170 (0.0009) +[2023-10-08 14:12:39,984][102897] Updated weights for policy 0, policy_version 61110 (0.0009) +[2023-10-08 14:12:40,144][102898] Updated weights for policy 1, policy_version 61180 (0.0007) +[2023-10-08 14:12:40,351][102897] Updated weights for policy 0, policy_version 61120 (0.0007) +[2023-10-08 14:12:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 125239296. Throughput: 0: 1752.1, 1: 1760.4. Samples: 31314608. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:12:41,876][101941] Avg episode reward: [(0, '7.560'), (1, '9.490')] +[2023-10-08 14:12:43,789][102898] Updated weights for policy 1, policy_version 61190 (0.0008) +[2023-10-08 14:12:44,050][102897] Updated weights for policy 0, policy_version 61130 (0.0007) +[2023-10-08 14:12:44,165][102898] Updated weights for policy 1, policy_version 61200 (0.0010) +[2023-10-08 14:12:44,418][102897] Updated weights for policy 0, policy_version 61140 (0.0008) +[2023-10-08 14:12:44,538][102898] Updated weights for policy 1, policy_version 61210 (0.0009) +[2023-10-08 14:12:44,789][102897] Updated weights for policy 0, policy_version 61150 (0.0008) +[2023-10-08 14:12:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125304832. Throughput: 0: 1758.1, 1: 1757.0. Samples: 31336828. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:12:46,875][101941] Avg episode reward: [(0, '8.220'), (1, '8.820')] +[2023-10-08 14:12:48,264][102898] Updated weights for policy 1, policy_version 61220 (0.0008) +[2023-10-08 14:12:48,531][102897] Updated weights for policy 0, policy_version 61160 (0.0008) +[2023-10-08 14:12:48,636][102898] Updated weights for policy 1, policy_version 61230 (0.0007) +[2023-10-08 14:12:48,905][102897] Updated weights for policy 0, policy_version 61170 (0.0007) +[2023-10-08 14:12:48,995][102898] Updated weights for policy 1, policy_version 61240 (0.0008) +[2023-10-08 14:12:49,272][102897] Updated weights for policy 0, policy_version 61180 (0.0008) +[2023-10-08 14:12:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125370368. Throughput: 0: 1761.9, 1: 1756.8. Samples: 31346620. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:12:51,876][101941] Avg episode reward: [(0, '8.880'), (1, '8.590')] +[2023-10-08 14:12:52,859][102898] Updated weights for policy 1, policy_version 61250 (0.0008) +[2023-10-08 14:12:53,129][102897] Updated weights for policy 0, policy_version 61190 (0.0009) +[2023-10-08 14:12:53,211][102898] Updated weights for policy 1, policy_version 61260 (0.0007) +[2023-10-08 14:12:53,505][102897] Updated weights for policy 0, policy_version 61200 (0.0009) +[2023-10-08 14:12:53,580][102898] Updated weights for policy 1, policy_version 61270 (0.0009) +[2023-10-08 14:12:53,876][102897] Updated weights for policy 0, policy_version 61210 (0.0009) +[2023-10-08 14:12:53,941][102898] Updated weights for policy 1, policy_version 61280 (0.0009) +[2023-10-08 14:12:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125435904. Throughput: 0: 1762.9, 1: 1761.2. Samples: 31368650. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:12:56,876][101941] Avg episode reward: [(0, '9.040'), (1, '9.590')] +[2023-10-08 14:12:57,743][102897] Updated weights for policy 0, policy_version 61220 (0.0009) +[2023-10-08 14:12:57,803][102898] Updated weights for policy 1, policy_version 61290 (0.0007) +[2023-10-08 14:12:58,110][102897] Updated weights for policy 0, policy_version 61230 (0.0009) +[2023-10-08 14:12:58,176][102898] Updated weights for policy 1, policy_version 61300 (0.0009) +[2023-10-08 14:12:58,480][102897] Updated weights for policy 0, policy_version 61240 (0.0009) +[2023-10-08 14:12:58,537][102898] Updated weights for policy 1, policy_version 61310 (0.0007) +[2023-10-08 14:13:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125501440. Throughput: 0: 1775.2, 1: 1773.3. Samples: 31390526. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:13:01,876][101941] Avg episode reward: [(0, '8.510'), (1, '9.300')] +[2023-10-08 14:13:02,270][102897] Updated weights for policy 0, policy_version 61250 (0.0009) +[2023-10-08 14:13:02,315][102898] Updated weights for policy 1, policy_version 61320 (0.0007) +[2023-10-08 14:13:02,666][102897] Updated weights for policy 0, policy_version 61260 (0.0008) +[2023-10-08 14:13:02,679][102898] Updated weights for policy 1, policy_version 61330 (0.0008) +[2023-10-08 14:13:03,031][102897] Updated weights for policy 0, policy_version 61270 (0.0007) +[2023-10-08 14:13:03,039][102898] Updated weights for policy 1, policy_version 61340 (0.0007) +[2023-10-08 14:13:03,405][102897] Updated weights for policy 0, policy_version 61280 (0.0008) +[2023-10-08 14:13:06,863][102898] Updated weights for policy 1, policy_version 61350 (0.0007) +[2023-10-08 14:13:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125566976. Throughput: 0: 1751.3, 1: 1760.5. Samples: 31399996. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:13:06,876][101941] Avg episode reward: [(0, '7.640'), (1, '8.970')] +[2023-10-08 14:13:07,220][102898] Updated weights for policy 1, policy_version 61360 (0.0007) +[2023-10-08 14:13:07,332][102897] Updated weights for policy 0, policy_version 61290 (0.0008) +[2023-10-08 14:13:07,588][102898] Updated weights for policy 1, policy_version 61370 (0.0009) +[2023-10-08 14:13:07,712][102897] Updated weights for policy 0, policy_version 61300 (0.0007) +[2023-10-08 14:13:08,070][102897] Updated weights for policy 0, policy_version 61310 (0.0008) +[2023-10-08 14:13:11,471][102898] Updated weights for policy 1, policy_version 61380 (0.0007) +[2023-10-08 14:13:11,840][102898] Updated weights for policy 1, policy_version 61390 (0.0009) +[2023-10-08 14:13:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 125632512. Throughput: 0: 1757.8, 1: 1763.7. Samples: 31421728. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:13:11,876][101941] Avg episode reward: [(0, '7.380'), (1, '9.130')] +[2023-10-08 14:13:11,911][102897] Updated weights for policy 0, policy_version 61320 (0.0008) +[2023-10-08 14:13:12,201][102898] Updated weights for policy 1, policy_version 61400 (0.0008) +[2023-10-08 14:13:12,279][102897] Updated weights for policy 0, policy_version 61330 (0.0009) +[2023-10-08 14:13:12,660][102897] Updated weights for policy 0, policy_version 61340 (0.0009) +[2023-10-08 14:13:15,942][102898] Updated weights for policy 1, policy_version 61410 (0.0009) +[2023-10-08 14:13:16,313][102898] Updated weights for policy 1, policy_version 61420 (0.0009) +[2023-10-08 14:13:16,448][102897] Updated weights for policy 0, policy_version 61350 (0.0008) +[2023-10-08 14:13:16,676][102898] Updated weights for policy 1, policy_version 61430 (0.0008) +[2023-10-08 14:13:16,821][102897] Updated weights for policy 0, policy_version 61360 (0.0007) +[2023-10-08 14:13:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 125698048. Throughput: 0: 1780.6, 1: 1775.9. Samples: 31443352. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:13:16,876][101941] Avg episode reward: [(0, '7.710'), (1, '8.740')] +[2023-10-08 14:13:17,038][102898] Updated weights for policy 1, policy_version 61440 (0.0008) +[2023-10-08 14:13:17,191][102897] Updated weights for policy 0, policy_version 61370 (0.0007) +[2023-10-08 14:13:20,927][102898] Updated weights for policy 1, policy_version 61450 (0.0009) +[2023-10-08 14:13:21,016][102897] Updated weights for policy 0, policy_version 61380 (0.0007) +[2023-10-08 14:13:21,293][102898] Updated weights for policy 1, policy_version 61460 (0.0007) +[2023-10-08 14:13:21,388][102897] Updated weights for policy 0, policy_version 61390 (0.0008) +[2023-10-08 14:13:21,665][102898] Updated weights for policy 1, policy_version 61470 (0.0008) +[2023-10-08 14:13:21,744][102897] Updated weights for policy 0, policy_version 61400 (0.0009) +[2023-10-08 14:13:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 125796352. Throughput: 0: 1754.3, 1: 1766.0. Samples: 31453794. Policy #0 lag: (min: 29.0, avg: 29.0, max: 29.0) +[2023-10-08 14:13:21,876][101941] Avg episode reward: [(0, '8.200'), (1, '7.770')] +[2023-10-08 14:13:25,531][102897] Updated weights for policy 0, policy_version 61410 (0.0008) +[2023-10-08 14:13:25,614][102898] Updated weights for policy 1, policy_version 61480 (0.0008) +[2023-10-08 14:13:25,900][102897] Updated weights for policy 0, policy_version 61420 (0.0008) +[2023-10-08 14:13:25,979][102898] Updated weights for policy 1, policy_version 61490 (0.0007) +[2023-10-08 14:13:26,272][102897] Updated weights for policy 0, policy_version 61430 (0.0007) +[2023-10-08 14:13:26,354][102898] Updated weights for policy 1, policy_version 61500 (0.0009) +[2023-10-08 14:13:26,637][102897] Updated weights for policy 0, policy_version 61440 (0.0008) +[2023-10-08 14:13:26,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125894656. Throughput: 0: 1799.5, 1: 1789.3. Samples: 31476106. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:26,876][101941] Avg episode reward: [(0, '8.570'), (1, '7.760')] +[2023-10-08 14:13:29,888][102898] Updated weights for policy 1, policy_version 61510 (0.0009) +[2023-10-08 14:13:30,253][102898] Updated weights for policy 1, policy_version 61520 (0.0008) +[2023-10-08 14:13:30,372][102897] Updated weights for policy 0, policy_version 61450 (0.0009) +[2023-10-08 14:13:30,622][102898] Updated weights for policy 1, policy_version 61530 (0.0008) +[2023-10-08 14:13:30,741][102897] Updated weights for policy 0, policy_version 61460 (0.0007) +[2023-10-08 14:13:31,120][102897] Updated weights for policy 0, policy_version 61470 (0.0010) +[2023-10-08 14:13:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 125960192. Throughput: 0: 1765.9, 1: 1773.9. Samples: 31496120. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:31,876][101941] Avg episode reward: [(0, '8.830'), (1, '7.330')] +[2023-10-08 14:13:34,518][102898] Updated weights for policy 1, policy_version 61540 (0.0009) +[2023-10-08 14:13:34,889][102898] Updated weights for policy 1, policy_version 61550 (0.0007) +[2023-10-08 14:13:35,004][102897] Updated weights for policy 0, policy_version 61480 (0.0008) +[2023-10-08 14:13:35,250][102898] Updated weights for policy 1, policy_version 61560 (0.0007) +[2023-10-08 14:13:35,379][102897] Updated weights for policy 0, policy_version 61490 (0.0008) +[2023-10-08 14:13:35,742][102897] Updated weights for policy 0, policy_version 61500 (0.0008) +[2023-10-08 14:13:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126025728. Throughput: 0: 1795.4, 1: 1799.0. Samples: 31508368. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:36,876][101941] Avg episode reward: [(0, '8.550'), (1, '7.020')] +[2023-10-08 14:13:39,153][102898] Updated weights for policy 1, policy_version 61570 (0.0007) +[2023-10-08 14:13:39,397][102897] Updated weights for policy 0, policy_version 61510 (0.0008) +[2023-10-08 14:13:39,512][102898] Updated weights for policy 1, policy_version 61580 (0.0007) +[2023-10-08 14:13:39,762][102897] Updated weights for policy 0, policy_version 61520 (0.0009) +[2023-10-08 14:13:39,874][102898] Updated weights for policy 1, policy_version 61590 (0.0009) +[2023-10-08 14:13:40,130][102897] Updated weights for policy 0, policy_version 61530 (0.0007) +[2023-10-08 14:13:40,233][102898] Updated weights for policy 1, policy_version 61600 (0.0009) +[2023-10-08 14:13:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 126091264. Throughput: 0: 1771.6, 1: 1769.9. Samples: 31528016. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:41,876][101941] Avg episode reward: [(0, '8.280'), (1, '6.920')] +[2023-10-08 14:13:43,852][102897] Updated weights for policy 0, policy_version 61540 (0.0009) +[2023-10-08 14:13:44,162][102898] Updated weights for policy 1, policy_version 61610 (0.0007) +[2023-10-08 14:13:44,221][102897] Updated weights for policy 0, policy_version 61550 (0.0008) +[2023-10-08 14:13:44,540][102898] Updated weights for policy 1, policy_version 61620 (0.0007) +[2023-10-08 14:13:44,593][102897] Updated weights for policy 0, policy_version 61560 (0.0007) +[2023-10-08 14:13:44,917][102898] Updated weights for policy 1, policy_version 61630 (0.0007) +[2023-10-08 14:13:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 126156800. Throughput: 0: 1773.3, 1: 1770.8. Samples: 31550012. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:46,876][101941] Avg episode reward: [(0, '8.130'), (1, '7.470')] +[2023-10-08 14:13:48,503][102897] Updated weights for policy 0, policy_version 61570 (0.0008) +[2023-10-08 14:13:48,698][102898] Updated weights for policy 1, policy_version 61640 (0.0008) +[2023-10-08 14:13:48,896][102897] Updated weights for policy 0, policy_version 61580 (0.0007) +[2023-10-08 14:13:49,060][102898] Updated weights for policy 1, policy_version 61650 (0.0007) +[2023-10-08 14:13:49,262][102897] Updated weights for policy 0, policy_version 61590 (0.0008) +[2023-10-08 14:13:49,431][102898] Updated weights for policy 1, policy_version 61660 (0.0007) +[2023-10-08 14:13:49,631][102897] Updated weights for policy 0, policy_version 61600 (0.0008) +[2023-10-08 14:13:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126222336. Throughput: 0: 1784.8, 1: 1770.8. Samples: 31560002. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:51,876][101941] Avg episode reward: [(0, '7.700'), (1, '7.300')] +[2023-10-08 14:13:53,163][102897] Updated weights for policy 0, policy_version 61610 (0.0007) +[2023-10-08 14:13:53,325][102898] Updated weights for policy 1, policy_version 61670 (0.0008) +[2023-10-08 14:13:53,529][102897] Updated weights for policy 0, policy_version 61620 (0.0008) +[2023-10-08 14:13:53,695][102898] Updated weights for policy 1, policy_version 61680 (0.0008) +[2023-10-08 14:13:53,904][102897] Updated weights for policy 0, policy_version 61630 (0.0010) +[2023-10-08 14:13:54,058][102898] Updated weights for policy 1, policy_version 61690 (0.0007) +[2023-10-08 14:13:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126287872. Throughput: 0: 1786.8, 1: 1771.8. Samples: 31581864. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:13:56,875][101941] Avg episode reward: [(0, '7.940'), (1, '7.270')] +[2023-10-08 14:13:57,674][102897] Updated weights for policy 0, policy_version 61640 (0.0008) +[2023-10-08 14:13:57,765][102898] Updated weights for policy 1, policy_version 61700 (0.0009) +[2023-10-08 14:13:58,046][102897] Updated weights for policy 0, policy_version 61650 (0.0009) +[2023-10-08 14:13:58,124][102898] Updated weights for policy 1, policy_version 61710 (0.0009) +[2023-10-08 14:13:58,418][102897] Updated weights for policy 0, policy_version 61660 (0.0007) +[2023-10-08 14:13:58,491][102898] Updated weights for policy 1, policy_version 61720 (0.0010) +[2023-10-08 14:14:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126353408. Throughput: 0: 1789.3, 1: 1784.9. Samples: 31604192. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:14:01,876][101941] Avg episode reward: [(0, '8.190'), (1, '7.690')] +[2023-10-08 14:14:02,062][102897] Updated weights for policy 0, policy_version 61670 (0.0008) +[2023-10-08 14:14:02,356][102898] Updated weights for policy 1, policy_version 61730 (0.0008) +[2023-10-08 14:14:02,439][102897] Updated weights for policy 0, policy_version 61680 (0.0009) +[2023-10-08 14:14:02,723][102898] Updated weights for policy 1, policy_version 61740 (0.0008) +[2023-10-08 14:14:02,798][102897] Updated weights for policy 0, policy_version 61690 (0.0008) +[2023-10-08 14:14:03,086][102898] Updated weights for policy 1, policy_version 61750 (0.0007) +[2023-10-08 14:14:03,447][102898] Updated weights for policy 1, policy_version 61760 (0.0009) +[2023-10-08 14:14:06,668][102897] Updated weights for policy 0, policy_version 61700 (0.0008) +[2023-10-08 14:14:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126418944. Throughput: 0: 1782.4, 1: 1772.8. Samples: 31613782. Policy #0 lag: (min: 12.0, avg: 13.2, max: 35.0) +[2023-10-08 14:14:06,876][101941] Avg episode reward: [(0, '8.470'), (1, '7.850')] +[2023-10-08 14:14:07,032][102897] Updated weights for policy 0, policy_version 61710 (0.0009) +[2023-10-08 14:14:07,279][102898] Updated weights for policy 1, policy_version 61770 (0.0007) +[2023-10-08 14:14:07,408][102897] Updated weights for policy 0, policy_version 61720 (0.0008) +[2023-10-08 14:14:07,655][102898] Updated weights for policy 1, policy_version 61780 (0.0007) +[2023-10-08 14:14:08,021][102898] Updated weights for policy 1, policy_version 61790 (0.0008) +[2023-10-08 14:14:11,157][102897] Updated weights for policy 0, policy_version 61730 (0.0009) +[2023-10-08 14:14:11,527][102897] Updated weights for policy 0, policy_version 61740 (0.0008) +[2023-10-08 14:14:11,842][102898] Updated weights for policy 1, policy_version 61800 (0.0008) +[2023-10-08 14:14:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 126484480. Throughput: 0: 1780.7, 1: 1773.4. Samples: 31636038. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:11,876][101941] Avg episode reward: [(0, '7.860'), (1, '7.880')] +[2023-10-08 14:14:11,896][102897] Updated weights for policy 0, policy_version 61750 (0.0008) +[2023-10-08 14:14:12,206][102898] Updated weights for policy 1, policy_version 61810 (0.0007) +[2023-10-08 14:14:12,264][102897] Updated weights for policy 0, policy_version 61760 (0.0008) +[2023-10-08 14:14:12,582][102898] Updated weights for policy 1, policy_version 61820 (0.0008) +[2023-10-08 14:14:16,112][102897] Updated weights for policy 0, policy_version 61770 (0.0007) +[2023-10-08 14:14:16,193][102898] Updated weights for policy 1, policy_version 61830 (0.0008) +[2023-10-08 14:14:16,480][102897] Updated weights for policy 0, policy_version 61780 (0.0007) +[2023-10-08 14:14:16,551][102898] Updated weights for policy 1, policy_version 61840 (0.0007) +[2023-10-08 14:14:16,849][102897] Updated weights for policy 0, policy_version 61790 (0.0007) +[2023-10-08 14:14:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 126550016. Throughput: 0: 1797.3, 1: 1781.9. Samples: 31657186. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:16,876][101941] Avg episode reward: [(0, '8.150'), (1, '8.300')] +[2023-10-08 14:14:16,915][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000061792_63275008.pth... +[2023-10-08 14:14:16,921][102898] Updated weights for policy 1, policy_version 61850 (0.0007) +[2023-10-08 14:14:16,948][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000060128_61571072.pth +[2023-10-08 14:14:17,140][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000061856_63340544.pth... +[2023-10-08 14:14:17,169][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000060192_61636608.pth +[2023-10-08 14:14:20,657][102898] Updated weights for policy 1, policy_version 61860 (0.0009) +[2023-10-08 14:14:20,693][102897] Updated weights for policy 0, policy_version 61800 (0.0008) +[2023-10-08 14:14:21,021][102898] Updated weights for policy 1, policy_version 61870 (0.0007) +[2023-10-08 14:14:21,067][102897] Updated weights for policy 0, policy_version 61810 (0.0008) +[2023-10-08 14:14:21,375][102898] Updated weights for policy 1, policy_version 61880 (0.0008) +[2023-10-08 14:14:21,437][102897] Updated weights for policy 0, policy_version 61820 (0.0008) +[2023-10-08 14:14:21,875][101941] Fps is (10 sec: 19661.3, 60 sec: 14745.7, 300 sec: 14218.0). Total num frames: 126681088. Throughput: 0: 1780.0, 1: 1771.3. Samples: 31668174. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:21,875][101941] Avg episode reward: [(0, '8.720'), (1, '8.110')] +[2023-10-08 14:14:25,093][102897] Updated weights for policy 0, policy_version 61830 (0.0008) +[2023-10-08 14:14:25,309][102898] Updated weights for policy 1, policy_version 61890 (0.0009) +[2023-10-08 14:14:25,456][102897] Updated weights for policy 0, policy_version 61840 (0.0008) +[2023-10-08 14:14:25,674][102898] Updated weights for policy 1, policy_version 61900 (0.0008) +[2023-10-08 14:14:25,832][102897] Updated weights for policy 0, policy_version 61850 (0.0007) +[2023-10-08 14:14:26,046][102898] Updated weights for policy 1, policy_version 61910 (0.0009) +[2023-10-08 14:14:26,413][102898] Updated weights for policy 1, policy_version 61920 (0.0010) +[2023-10-08 14:14:26,875][101941] Fps is (10 sec: 19661.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126746624. Throughput: 0: 1804.1, 1: 1793.6. Samples: 31689914. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:26,876][101941] Avg episode reward: [(0, '8.380'), (1, '7.810')] +[2023-10-08 14:14:29,333][102897] Updated weights for policy 0, policy_version 61860 (0.0007) +[2023-10-08 14:14:29,703][102897] Updated weights for policy 0, policy_version 61870 (0.0009) +[2023-10-08 14:14:30,071][102897] Updated weights for policy 0, policy_version 61880 (0.0007) +[2023-10-08 14:14:30,301][102898] Updated weights for policy 1, policy_version 61930 (0.0009) +[2023-10-08 14:14:30,663][102898] Updated weights for policy 1, policy_version 61940 (0.0007) +[2023-10-08 14:14:31,039][102898] Updated weights for policy 1, policy_version 61950 (0.0009) +[2023-10-08 14:14:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126812160. Throughput: 0: 1798.7, 1: 1767.7. Samples: 31710502. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:31,876][101941] Avg episode reward: [(0, '8.250'), (1, '8.030')] +[2023-10-08 14:14:33,848][102897] Updated weights for policy 0, policy_version 61890 (0.0010) +[2023-10-08 14:14:34,240][102897] Updated weights for policy 0, policy_version 61900 (0.0009) +[2023-10-08 14:14:34,613][102897] Updated weights for policy 0, policy_version 61910 (0.0009) +[2023-10-08 14:14:34,776][102898] Updated weights for policy 1, policy_version 61960 (0.0009) +[2023-10-08 14:14:34,988][102897] Updated weights for policy 0, policy_version 61920 (0.0007) +[2023-10-08 14:14:35,146][102898] Updated weights for policy 1, policy_version 61970 (0.0009) +[2023-10-08 14:14:35,512][102898] Updated weights for policy 1, policy_version 61980 (0.0009) +[2023-10-08 14:14:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126877696. Throughput: 0: 1805.5, 1: 1802.1. Samples: 31722346. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:36,876][101941] Avg episode reward: [(0, '8.190'), (1, '8.090')] +[2023-10-08 14:14:38,712][102897] Updated weights for policy 0, policy_version 61930 (0.0010) +[2023-10-08 14:14:39,079][102897] Updated weights for policy 0, policy_version 61940 (0.0008) +[2023-10-08 14:14:39,229][102898] Updated weights for policy 1, policy_version 61990 (0.0010) +[2023-10-08 14:14:39,451][102897] Updated weights for policy 0, policy_version 61950 (0.0008) +[2023-10-08 14:14:39,589][102898] Updated weights for policy 1, policy_version 62000 (0.0009) +[2023-10-08 14:14:39,952][102898] Updated weights for policy 1, policy_version 62010 (0.0009) +[2023-10-08 14:14:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 126943232. Throughput: 0: 1791.2, 1: 1775.5. Samples: 31742370. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:41,876][101941] Avg episode reward: [(0, '8.070'), (1, '7.480')] +[2023-10-08 14:14:43,113][102897] Updated weights for policy 0, policy_version 61960 (0.0007) +[2023-10-08 14:14:43,480][102897] Updated weights for policy 0, policy_version 61970 (0.0007) +[2023-10-08 14:14:43,767][102898] Updated weights for policy 1, policy_version 62020 (0.0009) +[2023-10-08 14:14:43,852][102897] Updated weights for policy 0, policy_version 61980 (0.0009) +[2023-10-08 14:14:44,125][102898] Updated weights for policy 1, policy_version 62030 (0.0008) +[2023-10-08 14:14:44,493][102898] Updated weights for policy 1, policy_version 62040 (0.0008) +[2023-10-08 14:14:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127008768. Throughput: 0: 1796.9, 1: 1774.3. Samples: 31764898. Policy #0 lag: (min: 31.0, avg: 31.2, max: 40.0) +[2023-10-08 14:14:46,876][101941] Avg episode reward: [(0, '7.670'), (1, '7.600')] +[2023-10-08 14:14:47,695][102897] Updated weights for policy 0, policy_version 61990 (0.0007) +[2023-10-08 14:14:48,059][102897] Updated weights for policy 0, policy_version 62000 (0.0008) +[2023-10-08 14:14:48,348][102898] Updated weights for policy 1, policy_version 62050 (0.0008) +[2023-10-08 14:14:48,429][102897] Updated weights for policy 0, policy_version 62010 (0.0009) +[2023-10-08 14:14:48,720][102898] Updated weights for policy 1, policy_version 62060 (0.0007) +[2023-10-08 14:14:49,091][102898] Updated weights for policy 1, policy_version 62070 (0.0009) +[2023-10-08 14:14:49,452][102898] Updated weights for policy 1, policy_version 62080 (0.0010) +[2023-10-08 14:14:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127074304. Throughput: 0: 1796.5, 1: 1776.8. Samples: 31774582. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:14:51,875][101941] Avg episode reward: [(0, '7.400'), (1, '6.950')] +[2023-10-08 14:14:52,322][102897] Updated weights for policy 0, policy_version 62020 (0.0009) +[2023-10-08 14:14:52,694][102897] Updated weights for policy 0, policy_version 62030 (0.0009) +[2023-10-08 14:14:53,073][102897] Updated weights for policy 0, policy_version 62040 (0.0008) +[2023-10-08 14:14:53,343][102898] Updated weights for policy 1, policy_version 62090 (0.0009) +[2023-10-08 14:14:53,706][102898] Updated weights for policy 1, policy_version 62100 (0.0009) +[2023-10-08 14:14:54,072][102898] Updated weights for policy 1, policy_version 62110 (0.0008) +[2023-10-08 14:14:56,851][102897] Updated weights for policy 0, policy_version 62050 (0.0009) +[2023-10-08 14:14:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 127139840. Throughput: 0: 1793.5, 1: 1780.7. Samples: 31796878. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:14:56,876][101941] Avg episode reward: [(0, '7.600'), (1, '7.310')] +[2023-10-08 14:14:57,227][102897] Updated weights for policy 0, policy_version 62060 (0.0010) +[2023-10-08 14:14:57,598][102897] Updated weights for policy 0, policy_version 62070 (0.0007) +[2023-10-08 14:14:57,811][102898] Updated weights for policy 1, policy_version 62120 (0.0008) +[2023-10-08 14:14:57,967][102897] Updated weights for policy 0, policy_version 62080 (0.0008) +[2023-10-08 14:14:58,182][102898] Updated weights for policy 1, policy_version 62130 (0.0009) +[2023-10-08 14:14:58,544][102898] Updated weights for policy 1, policy_version 62140 (0.0008) +[2023-10-08 14:15:01,728][102897] Updated weights for policy 0, policy_version 62090 (0.0009) +[2023-10-08 14:15:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127205376. Throughput: 0: 1807.8, 1: 1784.5. Samples: 31818838. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:15:01,876][101941] Avg episode reward: [(0, '7.730'), (1, '8.320')] +[2023-10-08 14:15:02,097][102897] Updated weights for policy 0, policy_version 62100 (0.0009) +[2023-10-08 14:15:02,254][102898] Updated weights for policy 1, policy_version 62150 (0.0009) +[2023-10-08 14:15:02,464][102897] Updated weights for policy 0, policy_version 62110 (0.0010) +[2023-10-08 14:15:02,608][102898] Updated weights for policy 1, policy_version 62160 (0.0007) +[2023-10-08 14:15:02,979][102898] Updated weights for policy 1, policy_version 62170 (0.0007) +[2023-10-08 14:15:06,175][102897] Updated weights for policy 0, policy_version 62120 (0.0008) +[2023-10-08 14:15:06,537][102897] Updated weights for policy 0, policy_version 62130 (0.0010) +[2023-10-08 14:15:06,830][102898] Updated weights for policy 1, policy_version 62180 (0.0008) +[2023-10-08 14:15:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127270912. Throughput: 0: 1796.4, 1: 1769.0. Samples: 31828618. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:15:06,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.440')] +[2023-10-08 14:15:06,909][102897] Updated weights for policy 0, policy_version 62140 (0.0007) +[2023-10-08 14:15:07,198][102898] Updated weights for policy 1, policy_version 62190 (0.0008) +[2023-10-08 14:15:07,550][102898] Updated weights for policy 1, policy_version 62200 (0.0010) +[2023-10-08 14:15:10,767][102897] Updated weights for policy 0, policy_version 62150 (0.0008) +[2023-10-08 14:15:11,139][102897] Updated weights for policy 0, policy_version 62160 (0.0007) +[2023-10-08 14:15:11,232][102898] Updated weights for policy 1, policy_version 62210 (0.0007) +[2023-10-08 14:15:11,508][102897] Updated weights for policy 0, policy_version 62170 (0.0007) +[2023-10-08 14:15:11,596][102898] Updated weights for policy 1, policy_version 62220 (0.0008) +[2023-10-08 14:15:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 127369216. Throughput: 0: 1796.6, 1: 1779.0. Samples: 31850814. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:15:11,876][101941] Avg episode reward: [(0, '7.890'), (1, '7.670')] +[2023-10-08 14:15:11,963][102898] Updated weights for policy 1, policy_version 62230 (0.0008) +[2023-10-08 14:15:12,334][102898] Updated weights for policy 1, policy_version 62240 (0.0007) +[2023-10-08 14:15:15,271][102897] Updated weights for policy 0, policy_version 62180 (0.0007) +[2023-10-08 14:15:15,643][102897] Updated weights for policy 0, policy_version 62190 (0.0009) +[2023-10-08 14:15:16,014][102897] Updated weights for policy 0, policy_version 62200 (0.0008) +[2023-10-08 14:15:16,271][102898] Updated weights for policy 1, policy_version 62250 (0.0007) +[2023-10-08 14:15:16,645][102898] Updated weights for policy 1, policy_version 62260 (0.0008) +[2023-10-08 14:15:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14106.9). Total num frames: 127434752. Throughput: 0: 1769.8, 1: 1789.7. Samples: 31870678. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:15:16,876][101941] Avg episode reward: [(0, '7.980'), (1, '7.490')] +[2023-10-08 14:15:17,012][102898] Updated weights for policy 1, policy_version 62270 (0.0009) +[2023-10-08 14:15:19,997][102897] Updated weights for policy 0, policy_version 62210 (0.0007) +[2023-10-08 14:15:20,406][102897] Updated weights for policy 0, policy_version 62220 (0.0007) +[2023-10-08 14:15:20,776][102897] Updated weights for policy 0, policy_version 62230 (0.0007) +[2023-10-08 14:15:20,893][102898] Updated weights for policy 1, policy_version 62280 (0.0008) +[2023-10-08 14:15:21,146][102897] Updated weights for policy 0, policy_version 62240 (0.0008) +[2023-10-08 14:15:21,262][102898] Updated weights for policy 1, policy_version 62290 (0.0008) +[2023-10-08 14:15:21,623][102898] Updated weights for policy 1, policy_version 62300 (0.0009) +[2023-10-08 14:15:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127533056. Throughput: 0: 1785.2, 1: 1765.4. Samples: 31882122. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:15:21,876][101941] Avg episode reward: [(0, '7.510'), (1, '8.420')] +[2023-10-08 14:15:24,987][102897] Updated weights for policy 0, policy_version 62250 (0.0007) +[2023-10-08 14:15:25,352][102897] Updated weights for policy 0, policy_version 62260 (0.0008) +[2023-10-08 14:15:25,432][102898] Updated weights for policy 1, policy_version 62310 (0.0008) +[2023-10-08 14:15:25,719][102897] Updated weights for policy 0, policy_version 62270 (0.0008) +[2023-10-08 14:15:25,786][102898] Updated weights for policy 1, policy_version 62320 (0.0008) +[2023-10-08 14:15:26,153][102898] Updated weights for policy 1, policy_version 62330 (0.0010) +[2023-10-08 14:15:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127598592. Throughput: 0: 1775.6, 1: 1787.5. Samples: 31902708. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:15:26,875][101941] Avg episode reward: [(0, '7.540'), (1, '8.650')] +[2023-10-08 14:15:29,468][102897] Updated weights for policy 0, policy_version 62280 (0.0007) +[2023-10-08 14:15:29,852][102897] Updated weights for policy 0, policy_version 62290 (0.0007) +[2023-10-08 14:15:29,970][102898] Updated weights for policy 1, policy_version 62340 (0.0009) +[2023-10-08 14:15:30,215][102897] Updated weights for policy 0, policy_version 62300 (0.0007) +[2023-10-08 14:15:30,344][102898] Updated weights for policy 1, policy_version 62350 (0.0008) +[2023-10-08 14:15:30,703][102898] Updated weights for policy 1, policy_version 62360 (0.0010) +[2023-10-08 14:15:31,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127664128. Throughput: 0: 1758.8, 1: 1763.0. Samples: 31923382. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:15:31,876][101941] Avg episode reward: [(0, '7.690'), (1, '8.760')] +[2023-10-08 14:15:34,069][102897] Updated weights for policy 0, policy_version 62310 (0.0007) +[2023-10-08 14:15:34,435][102897] Updated weights for policy 0, policy_version 62320 (0.0009) +[2023-10-08 14:15:34,517][102898] Updated weights for policy 1, policy_version 62370 (0.0009) +[2023-10-08 14:15:34,804][102897] Updated weights for policy 0, policy_version 62330 (0.0008) +[2023-10-08 14:15:34,890][102898] Updated weights for policy 1, policy_version 62380 (0.0007) +[2023-10-08 14:15:35,252][102898] Updated weights for policy 1, policy_version 62390 (0.0007) +[2023-10-08 14:15:35,616][102898] Updated weights for policy 1, policy_version 62400 (0.0008) +[2023-10-08 14:15:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127729664. Throughput: 0: 1776.9, 1: 1791.5. Samples: 31935160. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:15:36,876][101941] Avg episode reward: [(0, '7.460'), (1, '8.830')] +[2023-10-08 14:15:38,491][102897] Updated weights for policy 0, policy_version 62340 (0.0009) +[2023-10-08 14:15:38,865][102897] Updated weights for policy 0, policy_version 62350 (0.0008) +[2023-10-08 14:15:39,233][102897] Updated weights for policy 0, policy_version 62360 (0.0009) +[2023-10-08 14:15:39,418][102898] Updated weights for policy 1, policy_version 62410 (0.0007) +[2023-10-08 14:15:39,782][102898] Updated weights for policy 1, policy_version 62420 (0.0008) +[2023-10-08 14:15:40,147][102898] Updated weights for policy 1, policy_version 62430 (0.0007) +[2023-10-08 14:15:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127795200. Throughput: 0: 1758.4, 1: 1757.4. Samples: 31955088. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:15:41,875][101941] Avg episode reward: [(0, '8.020'), (1, '8.390')] +[2023-10-08 14:15:43,207][102897] Updated weights for policy 0, policy_version 62370 (0.0008) +[2023-10-08 14:15:43,574][102897] Updated weights for policy 0, policy_version 62380 (0.0007) +[2023-10-08 14:15:43,943][102897] Updated weights for policy 0, policy_version 62390 (0.0009) +[2023-10-08 14:15:43,966][102898] Updated weights for policy 1, policy_version 62440 (0.0008) +[2023-10-08 14:15:44,316][102897] Updated weights for policy 0, policy_version 62400 (0.0007) +[2023-10-08 14:15:44,325][102898] Updated weights for policy 1, policy_version 62450 (0.0007) +[2023-10-08 14:15:44,684][102898] Updated weights for policy 1, policy_version 62460 (0.0009) +[2023-10-08 14:15:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 127860736. Throughput: 0: 1761.5, 1: 1759.7. Samples: 31977292. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:15:46,876][101941] Avg episode reward: [(0, '8.150'), (1, '7.920')] +[2023-10-08 14:15:48,079][102897] Updated weights for policy 0, policy_version 62410 (0.0011) +[2023-10-08 14:15:48,438][102897] Updated weights for policy 0, policy_version 62420 (0.0007) +[2023-10-08 14:15:48,558][102898] Updated weights for policy 1, policy_version 62470 (0.0009) +[2023-10-08 14:15:48,812][102897] Updated weights for policy 0, policy_version 62430 (0.0007) +[2023-10-08 14:15:48,924][102898] Updated weights for policy 1, policy_version 62480 (0.0007) +[2023-10-08 14:15:49,287][102898] Updated weights for policy 1, policy_version 62490 (0.0007) +[2023-10-08 14:15:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 127926272. Throughput: 0: 1759.2, 1: 1761.6. Samples: 31987056. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:15:51,876][101941] Avg episode reward: [(0, '8.390'), (1, '7.700')] +[2023-10-08 14:15:52,522][102897] Updated weights for policy 0, policy_version 62440 (0.0007) +[2023-10-08 14:15:52,894][102897] Updated weights for policy 0, policy_version 62450 (0.0008) +[2023-10-08 14:15:53,197][102898] Updated weights for policy 1, policy_version 62500 (0.0007) +[2023-10-08 14:15:53,258][102897] Updated weights for policy 0, policy_version 62460 (0.0008) +[2023-10-08 14:15:53,563][102898] Updated weights for policy 1, policy_version 62510 (0.0007) +[2023-10-08 14:15:53,923][102898] Updated weights for policy 1, policy_version 62520 (0.0009) +[2023-10-08 14:15:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 127991808. Throughput: 0: 1764.7, 1: 1757.0. Samples: 32009290. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:15:56,875][101941] Avg episode reward: [(0, '7.580'), (1, '8.030')] +[2023-10-08 14:15:57,061][102897] Updated weights for policy 0, policy_version 62470 (0.0009) +[2023-10-08 14:15:57,431][102897] Updated weights for policy 0, policy_version 62480 (0.0010) +[2023-10-08 14:15:57,621][102898] Updated weights for policy 1, policy_version 62530 (0.0008) +[2023-10-08 14:15:57,805][102897] Updated weights for policy 0, policy_version 62490 (0.0008) +[2023-10-08 14:15:57,993][102898] Updated weights for policy 1, policy_version 62540 (0.0007) +[2023-10-08 14:15:58,362][102898] Updated weights for policy 1, policy_version 62550 (0.0009) +[2023-10-08 14:15:58,735][102898] Updated weights for policy 1, policy_version 62560 (0.0007) +[2023-10-08 14:16:01,609][102897] Updated weights for policy 0, policy_version 62500 (0.0008) +[2023-10-08 14:16:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128057344. Throughput: 0: 1794.7, 1: 1779.2. Samples: 32031506. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:16:01,876][101941] Avg episode reward: [(0, '7.570'), (1, '7.800')] +[2023-10-08 14:16:01,986][102897] Updated weights for policy 0, policy_version 62510 (0.0009) +[2023-10-08 14:16:02,353][102897] Updated weights for policy 0, policy_version 62520 (0.0008) +[2023-10-08 14:16:02,397][102898] Updated weights for policy 1, policy_version 62570 (0.0009) +[2023-10-08 14:16:02,766][102898] Updated weights for policy 1, policy_version 62580 (0.0009) +[2023-10-08 14:16:03,140][102898] Updated weights for policy 1, policy_version 62590 (0.0008) +[2023-10-08 14:16:06,059][102897] Updated weights for policy 0, policy_version 62530 (0.0007) +[2023-10-08 14:16:06,462][102897] Updated weights for policy 0, policy_version 62540 (0.0010) +[2023-10-08 14:16:06,828][102897] Updated weights for policy 0, policy_version 62550 (0.0009) +[2023-10-08 14:16:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128122880. Throughput: 0: 1770.1, 1: 1766.5. Samples: 32041268. Policy #0 lag: (min: 15.0, avg: 15.0, max: 15.0) +[2023-10-08 14:16:06,876][101941] Avg episode reward: [(0, '7.940'), (1, '8.620')] +[2023-10-08 14:16:06,971][102898] Updated weights for policy 1, policy_version 62600 (0.0008) +[2023-10-08 14:16:07,197][102897] Updated weights for policy 0, policy_version 62560 (0.0007) +[2023-10-08 14:16:07,340][102898] Updated weights for policy 1, policy_version 62610 (0.0009) +[2023-10-08 14:16:07,712][102898] Updated weights for policy 1, policy_version 62620 (0.0011) +[2023-10-08 14:16:11,025][102897] Updated weights for policy 0, policy_version 62570 (0.0010) +[2023-10-08 14:16:11,389][102897] Updated weights for policy 0, policy_version 62580 (0.0009) +[2023-10-08 14:16:11,512][102898] Updated weights for policy 1, policy_version 62630 (0.0009) +[2023-10-08 14:16:11,768][102897] Updated weights for policy 0, policy_version 62590 (0.0007) +[2023-10-08 14:16:11,874][102898] Updated weights for policy 1, policy_version 62640 (0.0009) +[2023-10-08 14:16:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128221184. Throughput: 0: 1797.7, 1: 1776.2. Samples: 32063532. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:11,875][101941] Avg episode reward: [(0, '8.390'), (1, '8.260')] +[2023-10-08 14:16:12,250][102898] Updated weights for policy 1, policy_version 62650 (0.0010) +[2023-10-08 14:16:15,422][102897] Updated weights for policy 0, policy_version 62600 (0.0007) +[2023-10-08 14:16:15,787][102897] Updated weights for policy 0, policy_version 62610 (0.0009) +[2023-10-08 14:16:16,098][102898] Updated weights for policy 1, policy_version 62660 (0.0009) +[2023-10-08 14:16:16,161][102897] Updated weights for policy 0, policy_version 62620 (0.0009) +[2023-10-08 14:16:16,464][102898] Updated weights for policy 1, policy_version 62670 (0.0009) +[2023-10-08 14:16:16,831][102898] Updated weights for policy 1, policy_version 62680 (0.0010) +[2023-10-08 14:16:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 128286720. Throughput: 0: 1777.7, 1: 1785.5. Samples: 32083726. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:16,876][101941] Avg episode reward: [(0, '7.890'), (1, '7.340')] +[2023-10-08 14:16:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000062624_64126976.pth... +[2023-10-08 14:16:16,917][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000060960_62423040.pth +[2023-10-08 14:16:17,125][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000062688_64192512.pth... +[2023-10-08 14:16:17,154][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000061024_62488576.pth +[2023-10-08 14:16:19,811][102897] Updated weights for policy 0, policy_version 62630 (0.0011) +[2023-10-08 14:16:20,193][102897] Updated weights for policy 0, policy_version 62640 (0.0008) +[2023-10-08 14:16:20,539][102898] Updated weights for policy 1, policy_version 62690 (0.0008) +[2023-10-08 14:16:20,554][102897] Updated weights for policy 0, policy_version 62650 (0.0009) +[2023-10-08 14:16:20,900][102898] Updated weights for policy 1, policy_version 62700 (0.0008) +[2023-10-08 14:16:21,266][102898] Updated weights for policy 1, policy_version 62710 (0.0010) +[2023-10-08 14:16:21,630][102898] Updated weights for policy 1, policy_version 62720 (0.0010) +[2023-10-08 14:16:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128385024. Throughput: 0: 1797.8, 1: 1767.1. Samples: 32095578. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:21,876][101941] Avg episode reward: [(0, '7.520'), (1, '7.740')] +[2023-10-08 14:16:24,482][102897] Updated weights for policy 0, policy_version 62660 (0.0008) +[2023-10-08 14:16:24,853][102897] Updated weights for policy 0, policy_version 62670 (0.0007) +[2023-10-08 14:16:25,228][102897] Updated weights for policy 0, policy_version 62680 (0.0007) +[2023-10-08 14:16:25,619][102898] Updated weights for policy 1, policy_version 62730 (0.0008) +[2023-10-08 14:16:25,981][102898] Updated weights for policy 1, policy_version 62740 (0.0010) +[2023-10-08 14:16:26,350][102898] Updated weights for policy 1, policy_version 62750 (0.0010) +[2023-10-08 14:16:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 128450560. Throughput: 0: 1790.8, 1: 1793.3. Samples: 32116372. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:26,876][101941] Avg episode reward: [(0, '7.770'), (1, '8.330')] +[2023-10-08 14:16:28,799][102897] Updated weights for policy 0, policy_version 62690 (0.0007) +[2023-10-08 14:16:29,181][102897] Updated weights for policy 0, policy_version 62700 (0.0008) +[2023-10-08 14:16:29,549][102897] Updated weights for policy 0, policy_version 62710 (0.0009) +[2023-10-08 14:16:29,925][102897] Updated weights for policy 0, policy_version 62720 (0.0008) +[2023-10-08 14:16:30,206][102898] Updated weights for policy 1, policy_version 62760 (0.0008) +[2023-10-08 14:16:30,567][102898] Updated weights for policy 1, policy_version 62770 (0.0008) +[2023-10-08 14:16:30,924][102898] Updated weights for policy 1, policy_version 62780 (0.0008) +[2023-10-08 14:16:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128516096. Throughput: 0: 1781.2, 1: 1770.6. Samples: 32137122. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:31,876][101941] Avg episode reward: [(0, '7.650'), (1, '8.380')] +[2023-10-08 14:16:33,793][102897] Updated weights for policy 0, policy_version 62730 (0.0009) +[2023-10-08 14:16:34,157][102897] Updated weights for policy 0, policy_version 62740 (0.0009) +[2023-10-08 14:16:34,521][102897] Updated weights for policy 0, policy_version 62750 (0.0009) +[2023-10-08 14:16:34,623][102898] Updated weights for policy 1, policy_version 62790 (0.0008) +[2023-10-08 14:16:34,989][102898] Updated weights for policy 1, policy_version 62800 (0.0008) +[2023-10-08 14:16:35,363][102898] Updated weights for policy 1, policy_version 62810 (0.0008) +[2023-10-08 14:16:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128581632. Throughput: 0: 1786.4, 1: 1800.8. Samples: 32148476. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:36,875][101941] Avg episode reward: [(0, '7.640'), (1, '8.300')] +[2023-10-08 14:16:38,206][102897] Updated weights for policy 0, policy_version 62760 (0.0008) +[2023-10-08 14:16:38,566][102897] Updated weights for policy 0, policy_version 62770 (0.0009) +[2023-10-08 14:16:38,942][102897] Updated weights for policy 0, policy_version 62780 (0.0008) +[2023-10-08 14:16:38,965][102898] Updated weights for policy 1, policy_version 62820 (0.0010) +[2023-10-08 14:16:39,331][102898] Updated weights for policy 1, policy_version 62830 (0.0007) +[2023-10-08 14:16:39,696][102898] Updated weights for policy 1, policy_version 62840 (0.0007) +[2023-10-08 14:16:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 128647168. Throughput: 0: 1784.9, 1: 1775.1. Samples: 32169490. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:41,876][101941] Avg episode reward: [(0, '7.030'), (1, '8.240')] +[2023-10-08 14:16:42,707][102897] Updated weights for policy 0, policy_version 62790 (0.0007) +[2023-10-08 14:16:43,079][102897] Updated weights for policy 0, policy_version 62800 (0.0008) +[2023-10-08 14:16:43,445][102897] Updated weights for policy 0, policy_version 62810 (0.0007) +[2023-10-08 14:16:43,480][102898] Updated weights for policy 1, policy_version 62850 (0.0010) +[2023-10-08 14:16:43,850][102898] Updated weights for policy 1, policy_version 62860 (0.0011) +[2023-10-08 14:16:44,222][102898] Updated weights for policy 1, policy_version 62870 (0.0011) +[2023-10-08 14:16:44,597][102898] Updated weights for policy 1, policy_version 62880 (0.0011) +[2023-10-08 14:16:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128712704. Throughput: 0: 1791.6, 1: 1769.2. Samples: 32191740. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:46,875][101941] Avg episode reward: [(0, '7.750'), (1, '8.210')] +[2023-10-08 14:16:47,134][102897] Updated weights for policy 0, policy_version 62820 (0.0007) +[2023-10-08 14:16:47,505][102897] Updated weights for policy 0, policy_version 62830 (0.0007) +[2023-10-08 14:16:47,874][102897] Updated weights for policy 0, policy_version 62840 (0.0009) +[2023-10-08 14:16:48,387][102898] Updated weights for policy 1, policy_version 62890 (0.0011) +[2023-10-08 14:16:48,757][102898] Updated weights for policy 1, policy_version 62900 (0.0010) +[2023-10-08 14:16:49,117][102898] Updated weights for policy 1, policy_version 62910 (0.0007) +[2023-10-08 14:16:51,702][102897] Updated weights for policy 0, policy_version 62850 (0.0008) +[2023-10-08 14:16:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128778240. Throughput: 0: 1788.2, 1: 1770.4. Samples: 32201404. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:16:51,876][101941] Avg episode reward: [(0, '7.710'), (1, '8.190')] +[2023-10-08 14:16:52,095][102897] Updated weights for policy 0, policy_version 62860 (0.0009) +[2023-10-08 14:16:52,460][102897] Updated weights for policy 0, policy_version 62870 (0.0007) +[2023-10-08 14:16:52,831][102897] Updated weights for policy 0, policy_version 62880 (0.0008) +[2023-10-08 14:16:52,946][102898] Updated weights for policy 1, policy_version 62920 (0.0008) +[2023-10-08 14:16:53,311][102898] Updated weights for policy 1, policy_version 62930 (0.0010) +[2023-10-08 14:16:53,683][102898] Updated weights for policy 1, policy_version 62940 (0.0007) +[2023-10-08 14:16:56,635][102897] Updated weights for policy 0, policy_version 62890 (0.0011) +[2023-10-08 14:16:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128843776. Throughput: 0: 1786.6, 1: 1770.6. Samples: 32223606. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:16:56,875][101941] Avg episode reward: [(0, '8.100'), (1, '7.920')] +[2023-10-08 14:16:57,009][102897] Updated weights for policy 0, policy_version 62900 (0.0010) +[2023-10-08 14:16:57,371][102897] Updated weights for policy 0, policy_version 62910 (0.0009) +[2023-10-08 14:16:57,630][102898] Updated weights for policy 1, policy_version 62950 (0.0007) +[2023-10-08 14:16:57,994][102898] Updated weights for policy 1, policy_version 62960 (0.0008) +[2023-10-08 14:16:58,365][102898] Updated weights for policy 1, policy_version 62970 (0.0009) +[2023-10-08 14:17:01,097][102897] Updated weights for policy 0, policy_version 62920 (0.0008) +[2023-10-08 14:17:01,471][102897] Updated weights for policy 0, policy_version 62930 (0.0007) +[2023-10-08 14:17:01,830][102897] Updated weights for policy 0, policy_version 62940 (0.0010) +[2023-10-08 14:17:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 128909312. Throughput: 0: 1802.7, 1: 1788.4. Samples: 32245322. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:01,875][101941] Avg episode reward: [(0, '7.900'), (1, '7.920')] +[2023-10-08 14:17:02,078][102898] Updated weights for policy 1, policy_version 62980 (0.0008) +[2023-10-08 14:17:02,448][102898] Updated weights for policy 1, policy_version 62990 (0.0007) +[2023-10-08 14:17:02,822][102898] Updated weights for policy 1, policy_version 63000 (0.0008) +[2023-10-08 14:17:05,583][102897] Updated weights for policy 0, policy_version 62950 (0.0009) +[2023-10-08 14:17:05,941][102897] Updated weights for policy 0, policy_version 62960 (0.0007) +[2023-10-08 14:17:06,319][102897] Updated weights for policy 0, policy_version 62970 (0.0008) +[2023-10-08 14:17:06,633][102898] Updated weights for policy 1, policy_version 63010 (0.0009) +[2023-10-08 14:17:06,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 129007616. Throughput: 0: 1784.9, 1: 1773.6. Samples: 32255710. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:06,876][101941] Avg episode reward: [(0, '8.750'), (1, '8.400')] +[2023-10-08 14:17:07,008][102898] Updated weights for policy 1, policy_version 63020 (0.0009) +[2023-10-08 14:17:07,377][102898] Updated weights for policy 1, policy_version 63030 (0.0008) +[2023-10-08 14:17:07,738][102898] Updated weights for policy 1, policy_version 63040 (0.0007) +[2023-10-08 14:17:09,993][102897] Updated weights for policy 0, policy_version 62980 (0.0007) +[2023-10-08 14:17:10,357][102897] Updated weights for policy 0, policy_version 62990 (0.0008) +[2023-10-08 14:17:10,729][102897] Updated weights for policy 0, policy_version 63000 (0.0010) +[2023-10-08 14:17:11,488][102898] Updated weights for policy 1, policy_version 63050 (0.0008) +[2023-10-08 14:17:11,863][102898] Updated weights for policy 1, policy_version 63060 (0.0009) +[2023-10-08 14:17:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 129073152. Throughput: 0: 1803.5, 1: 1780.4. Samples: 32277646. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:11,875][101941] Avg episode reward: [(0, '9.350'), (1, '8.280')] +[2023-10-08 14:17:11,876][102634] Saving new best policy, reward=9.350! +[2023-10-08 14:17:12,223][102898] Updated weights for policy 1, policy_version 63070 (0.0007) +[2023-10-08 14:17:14,393][102897] Updated weights for policy 0, policy_version 63010 (0.0009) +[2023-10-08 14:17:14,768][102897] Updated weights for policy 0, policy_version 63020 (0.0007) +[2023-10-08 14:17:15,143][102897] Updated weights for policy 0, policy_version 63030 (0.0010) +[2023-10-08 14:17:15,516][102897] Updated weights for policy 0, policy_version 63040 (0.0008) +[2023-10-08 14:17:15,877][102898] Updated weights for policy 1, policy_version 63080 (0.0008) +[2023-10-08 14:17:16,243][102898] Updated weights for policy 1, policy_version 63090 (0.0009) +[2023-10-08 14:17:16,613][102898] Updated weights for policy 1, policy_version 63100 (0.0007) +[2023-10-08 14:17:16,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 129171456. Throughput: 0: 1797.2, 1: 1789.3. Samples: 32298514. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:16,876][101941] Avg episode reward: [(0, '9.130'), (1, '8.350')] +[2023-10-08 14:17:19,226][102897] Updated weights for policy 0, policy_version 63050 (0.0007) +[2023-10-08 14:17:19,606][102897] Updated weights for policy 0, policy_version 63060 (0.0007) +[2023-10-08 14:17:19,975][102897] Updated weights for policy 0, policy_version 63070 (0.0008) +[2023-10-08 14:17:20,450][102898] Updated weights for policy 1, policy_version 63110 (0.0009) +[2023-10-08 14:17:20,819][102898] Updated weights for policy 1, policy_version 63120 (0.0008) +[2023-10-08 14:17:21,194][102898] Updated weights for policy 1, policy_version 63130 (0.0007) +[2023-10-08 14:17:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 129236992. Throughput: 0: 1813.0, 1: 1780.1. Samples: 32310166. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:21,876][101941] Avg episode reward: [(0, '8.860'), (1, '8.960')] +[2023-10-08 14:17:23,602][102897] Updated weights for policy 0, policy_version 63080 (0.0008) +[2023-10-08 14:17:23,963][102897] Updated weights for policy 0, policy_version 63090 (0.0007) +[2023-10-08 14:17:24,337][102897] Updated weights for policy 0, policy_version 63100 (0.0009) +[2023-10-08 14:17:25,061][102898] Updated weights for policy 1, policy_version 63140 (0.0008) +[2023-10-08 14:17:25,432][102898] Updated weights for policy 1, policy_version 63150 (0.0008) +[2023-10-08 14:17:25,799][102898] Updated weights for policy 1, policy_version 63160 (0.0010) +[2023-10-08 14:17:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 129302528. Throughput: 0: 1799.1, 1: 1794.3. Samples: 32331192. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:26,876][101941] Avg episode reward: [(0, '8.980'), (1, '8.380')] +[2023-10-08 14:17:28,145][102897] Updated weights for policy 0, policy_version 63110 (0.0007) +[2023-10-08 14:17:28,514][102897] Updated weights for policy 0, policy_version 63120 (0.0009) +[2023-10-08 14:17:28,888][102897] Updated weights for policy 0, policy_version 63130 (0.0008) +[2023-10-08 14:17:29,550][102898] Updated weights for policy 1, policy_version 63170 (0.0009) +[2023-10-08 14:17:29,916][102898] Updated weights for policy 1, policy_version 63180 (0.0010) +[2023-10-08 14:17:30,289][102898] Updated weights for policy 1, policy_version 63190 (0.0008) +[2023-10-08 14:17:30,662][102898] Updated weights for policy 1, policy_version 63200 (0.0008) +[2023-10-08 14:17:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 129368064. Throughput: 0: 1800.8, 1: 1779.8. Samples: 32352866. Policy #0 lag: (min: 18.0, avg: 18.0, max: 22.0) +[2023-10-08 14:17:31,876][101941] Avg episode reward: [(0, '8.980'), (1, '8.200')] +[2023-10-08 14:17:32,596][102897] Updated weights for policy 0, policy_version 63140 (0.0009) +[2023-10-08 14:17:32,969][102897] Updated weights for policy 0, policy_version 63150 (0.0007) +[2023-10-08 14:17:33,337][102897] Updated weights for policy 0, policy_version 63160 (0.0007) +[2023-10-08 14:17:34,443][102898] Updated weights for policy 1, policy_version 63210 (0.0007) +[2023-10-08 14:17:34,806][102898] Updated weights for policy 1, policy_version 63220 (0.0007) +[2023-10-08 14:17:35,175][102898] Updated weights for policy 1, policy_version 63230 (0.0007) +[2023-10-08 14:17:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 129433600. Throughput: 0: 1798.2, 1: 1804.0. Samples: 32363506. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:17:36,876][101941] Avg episode reward: [(0, '8.620'), (1, '7.820')] +[2023-10-08 14:17:37,111][102897] Updated weights for policy 0, policy_version 63170 (0.0008) +[2023-10-08 14:17:37,531][102897] Updated weights for policy 0, policy_version 63180 (0.0008) +[2023-10-08 14:17:37,893][102897] Updated weights for policy 0, policy_version 63190 (0.0007) +[2023-10-08 14:17:38,255][102897] Updated weights for policy 0, policy_version 63200 (0.0009) +[2023-10-08 14:17:38,787][102898] Updated weights for policy 1, policy_version 63240 (0.0009) +[2023-10-08 14:17:39,153][102898] Updated weights for policy 1, policy_version 63250 (0.0007) +[2023-10-08 14:17:39,517][102898] Updated weights for policy 1, policy_version 63260 (0.0007) +[2023-10-08 14:17:41,864][102897] Updated weights for policy 0, policy_version 63210 (0.0011) +[2023-10-08 14:17:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 129499136. Throughput: 0: 1804.1, 1: 1783.8. Samples: 32385062. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:17:41,876][101941] Avg episode reward: [(0, '9.080'), (1, '8.140')] +[2023-10-08 14:17:42,239][102897] Updated weights for policy 0, policy_version 63220 (0.0009) +[2023-10-08 14:17:42,601][102897] Updated weights for policy 0, policy_version 63230 (0.0007) +[2023-10-08 14:17:43,334][102898] Updated weights for policy 1, policy_version 63270 (0.0009) +[2023-10-08 14:17:43,707][102898] Updated weights for policy 1, policy_version 63280 (0.0008) +[2023-10-08 14:17:44,077][102898] Updated weights for policy 1, policy_version 63290 (0.0008) +[2023-10-08 14:17:46,367][102897] Updated weights for policy 0, policy_version 63240 (0.0008) +[2023-10-08 14:17:46,751][102897] Updated weights for policy 0, policy_version 63250 (0.0010) +[2023-10-08 14:17:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 129564672. Throughput: 0: 1811.5, 1: 1783.2. Samples: 32407082. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:17:46,875][101941] Avg episode reward: [(0, '8.420'), (1, '8.070')] +[2023-10-08 14:17:47,119][102897] Updated weights for policy 0, policy_version 63260 (0.0009) +[2023-10-08 14:17:47,811][102898] Updated weights for policy 1, policy_version 63300 (0.0009) +[2023-10-08 14:17:48,185][102898] Updated weights for policy 1, policy_version 63310 (0.0011) +[2023-10-08 14:17:48,548][102898] Updated weights for policy 1, policy_version 63320 (0.0010) +[2023-10-08 14:17:51,107][102897] Updated weights for policy 0, policy_version 63270 (0.0008) +[2023-10-08 14:17:51,487][102897] Updated weights for policy 0, policy_version 63280 (0.0009) +[2023-10-08 14:17:51,857][102897] Updated weights for policy 0, policy_version 63290 (0.0007) +[2023-10-08 14:17:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 129630208. Throughput: 0: 1799.7, 1: 1787.0. Samples: 32417110. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:17:51,876][101941] Avg episode reward: [(0, '8.180'), (1, '8.870')] +[2023-10-08 14:17:52,288][102898] Updated weights for policy 1, policy_version 63330 (0.0010) +[2023-10-08 14:17:52,648][102898] Updated weights for policy 1, policy_version 63340 (0.0008) +[2023-10-08 14:17:53,021][102898] Updated weights for policy 1, policy_version 63350 (0.0008) +[2023-10-08 14:17:53,386][102898] Updated weights for policy 1, policy_version 63360 (0.0007) +[2023-10-08 14:17:55,720][102897] Updated weights for policy 0, policy_version 63300 (0.0008) +[2023-10-08 14:17:56,088][102897] Updated weights for policy 0, policy_version 63310 (0.0011) +[2023-10-08 14:17:56,457][102897] Updated weights for policy 0, policy_version 63320 (0.0009) +[2023-10-08 14:17:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 129728512. Throughput: 0: 1803.3, 1: 1790.9. Samples: 32439386. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:17:56,875][101941] Avg episode reward: [(0, '8.040'), (1, '9.420')] +[2023-10-08 14:17:57,061][102898] Updated weights for policy 1, policy_version 63370 (0.0009) +[2023-10-08 14:17:57,437][102898] Updated weights for policy 1, policy_version 63380 (0.0011) +[2023-10-08 14:17:57,808][102898] Updated weights for policy 1, policy_version 63390 (0.0008) +[2023-10-08 14:18:00,191][102897] Updated weights for policy 0, policy_version 63330 (0.0008) +[2023-10-08 14:18:00,557][102897] Updated weights for policy 0, policy_version 63340 (0.0009) +[2023-10-08 14:18:00,926][102897] Updated weights for policy 0, policy_version 63350 (0.0009) +[2023-10-08 14:18:01,296][102897] Updated weights for policy 0, policy_version 63360 (0.0011) +[2023-10-08 14:18:01,588][102898] Updated weights for policy 1, policy_version 63400 (0.0010) +[2023-10-08 14:18:01,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 129794048. Throughput: 0: 1782.6, 1: 1804.2. Samples: 32459920. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:18:01,876][101941] Avg episode reward: [(0, '7.860'), (1, '9.240')] +[2023-10-08 14:18:01,954][102898] Updated weights for policy 1, policy_version 63410 (0.0007) +[2023-10-08 14:18:02,322][102898] Updated weights for policy 1, policy_version 63420 (0.0007) +[2023-10-08 14:18:05,068][102897] Updated weights for policy 0, policy_version 63370 (0.0008) +[2023-10-08 14:18:05,443][102897] Updated weights for policy 0, policy_version 63380 (0.0009) +[2023-10-08 14:18:05,804][102897] Updated weights for policy 0, policy_version 63390 (0.0008) +[2023-10-08 14:18:06,146][102898] Updated weights for policy 1, policy_version 63430 (0.0010) +[2023-10-08 14:18:06,503][102898] Updated weights for policy 1, policy_version 63440 (0.0010) +[2023-10-08 14:18:06,867][102898] Updated weights for policy 1, policy_version 63450 (0.0010) +[2023-10-08 14:18:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 129859584. Throughput: 0: 1797.6, 1: 1785.9. Samples: 32471420. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:18:06,876][101941] Avg episode reward: [(0, '7.820'), (1, '9.050')] +[2023-10-08 14:18:09,628][102897] Updated weights for policy 0, policy_version 63400 (0.0009) +[2023-10-08 14:18:10,004][102897] Updated weights for policy 0, policy_version 63410 (0.0008) +[2023-10-08 14:18:10,371][102897] Updated weights for policy 0, policy_version 63420 (0.0007) +[2023-10-08 14:18:10,676][102898] Updated weights for policy 1, policy_version 63460 (0.0009) +[2023-10-08 14:18:11,044][102898] Updated weights for policy 1, policy_version 63470 (0.0008) +[2023-10-08 14:18:11,408][102898] Updated weights for policy 1, policy_version 63480 (0.0009) +[2023-10-08 14:18:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 129957888. Throughput: 0: 1787.8, 1: 1801.2. Samples: 32492700. Policy #0 lag: (min: 31.0, avg: 41.8, max: 63.0) +[2023-10-08 14:18:11,876][101941] Avg episode reward: [(0, '7.500'), (1, '8.090')] +[2023-10-08 14:18:14,004][102897] Updated weights for policy 0, policy_version 63430 (0.0009) +[2023-10-08 14:18:14,388][102897] Updated weights for policy 0, policy_version 63440 (0.0007) +[2023-10-08 14:18:14,768][102897] Updated weights for policy 0, policy_version 63450 (0.0010) +[2023-10-08 14:18:15,100][102898] Updated weights for policy 1, policy_version 63490 (0.0009) +[2023-10-08 14:18:15,475][102898] Updated weights for policy 1, policy_version 63500 (0.0007) +[2023-10-08 14:18:15,834][102898] Updated weights for policy 1, policy_version 63510 (0.0009) +[2023-10-08 14:18:16,200][102898] Updated weights for policy 1, policy_version 63520 (0.0008) +[2023-10-08 14:18:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 130023424. Throughput: 0: 1784.9, 1: 1788.7. Samples: 32513678. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:16,875][101941] Avg episode reward: [(0, '7.420'), (1, '8.220')] +[2023-10-08 14:18:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000063456_64978944.pth... +[2023-10-08 14:18:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000063520_65044480.pth... +[2023-10-08 14:18:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000061792_63275008.pth +[2023-10-08 14:18:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000061856_63340544.pth +[2023-10-08 14:18:18,342][102897] Updated weights for policy 0, policy_version 63460 (0.0008) +[2023-10-08 14:18:18,710][102897] Updated weights for policy 0, policy_version 63470 (0.0010) +[2023-10-08 14:18:19,071][102897] Updated weights for policy 0, policy_version 63480 (0.0009) +[2023-10-08 14:18:19,968][102898] Updated weights for policy 1, policy_version 63530 (0.0009) +[2023-10-08 14:18:20,326][102898] Updated weights for policy 1, policy_version 63540 (0.0010) +[2023-10-08 14:18:20,691][102898] Updated weights for policy 1, policy_version 63550 (0.0009) +[2023-10-08 14:18:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 130088960. Throughput: 0: 1787.0, 1: 1799.3. Samples: 32524890. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:21,875][101941] Avg episode reward: [(0, '7.630'), (1, '8.850')] +[2023-10-08 14:18:22,825][102897] Updated weights for policy 0, policy_version 63490 (0.0008) +[2023-10-08 14:18:23,212][102897] Updated weights for policy 0, policy_version 63500 (0.0008) +[2023-10-08 14:18:23,580][102897] Updated weights for policy 0, policy_version 63510 (0.0007) +[2023-10-08 14:18:23,948][102897] Updated weights for policy 0, policy_version 63520 (0.0009) +[2023-10-08 14:18:24,550][102898] Updated weights for policy 1, policy_version 63560 (0.0009) +[2023-10-08 14:18:24,917][102898] Updated weights for policy 1, policy_version 63570 (0.0008) +[2023-10-08 14:18:25,278][102898] Updated weights for policy 1, policy_version 63580 (0.0010) +[2023-10-08 14:18:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 130154496. Throughput: 0: 1788.1, 1: 1786.0. Samples: 32545898. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:26,876][101941] Avg episode reward: [(0, '8.800'), (1, '8.500')] +[2023-10-08 14:18:27,762][102897] Updated weights for policy 0, policy_version 63530 (0.0008) +[2023-10-08 14:18:28,143][102897] Updated weights for policy 0, policy_version 63540 (0.0010) +[2023-10-08 14:18:28,511][102897] Updated weights for policy 0, policy_version 63550 (0.0010) +[2023-10-08 14:18:29,042][102898] Updated weights for policy 1, policy_version 63590 (0.0010) +[2023-10-08 14:18:29,402][102898] Updated weights for policy 1, policy_version 63600 (0.0008) +[2023-10-08 14:18:29,778][102898] Updated weights for policy 1, policy_version 63610 (0.0007) +[2023-10-08 14:18:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 130220032. Throughput: 0: 1791.4, 1: 1788.9. Samples: 32568198. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:31,876][101941] Avg episode reward: [(0, '8.280'), (1, '9.230')] +[2023-10-08 14:18:32,238][102897] Updated weights for policy 0, policy_version 63560 (0.0008) +[2023-10-08 14:18:32,606][102897] Updated weights for policy 0, policy_version 63570 (0.0007) +[2023-10-08 14:18:32,967][102897] Updated weights for policy 0, policy_version 63580 (0.0007) +[2023-10-08 14:18:33,459][102898] Updated weights for policy 1, policy_version 63620 (0.0008) +[2023-10-08 14:18:33,832][102898] Updated weights for policy 1, policy_version 63630 (0.0010) +[2023-10-08 14:18:34,199][102898] Updated weights for policy 1, policy_version 63640 (0.0011) +[2023-10-08 14:18:36,704][102897] Updated weights for policy 0, policy_version 63590 (0.0008) +[2023-10-08 14:18:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 130285568. Throughput: 0: 1787.6, 1: 1792.4. Samples: 32578214. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:36,876][101941] Avg episode reward: [(0, '8.120'), (1, '9.080')] +[2023-10-08 14:18:37,067][102897] Updated weights for policy 0, policy_version 63600 (0.0010) +[2023-10-08 14:18:37,443][102897] Updated weights for policy 0, policy_version 63610 (0.0010) +[2023-10-08 14:18:38,060][102898] Updated weights for policy 1, policy_version 63650 (0.0010) +[2023-10-08 14:18:38,422][102898] Updated weights for policy 1, policy_version 63660 (0.0008) +[2023-10-08 14:18:38,782][102898] Updated weights for policy 1, policy_version 63670 (0.0011) +[2023-10-08 14:18:39,147][102898] Updated weights for policy 1, policy_version 63680 (0.0007) +[2023-10-08 14:18:41,218][102897] Updated weights for policy 0, policy_version 63620 (0.0008) +[2023-10-08 14:18:41,597][102897] Updated weights for policy 0, policy_version 63630 (0.0009) +[2023-10-08 14:18:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 130351104. Throughput: 0: 1791.0, 1: 1784.1. Samples: 32600268. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:41,876][101941] Avg episode reward: [(0, '7.700'), (1, '8.820')] +[2023-10-08 14:18:41,961][102897] Updated weights for policy 0, policy_version 63640 (0.0008) +[2023-10-08 14:18:43,038][102898] Updated weights for policy 1, policy_version 63690 (0.0007) +[2023-10-08 14:18:43,411][102898] Updated weights for policy 1, policy_version 63700 (0.0007) +[2023-10-08 14:18:43,771][102898] Updated weights for policy 1, policy_version 63710 (0.0007) +[2023-10-08 14:18:45,738][102897] Updated weights for policy 0, policy_version 63650 (0.0009) +[2023-10-08 14:18:46,105][102897] Updated weights for policy 0, policy_version 63660 (0.0008) +[2023-10-08 14:18:46,476][102897] Updated weights for policy 0, policy_version 63670 (0.0008) +[2023-10-08 14:18:46,840][102897] Updated weights for policy 0, policy_version 63680 (0.0010) +[2023-10-08 14:18:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 130449408. Throughput: 0: 1808.7, 1: 1793.3. Samples: 32622010. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:46,876][101941] Avg episode reward: [(0, '7.540'), (1, '9.820')] +[2023-10-08 14:18:47,343][102898] Updated weights for policy 1, policy_version 63720 (0.0010) +[2023-10-08 14:18:47,710][102898] Updated weights for policy 1, policy_version 63730 (0.0010) +[2023-10-08 14:18:48,063][102898] Updated weights for policy 1, policy_version 63740 (0.0008) +[2023-10-08 14:18:50,683][102897] Updated weights for policy 0, policy_version 63690 (0.0008) +[2023-10-08 14:18:51,047][102897] Updated weights for policy 0, policy_version 63700 (0.0008) +[2023-10-08 14:18:51,430][102897] Updated weights for policy 0, policy_version 63710 (0.0007) +[2023-10-08 14:18:51,818][102898] Updated weights for policy 1, policy_version 63750 (0.0010) +[2023-10-08 14:18:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 130514944. Throughput: 0: 1793.1, 1: 1790.1. Samples: 32632666. Policy #0 lag: (min: 31.0, avg: 44.9, max: 63.0) +[2023-10-08 14:18:51,876][101941] Avg episode reward: [(0, '7.260'), (1, '9.150')] +[2023-10-08 14:18:52,183][102898] Updated weights for policy 1, policy_version 63760 (0.0009) +[2023-10-08 14:18:52,547][102898] Updated weights for policy 1, policy_version 63770 (0.0007) +[2023-10-08 14:18:55,185][102897] Updated weights for policy 0, policy_version 63720 (0.0009) +[2023-10-08 14:18:55,560][102897] Updated weights for policy 0, policy_version 63730 (0.0009) +[2023-10-08 14:18:55,936][102897] Updated weights for policy 0, policy_version 63740 (0.0008) +[2023-10-08 14:18:56,375][102898] Updated weights for policy 1, policy_version 63780 (0.0009) +[2023-10-08 14:18:56,737][102898] Updated weights for policy 1, policy_version 63790 (0.0008) +[2023-10-08 14:18:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 130580480. Throughput: 0: 1802.0, 1: 1789.2. Samples: 32654304. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:18:56,876][101941] Avg episode reward: [(0, '8.260'), (1, '9.200')] +[2023-10-08 14:18:57,112][102898] Updated weights for policy 1, policy_version 63800 (0.0008) +[2023-10-08 14:18:59,674][102897] Updated weights for policy 0, policy_version 63750 (0.0008) +[2023-10-08 14:19:00,039][102897] Updated weights for policy 0, policy_version 63760 (0.0010) +[2023-10-08 14:19:00,415][102897] Updated weights for policy 0, policy_version 63770 (0.0010) +[2023-10-08 14:19:00,935][102898] Updated weights for policy 1, policy_version 63810 (0.0007) +[2023-10-08 14:19:01,304][102898] Updated weights for policy 1, policy_version 63820 (0.0010) +[2023-10-08 14:19:01,662][102898] Updated weights for policy 1, policy_version 63830 (0.0008) +[2023-10-08 14:19:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 130646016. Throughput: 0: 1779.5, 1: 1801.6. Samples: 32674826. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:01,876][101941] Avg episode reward: [(0, '8.710'), (1, '9.110')] +[2023-10-08 14:19:02,023][102898] Updated weights for policy 1, policy_version 63840 (0.0009) +[2023-10-08 14:19:04,120][102897] Updated weights for policy 0, policy_version 63780 (0.0009) +[2023-10-08 14:19:04,480][102897] Updated weights for policy 0, policy_version 63790 (0.0009) +[2023-10-08 14:19:04,854][102897] Updated weights for policy 0, policy_version 63800 (0.0009) +[2023-10-08 14:19:05,812][102898] Updated weights for policy 1, policy_version 63850 (0.0009) +[2023-10-08 14:19:06,175][102898] Updated weights for policy 1, policy_version 63860 (0.0007) +[2023-10-08 14:19:06,547][102898] Updated weights for policy 1, policy_version 63870 (0.0008) +[2023-10-08 14:19:06,875][101941] Fps is (10 sec: 16383.3, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 130744320. Throughput: 0: 1804.7, 1: 1783.9. Samples: 32686380. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:06,877][101941] Avg episode reward: [(0, '8.330'), (1, '9.190')] +[2023-10-08 14:19:08,532][102897] Updated weights for policy 0, policy_version 63810 (0.0008) +[2023-10-08 14:19:08,902][102897] Updated weights for policy 0, policy_version 63820 (0.0008) +[2023-10-08 14:19:09,262][102897] Updated weights for policy 0, policy_version 63830 (0.0008) +[2023-10-08 14:19:09,629][102897] Updated weights for policy 0, policy_version 63840 (0.0008) +[2023-10-08 14:19:10,312][102898] Updated weights for policy 1, policy_version 63880 (0.0007) +[2023-10-08 14:19:10,680][102898] Updated weights for policy 1, policy_version 63890 (0.0007) +[2023-10-08 14:19:11,045][102898] Updated weights for policy 1, policy_version 63900 (0.0008) +[2023-10-08 14:19:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14440.2). Total num frames: 130809856. Throughput: 0: 1777.7, 1: 1805.7. Samples: 32707152. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:11,875][101941] Avg episode reward: [(0, '7.470'), (1, '9.150')] +[2023-10-08 14:19:13,433][102897] Updated weights for policy 0, policy_version 63850 (0.0009) +[2023-10-08 14:19:13,818][102897] Updated weights for policy 0, policy_version 63860 (0.0010) +[2023-10-08 14:19:14,191][102897] Updated weights for policy 0, policy_version 63870 (0.0010) +[2023-10-08 14:19:14,721][102898] Updated weights for policy 1, policy_version 63910 (0.0008) +[2023-10-08 14:19:15,076][102898] Updated weights for policy 1, policy_version 63920 (0.0010) +[2023-10-08 14:19:15,447][102898] Updated weights for policy 1, policy_version 63930 (0.0010) +[2023-10-08 14:19:16,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 130875392. Throughput: 0: 1784.4, 1: 1786.4. Samples: 32728882. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:16,876][101941] Avg episode reward: [(0, '7.890'), (1, '8.760')] +[2023-10-08 14:19:17,953][102897] Updated weights for policy 0, policy_version 63880 (0.0008) +[2023-10-08 14:19:18,330][102897] Updated weights for policy 0, policy_version 63890 (0.0008) +[2023-10-08 14:19:18,703][102897] Updated weights for policy 0, policy_version 63900 (0.0009) +[2023-10-08 14:19:19,138][102898] Updated weights for policy 1, policy_version 63940 (0.0008) +[2023-10-08 14:19:19,498][102898] Updated weights for policy 1, policy_version 63950 (0.0009) +[2023-10-08 14:19:19,864][102898] Updated weights for policy 1, policy_version 63960 (0.0008) +[2023-10-08 14:19:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 130940928. Throughput: 0: 1785.9, 1: 1800.6. Samples: 32739608. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:21,875][101941] Avg episode reward: [(0, '8.090'), (1, '8.360')] +[2023-10-08 14:19:22,457][102897] Updated weights for policy 0, policy_version 63910 (0.0009) +[2023-10-08 14:19:22,837][102897] Updated weights for policy 0, policy_version 63920 (0.0008) +[2023-10-08 14:19:23,215][102897] Updated weights for policy 0, policy_version 63930 (0.0007) +[2023-10-08 14:19:23,706][102898] Updated weights for policy 1, policy_version 63970 (0.0007) +[2023-10-08 14:19:24,066][102898] Updated weights for policy 1, policy_version 63980 (0.0007) +[2023-10-08 14:19:24,437][102898] Updated weights for policy 1, policy_version 63990 (0.0008) +[2023-10-08 14:19:24,794][102898] Updated weights for policy 1, policy_version 64000 (0.0009) +[2023-10-08 14:19:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131006464. Throughput: 0: 1790.8, 1: 1785.4. Samples: 32761198. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:26,876][101941] Avg episode reward: [(0, '7.580'), (1, '8.420')] +[2023-10-08 14:19:26,933][102897] Updated weights for policy 0, policy_version 63940 (0.0008) +[2023-10-08 14:19:27,310][102897] Updated weights for policy 0, policy_version 63950 (0.0009) +[2023-10-08 14:19:27,675][102897] Updated weights for policy 0, policy_version 63960 (0.0008) +[2023-10-08 14:19:28,451][102898] Updated weights for policy 1, policy_version 64010 (0.0008) +[2023-10-08 14:19:28,821][102898] Updated weights for policy 1, policy_version 64020 (0.0009) +[2023-10-08 14:19:29,189][102898] Updated weights for policy 1, policy_version 64030 (0.0007) +[2023-10-08 14:19:31,445][102897] Updated weights for policy 0, policy_version 63970 (0.0008) +[2023-10-08 14:19:31,809][102897] Updated weights for policy 0, policy_version 63980 (0.0009) +[2023-10-08 14:19:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131072000. Throughput: 0: 1808.0, 1: 1789.3. Samples: 32783890. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:31,876][101941] Avg episode reward: [(0, '7.940'), (1, '7.850')] +[2023-10-08 14:19:32,186][102897] Updated weights for policy 0, policy_version 63990 (0.0008) +[2023-10-08 14:19:32,548][102897] Updated weights for policy 0, policy_version 64000 (0.0008) +[2023-10-08 14:19:32,883][102898] Updated weights for policy 1, policy_version 64040 (0.0009) +[2023-10-08 14:19:33,249][102898] Updated weights for policy 1, policy_version 64050 (0.0009) +[2023-10-08 14:19:33,616][102898] Updated weights for policy 1, policy_version 64060 (0.0009) +[2023-10-08 14:19:36,215][102897] Updated weights for policy 0, policy_version 64010 (0.0008) +[2023-10-08 14:19:36,589][102897] Updated weights for policy 0, policy_version 64020 (0.0007) +[2023-10-08 14:19:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131137536. Throughput: 0: 1788.9, 1: 1790.6. Samples: 32793746. Policy #0 lag: (min: 21.0, avg: 22.9, max: 52.0) +[2023-10-08 14:19:36,876][101941] Avg episode reward: [(0, '8.430'), (1, '7.890')] +[2023-10-08 14:19:36,958][102897] Updated weights for policy 0, policy_version 64030 (0.0007) +[2023-10-08 14:19:37,361][102898] Updated weights for policy 1, policy_version 64070 (0.0008) +[2023-10-08 14:19:37,739][102898] Updated weights for policy 1, policy_version 64080 (0.0009) +[2023-10-08 14:19:38,101][102898] Updated weights for policy 1, policy_version 64090 (0.0010) +[2023-10-08 14:19:40,879][102897] Updated weights for policy 0, policy_version 64040 (0.0010) +[2023-10-08 14:19:41,250][102897] Updated weights for policy 0, policy_version 64050 (0.0008) +[2023-10-08 14:19:41,626][102897] Updated weights for policy 0, policy_version 64060 (0.0010) +[2023-10-08 14:19:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 131235840. Throughput: 0: 1802.6, 1: 1800.2. Samples: 32816432. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:19:41,876][101941] Avg episode reward: [(0, '8.350'), (1, '8.710')] +[2023-10-08 14:19:41,910][102898] Updated weights for policy 1, policy_version 64100 (0.0008) +[2023-10-08 14:19:42,276][102898] Updated weights for policy 1, policy_version 64110 (0.0007) +[2023-10-08 14:19:42,643][102898] Updated weights for policy 1, policy_version 64120 (0.0007) +[2023-10-08 14:19:45,298][102897] Updated weights for policy 0, policy_version 64070 (0.0009) +[2023-10-08 14:19:45,678][102897] Updated weights for policy 0, policy_version 64080 (0.0009) +[2023-10-08 14:19:46,041][102897] Updated weights for policy 0, policy_version 64090 (0.0008) +[2023-10-08 14:19:46,445][102898] Updated weights for policy 1, policy_version 64130 (0.0008) +[2023-10-08 14:19:46,816][102898] Updated weights for policy 1, policy_version 64140 (0.0008) +[2023-10-08 14:19:46,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 131301376. Throughput: 0: 1793.6, 1: 1812.4. Samples: 32837098. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:19:46,875][101941] Avg episode reward: [(0, '8.300'), (1, '8.310')] +[2023-10-08 14:19:47,179][102898] Updated weights for policy 1, policy_version 64150 (0.0009) +[2023-10-08 14:19:47,542][102898] Updated weights for policy 1, policy_version 64160 (0.0007) +[2023-10-08 14:19:49,866][102897] Updated weights for policy 0, policy_version 64100 (0.0007) +[2023-10-08 14:19:50,245][102897] Updated weights for policy 0, policy_version 64110 (0.0009) +[2023-10-08 14:19:50,608][102897] Updated weights for policy 0, policy_version 64120 (0.0008) +[2023-10-08 14:19:51,503][102898] Updated weights for policy 1, policy_version 64170 (0.0008) +[2023-10-08 14:19:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 131366912. Throughput: 0: 1803.7, 1: 1796.4. Samples: 32848384. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:19:51,876][101941] Avg episode reward: [(0, '7.920'), (1, '8.330')] +[2023-10-08 14:19:51,881][102898] Updated weights for policy 1, policy_version 64180 (0.0008) +[2023-10-08 14:19:52,250][102898] Updated weights for policy 1, policy_version 64190 (0.0008) +[2023-10-08 14:19:54,440][102897] Updated weights for policy 0, policy_version 64130 (0.0007) +[2023-10-08 14:19:54,808][102897] Updated weights for policy 0, policy_version 64140 (0.0009) +[2023-10-08 14:19:55,177][102897] Updated weights for policy 0, policy_version 64150 (0.0008) +[2023-10-08 14:19:55,547][102897] Updated weights for policy 0, policy_version 64160 (0.0009) +[2023-10-08 14:19:55,915][102898] Updated weights for policy 1, policy_version 64200 (0.0008) +[2023-10-08 14:19:56,285][102898] Updated weights for policy 1, policy_version 64210 (0.0007) +[2023-10-08 14:19:56,661][102898] Updated weights for policy 1, policy_version 64220 (0.0008) +[2023-10-08 14:19:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 131465216. Throughput: 0: 1795.6, 1: 1809.2. Samples: 32869368. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:19:56,876][101941] Avg episode reward: [(0, '8.190'), (1, '8.790')] +[2023-10-08 14:19:59,146][102897] Updated weights for policy 0, policy_version 64170 (0.0008) +[2023-10-08 14:19:59,523][102897] Updated weights for policy 0, policy_version 64180 (0.0009) +[2023-10-08 14:19:59,893][102897] Updated weights for policy 0, policy_version 64190 (0.0009) +[2023-10-08 14:20:00,394][102898] Updated weights for policy 1, policy_version 64230 (0.0010) +[2023-10-08 14:20:00,764][102898] Updated weights for policy 1, policy_version 64240 (0.0010) +[2023-10-08 14:20:01,136][102898] Updated weights for policy 1, policy_version 64250 (0.0008) +[2023-10-08 14:20:01,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 131530752. Throughput: 0: 1791.9, 1: 1792.6. Samples: 32890184. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:20:01,875][101941] Avg episode reward: [(0, '8.500'), (1, '9.110')] +[2023-10-08 14:20:03,522][102897] Updated weights for policy 0, policy_version 64200 (0.0007) +[2023-10-08 14:20:03,897][102897] Updated weights for policy 0, policy_version 64210 (0.0007) +[2023-10-08 14:20:04,258][102897] Updated weights for policy 0, policy_version 64220 (0.0007) +[2023-10-08 14:20:04,873][102898] Updated weights for policy 1, policy_version 64260 (0.0009) +[2023-10-08 14:20:05,236][102898] Updated weights for policy 1, policy_version 64270 (0.0007) +[2023-10-08 14:20:05,605][102898] Updated weights for policy 1, policy_version 64280 (0.0008) +[2023-10-08 14:20:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.6, 300 sec: 14329.1). Total num frames: 131596288. Throughput: 0: 1790.3, 1: 1811.3. Samples: 32901680. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:20:06,875][101941] Avg episode reward: [(0, '8.110'), (1, '8.650')] +[2023-10-08 14:20:08,183][102897] Updated weights for policy 0, policy_version 64230 (0.0007) +[2023-10-08 14:20:08,551][102897] Updated weights for policy 0, policy_version 64240 (0.0008) +[2023-10-08 14:20:08,919][102897] Updated weights for policy 0, policy_version 64250 (0.0008) +[2023-10-08 14:20:09,289][102898] Updated weights for policy 1, policy_version 64290 (0.0009) +[2023-10-08 14:20:09,655][102898] Updated weights for policy 1, policy_version 64300 (0.0007) +[2023-10-08 14:20:10,015][102898] Updated weights for policy 1, policy_version 64310 (0.0009) +[2023-10-08 14:20:10,383][102898] Updated weights for policy 1, policy_version 64320 (0.0011) +[2023-10-08 14:20:11,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 131661824. Throughput: 0: 1783.8, 1: 1798.4. Samples: 32922398. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:20:11,876][101941] Avg episode reward: [(0, '9.040'), (1, '7.930')] +[2023-10-08 14:20:12,663][102897] Updated weights for policy 0, policy_version 64260 (0.0007) +[2023-10-08 14:20:13,032][102897] Updated weights for policy 0, policy_version 64270 (0.0011) +[2023-10-08 14:20:13,405][102897] Updated weights for policy 0, policy_version 64280 (0.0010) +[2023-10-08 14:20:14,264][102898] Updated weights for policy 1, policy_version 64330 (0.0011) +[2023-10-08 14:20:14,626][102898] Updated weights for policy 1, policy_version 64340 (0.0009) +[2023-10-08 14:20:15,006][102898] Updated weights for policy 1, policy_version 64350 (0.0009) +[2023-10-08 14:20:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131727360. Throughput: 0: 1780.8, 1: 1793.6. Samples: 32944736. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 14:20:16,875][101941] Avg episode reward: [(0, '9.080'), (1, '8.370')] +[2023-10-08 14:20:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000064288_65830912.pth... +[2023-10-08 14:20:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000064352_65896448.pth... +[2023-10-08 14:20:16,913][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000062624_64126976.pth +[2023-10-08 14:20:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000062688_64192512.pth +[2023-10-08 14:20:17,361][102897] Updated weights for policy 0, policy_version 64290 (0.0009) +[2023-10-08 14:20:17,732][102897] Updated weights for policy 0, policy_version 64300 (0.0007) +[2023-10-08 14:20:18,101][102897] Updated weights for policy 0, policy_version 64310 (0.0008) +[2023-10-08 14:20:18,470][102897] Updated weights for policy 0, policy_version 64320 (0.0007) +[2023-10-08 14:20:18,753][102898] Updated weights for policy 1, policy_version 64360 (0.0008) +[2023-10-08 14:20:19,111][102898] Updated weights for policy 1, policy_version 64370 (0.0008) +[2023-10-08 14:20:19,477][102898] Updated weights for policy 1, policy_version 64380 (0.0010) +[2023-10-08 14:20:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131792896. Throughput: 0: 1781.0, 1: 1799.8. Samples: 32954884. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:21,875][101941] Avg episode reward: [(0, '8.260'), (1, '8.360')] +[2023-10-08 14:20:22,217][102897] Updated weights for policy 0, policy_version 64330 (0.0007) +[2023-10-08 14:20:22,595][102897] Updated weights for policy 0, policy_version 64340 (0.0008) +[2023-10-08 14:20:22,963][102897] Updated weights for policy 0, policy_version 64350 (0.0007) +[2023-10-08 14:20:23,065][102898] Updated weights for policy 1, policy_version 64390 (0.0009) +[2023-10-08 14:20:23,430][102898] Updated weights for policy 1, policy_version 64400 (0.0007) +[2023-10-08 14:20:23,791][102898] Updated weights for policy 1, policy_version 64410 (0.0009) +[2023-10-08 14:20:26,668][102897] Updated weights for policy 0, policy_version 64360 (0.0007) +[2023-10-08 14:20:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131858432. Throughput: 0: 1786.4, 1: 1789.2. Samples: 32977334. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:26,875][101941] Avg episode reward: [(0, '7.570'), (1, '8.110')] +[2023-10-08 14:20:27,037][102897] Updated weights for policy 0, policy_version 64370 (0.0009) +[2023-10-08 14:20:27,415][102897] Updated weights for policy 0, policy_version 64380 (0.0010) +[2023-10-08 14:20:27,486][102898] Updated weights for policy 1, policy_version 64420 (0.0008) +[2023-10-08 14:20:27,859][102898] Updated weights for policy 1, policy_version 64430 (0.0007) +[2023-10-08 14:20:28,216][102898] Updated weights for policy 1, policy_version 64440 (0.0008) +[2023-10-08 14:20:31,064][102897] Updated weights for policy 0, policy_version 64390 (0.0007) +[2023-10-08 14:20:31,444][102897] Updated weights for policy 0, policy_version 64400 (0.0009) +[2023-10-08 14:20:31,825][102897] Updated weights for policy 0, policy_version 64410 (0.0009) +[2023-10-08 14:20:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 131923968. Throughput: 0: 1808.2, 1: 1790.8. Samples: 32999052. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:31,876][101941] Avg episode reward: [(0, '7.630'), (1, '9.030')] +[2023-10-08 14:20:32,032][102898] Updated weights for policy 1, policy_version 64450 (0.0008) +[2023-10-08 14:20:32,388][102898] Updated weights for policy 1, policy_version 64460 (0.0010) +[2023-10-08 14:20:32,767][102898] Updated weights for policy 1, policy_version 64470 (0.0007) +[2023-10-08 14:20:33,125][102898] Updated weights for policy 1, policy_version 64480 (0.0007) +[2023-10-08 14:20:35,632][102897] Updated weights for policy 0, policy_version 64420 (0.0008) +[2023-10-08 14:20:36,010][102897] Updated weights for policy 0, policy_version 64430 (0.0008) +[2023-10-08 14:20:36,378][102897] Updated weights for policy 0, policy_version 64440 (0.0009) +[2023-10-08 14:20:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 132022272. Throughput: 0: 1788.0, 1: 1791.6. Samples: 33009466. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:36,875][101941] Avg episode reward: [(0, '8.020'), (1, '9.540')] +[2023-10-08 14:20:36,943][102898] Updated weights for policy 1, policy_version 64490 (0.0008) +[2023-10-08 14:20:37,326][102898] Updated weights for policy 1, policy_version 64500 (0.0009) +[2023-10-08 14:20:37,683][102898] Updated weights for policy 1, policy_version 64510 (0.0008) +[2023-10-08 14:20:40,137][102897] Updated weights for policy 0, policy_version 64450 (0.0009) +[2023-10-08 14:20:40,508][102897] Updated weights for policy 0, policy_version 64460 (0.0008) +[2023-10-08 14:20:40,873][102897] Updated weights for policy 0, policy_version 64470 (0.0007) +[2023-10-08 14:20:41,246][102897] Updated weights for policy 0, policy_version 64480 (0.0007) +[2023-10-08 14:20:41,405][102898] Updated weights for policy 1, policy_version 64520 (0.0007) +[2023-10-08 14:20:41,768][102898] Updated weights for policy 1, policy_version 64530 (0.0008) +[2023-10-08 14:20:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 132087808. Throughput: 0: 1805.3, 1: 1788.8. Samples: 33031102. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:41,876][101941] Avg episode reward: [(0, '7.880'), (1, '9.720')] +[2023-10-08 14:20:42,133][102898] Updated weights for policy 1, policy_version 64540 (0.0007) +[2023-10-08 14:20:45,111][102897] Updated weights for policy 0, policy_version 64490 (0.0008) +[2023-10-08 14:20:45,475][102897] Updated weights for policy 0, policy_version 64500 (0.0008) +[2023-10-08 14:20:45,841][102897] Updated weights for policy 0, policy_version 64510 (0.0009) +[2023-10-08 14:20:46,008][102898] Updated weights for policy 1, policy_version 64550 (0.0008) +[2023-10-08 14:20:46,380][102898] Updated weights for policy 1, policy_version 64560 (0.0009) +[2023-10-08 14:20:46,744][102898] Updated weights for policy 1, policy_version 64570 (0.0007) +[2023-10-08 14:20:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 132153344. Throughput: 0: 1781.4, 1: 1804.2. Samples: 33051536. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:46,876][101941] Avg episode reward: [(0, '8.050'), (1, '9.900')] +[2023-10-08 14:20:49,603][102897] Updated weights for policy 0, policy_version 64520 (0.0008) +[2023-10-08 14:20:49,981][102897] Updated weights for policy 0, policy_version 64530 (0.0011) +[2023-10-08 14:20:50,348][102897] Updated weights for policy 0, policy_version 64540 (0.0011) +[2023-10-08 14:20:50,592][102898] Updated weights for policy 1, policy_version 64580 (0.0009) +[2023-10-08 14:20:50,966][102898] Updated weights for policy 1, policy_version 64590 (0.0009) +[2023-10-08 14:20:51,329][102898] Updated weights for policy 1, policy_version 64600 (0.0008) +[2023-10-08 14:20:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 132251648. Throughput: 0: 1811.7, 1: 1779.9. Samples: 33063300. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:51,875][101941] Avg episode reward: [(0, '8.500'), (1, '8.560')] +[2023-10-08 14:20:53,823][102897] Updated weights for policy 0, policy_version 64550 (0.0009) +[2023-10-08 14:20:54,197][102897] Updated weights for policy 0, policy_version 64560 (0.0009) +[2023-10-08 14:20:54,570][102897] Updated weights for policy 0, policy_version 64570 (0.0007) +[2023-10-08 14:20:54,957][102898] Updated weights for policy 1, policy_version 64610 (0.0007) +[2023-10-08 14:20:55,322][102898] Updated weights for policy 1, policy_version 64620 (0.0009) +[2023-10-08 14:20:55,692][102898] Updated weights for policy 1, policy_version 64630 (0.0011) +[2023-10-08 14:20:56,061][102898] Updated weights for policy 1, policy_version 64640 (0.0009) +[2023-10-08 14:20:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 132317184. Throughput: 0: 1789.5, 1: 1804.3. Samples: 33084118. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 14:20:56,875][101941] Avg episode reward: [(0, '9.020'), (1, '8.700')] +[2023-10-08 14:20:58,399][102897] Updated weights for policy 0, policy_version 64580 (0.0007) +[2023-10-08 14:20:58,781][102897] Updated weights for policy 0, policy_version 64590 (0.0007) +[2023-10-08 14:20:59,147][102897] Updated weights for policy 0, policy_version 64600 (0.0007) +[2023-10-08 14:20:59,963][102898] Updated weights for policy 1, policy_version 64650 (0.0007) +[2023-10-08 14:21:00,336][102898] Updated weights for policy 1, policy_version 64660 (0.0008) +[2023-10-08 14:21:00,709][102898] Updated weights for policy 1, policy_version 64670 (0.0008) +[2023-10-08 14:21:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 132382720. Throughput: 0: 1790.5, 1: 1784.0. Samples: 33105590. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:01,876][101941] Avg episode reward: [(0, '9.350'), (1, '8.940')] +[2023-10-08 14:21:02,945][102897] Updated weights for policy 0, policy_version 64610 (0.0007) +[2023-10-08 14:21:03,324][102897] Updated weights for policy 0, policy_version 64620 (0.0007) +[2023-10-08 14:21:03,697][102897] Updated weights for policy 0, policy_version 64630 (0.0007) +[2023-10-08 14:21:04,071][102897] Updated weights for policy 0, policy_version 64640 (0.0008) +[2023-10-08 14:21:04,241][102898] Updated weights for policy 1, policy_version 64680 (0.0009) +[2023-10-08 14:21:04,615][102898] Updated weights for policy 1, policy_version 64690 (0.0009) +[2023-10-08 14:21:04,975][102898] Updated weights for policy 1, policy_version 64700 (0.0008) +[2023-10-08 14:21:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 132448256. Throughput: 0: 1788.9, 1: 1798.3. Samples: 33116310. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:06,876][101941] Avg episode reward: [(0, '8.960'), (1, '8.780')] +[2023-10-08 14:21:07,857][102897] Updated weights for policy 0, policy_version 64650 (0.0007) +[2023-10-08 14:21:08,228][102897] Updated weights for policy 0, policy_version 64660 (0.0007) +[2023-10-08 14:21:08,597][102897] Updated weights for policy 0, policy_version 64670 (0.0007) +[2023-10-08 14:21:08,742][102898] Updated weights for policy 1, policy_version 64710 (0.0008) +[2023-10-08 14:21:09,118][102898] Updated weights for policy 1, policy_version 64720 (0.0009) +[2023-10-08 14:21:09,485][102898] Updated weights for policy 1, policy_version 64730 (0.0008) +[2023-10-08 14:21:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 132513792. Throughput: 0: 1787.2, 1: 1783.1. Samples: 33137996. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:11,876][101941] Avg episode reward: [(0, '8.220'), (1, '8.170')] +[2023-10-08 14:21:12,334][102897] Updated weights for policy 0, policy_version 64680 (0.0008) +[2023-10-08 14:21:12,700][102897] Updated weights for policy 0, policy_version 64690 (0.0009) +[2023-10-08 14:21:13,076][102897] Updated weights for policy 0, policy_version 64700 (0.0007) +[2023-10-08 14:21:13,302][102898] Updated weights for policy 1, policy_version 64740 (0.0008) +[2023-10-08 14:21:13,666][102898] Updated weights for policy 1, policy_version 64750 (0.0010) +[2023-10-08 14:21:14,029][102898] Updated weights for policy 1, policy_version 64760 (0.0011) +[2023-10-08 14:21:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 132579328. Throughput: 0: 1793.6, 1: 1795.6. Samples: 33160566. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:16,876][101941] Avg episode reward: [(0, '7.560'), (1, '8.370')] +[2023-10-08 14:21:16,909][102897] Updated weights for policy 0, policy_version 64710 (0.0008) +[2023-10-08 14:21:17,282][102897] Updated weights for policy 0, policy_version 64720 (0.0008) +[2023-10-08 14:21:17,653][102897] Updated weights for policy 0, policy_version 64730 (0.0007) +[2023-10-08 14:21:17,720][102898] Updated weights for policy 1, policy_version 64770 (0.0009) +[2023-10-08 14:21:18,092][102898] Updated weights for policy 1, policy_version 64780 (0.0007) +[2023-10-08 14:21:18,461][102898] Updated weights for policy 1, policy_version 64790 (0.0010) +[2023-10-08 14:21:18,821][102898] Updated weights for policy 1, policy_version 64800 (0.0007) +[2023-10-08 14:21:21,404][102897] Updated weights for policy 0, policy_version 64740 (0.0007) +[2023-10-08 14:21:21,769][102897] Updated weights for policy 0, policy_version 64750 (0.0009) +[2023-10-08 14:21:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 132644864. Throughput: 0: 1778.5, 1: 1796.7. Samples: 33170352. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:21,876][101941] Avg episode reward: [(0, '8.190'), (1, '7.850')] +[2023-10-08 14:21:22,137][102897] Updated weights for policy 0, policy_version 64760 (0.0008) +[2023-10-08 14:21:22,475][102898] Updated weights for policy 1, policy_version 64810 (0.0010) +[2023-10-08 14:21:22,828][102898] Updated weights for policy 1, policy_version 64820 (0.0008) +[2023-10-08 14:21:23,208][102898] Updated weights for policy 1, policy_version 64830 (0.0008) +[2023-10-08 14:21:25,845][102897] Updated weights for policy 0, policy_version 64770 (0.0008) +[2023-10-08 14:21:26,221][102897] Updated weights for policy 0, policy_version 64780 (0.0007) +[2023-10-08 14:21:26,589][102897] Updated weights for policy 0, policy_version 64790 (0.0007) +[2023-10-08 14:21:26,873][102898] Updated weights for policy 1, policy_version 64840 (0.0007) +[2023-10-08 14:21:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 132710400. Throughput: 0: 1794.9, 1: 1799.9. Samples: 33192868. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:26,875][101941] Avg episode reward: [(0, '8.500'), (1, '8.240')] +[2023-10-08 14:21:26,961][102897] Updated weights for policy 0, policy_version 64800 (0.0007) +[2023-10-08 14:21:27,234][102898] Updated weights for policy 1, policy_version 64850 (0.0009) +[2023-10-08 14:21:27,603][102898] Updated weights for policy 1, policy_version 64860 (0.0007) +[2023-10-08 14:21:30,871][102897] Updated weights for policy 0, policy_version 64810 (0.0008) +[2023-10-08 14:21:31,258][102897] Updated weights for policy 0, policy_version 64820 (0.0007) +[2023-10-08 14:21:31,387][102898] Updated weights for policy 1, policy_version 64870 (0.0008) +[2023-10-08 14:21:31,622][102897] Updated weights for policy 0, policy_version 64830 (0.0007) +[2023-10-08 14:21:31,748][102898] Updated weights for policy 1, policy_version 64880 (0.0009) +[2023-10-08 14:21:31,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 132808704. Throughput: 0: 1791.3, 1: 1807.9. Samples: 33213502. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:31,875][101941] Avg episode reward: [(0, '9.040'), (1, '8.550')] +[2023-10-08 14:21:32,110][102898] Updated weights for policy 1, policy_version 64890 (0.0010) +[2023-10-08 14:21:35,296][102897] Updated weights for policy 0, policy_version 64840 (0.0009) +[2023-10-08 14:21:35,671][102897] Updated weights for policy 0, policy_version 64850 (0.0009) +[2023-10-08 14:21:35,862][102898] Updated weights for policy 1, policy_version 64900 (0.0008) +[2023-10-08 14:21:36,048][102897] Updated weights for policy 0, policy_version 64860 (0.0010) +[2023-10-08 14:21:36,235][102898] Updated weights for policy 1, policy_version 64910 (0.0009) +[2023-10-08 14:21:36,602][102898] Updated weights for policy 1, policy_version 64920 (0.0008) +[2023-10-08 14:21:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 132874240. Throughput: 0: 1785.5, 1: 1803.9. Samples: 33224820. Policy #0 lag: (min: 26.0, avg: 28.7, max: 55.0) +[2023-10-08 14:21:36,876][101941] Avg episode reward: [(0, '8.100'), (1, '9.690')] +[2023-10-08 14:21:39,929][102897] Updated weights for policy 0, policy_version 64870 (0.0007) +[2023-10-08 14:21:40,311][102897] Updated weights for policy 0, policy_version 64880 (0.0008) +[2023-10-08 14:21:40,591][102898] Updated weights for policy 1, policy_version 64930 (0.0008) +[2023-10-08 14:21:40,686][102897] Updated weights for policy 0, policy_version 64890 (0.0008) +[2023-10-08 14:21:40,961][102898] Updated weights for policy 1, policy_version 64940 (0.0009) +[2023-10-08 14:21:41,329][102898] Updated weights for policy 1, policy_version 64950 (0.0009) +[2023-10-08 14:21:41,690][102898] Updated weights for policy 1, policy_version 64960 (0.0008) +[2023-10-08 14:21:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 132972544. Throughput: 0: 1785.3, 1: 1813.1. Samples: 33246046. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:21:41,876][101941] Avg episode reward: [(0, '8.190'), (1, '8.920')] +[2023-10-08 14:21:44,536][102897] Updated weights for policy 0, policy_version 64900 (0.0009) +[2023-10-08 14:21:44,909][102897] Updated weights for policy 0, policy_version 64910 (0.0009) +[2023-10-08 14:21:45,275][102897] Updated weights for policy 0, policy_version 64920 (0.0008) +[2023-10-08 14:21:45,438][102898] Updated weights for policy 1, policy_version 64970 (0.0008) +[2023-10-08 14:21:45,807][102898] Updated weights for policy 1, policy_version 64980 (0.0009) +[2023-10-08 14:21:46,183][102898] Updated weights for policy 1, policy_version 64990 (0.0009) +[2023-10-08 14:21:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 133038080. Throughput: 0: 1767.1, 1: 1800.0. Samples: 33266108. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:21:46,876][101941] Avg episode reward: [(0, '7.960'), (1, '8.740')] +[2023-10-08 14:21:49,174][102897] Updated weights for policy 0, policy_version 64930 (0.0010) +[2023-10-08 14:21:49,548][102897] Updated weights for policy 0, policy_version 64940 (0.0008) +[2023-10-08 14:21:49,929][102897] Updated weights for policy 0, policy_version 64950 (0.0007) +[2023-10-08 14:21:49,940][102898] Updated weights for policy 1, policy_version 65000 (0.0007) +[2023-10-08 14:21:50,295][102897] Updated weights for policy 0, policy_version 64960 (0.0008) +[2023-10-08 14:21:50,304][102898] Updated weights for policy 1, policy_version 65010 (0.0007) +[2023-10-08 14:21:50,662][102898] Updated weights for policy 1, policy_version 65020 (0.0007) +[2023-10-08 14:21:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 133103616. Throughput: 0: 1788.5, 1: 1812.5. Samples: 33278354. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:21:51,876][101941] Avg episode reward: [(0, '7.440'), (1, '8.470')] +[2023-10-08 14:21:54,133][102897] Updated weights for policy 0, policy_version 64970 (0.0007) +[2023-10-08 14:21:54,376][102898] Updated weights for policy 1, policy_version 65030 (0.0008) +[2023-10-08 14:21:54,505][102897] Updated weights for policy 0, policy_version 64980 (0.0007) +[2023-10-08 14:21:54,739][102898] Updated weights for policy 1, policy_version 65040 (0.0009) +[2023-10-08 14:21:54,870][102897] Updated weights for policy 0, policy_version 64990 (0.0007) +[2023-10-08 14:21:55,109][102898] Updated weights for policy 1, policy_version 65050 (0.0009) +[2023-10-08 14:21:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 133169152. Throughput: 0: 1760.1, 1: 1798.6. Samples: 33298138. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:21:56,876][101941] Avg episode reward: [(0, '8.330'), (1, '8.330')] +[2023-10-08 14:21:58,579][102897] Updated weights for policy 0, policy_version 65000 (0.0007) +[2023-10-08 14:21:58,695][102898] Updated weights for policy 1, policy_version 65060 (0.0008) +[2023-10-08 14:21:58,948][102897] Updated weights for policy 0, policy_version 65010 (0.0007) +[2023-10-08 14:21:59,059][102898] Updated weights for policy 1, policy_version 65070 (0.0008) +[2023-10-08 14:21:59,313][102897] Updated weights for policy 0, policy_version 65020 (0.0007) +[2023-10-08 14:21:59,421][102898] Updated weights for policy 1, policy_version 65080 (0.0007) +[2023-10-08 14:22:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 133234688. Throughput: 0: 1762.7, 1: 1793.5. Samples: 33320594. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:22:01,875][101941] Avg episode reward: [(0, '8.430'), (1, '8.500')] +[2023-10-08 14:22:03,087][102897] Updated weights for policy 0, policy_version 65030 (0.0007) +[2023-10-08 14:22:03,104][102898] Updated weights for policy 1, policy_version 65090 (0.0007) +[2023-10-08 14:22:03,456][102897] Updated weights for policy 0, policy_version 65040 (0.0007) +[2023-10-08 14:22:03,467][102898] Updated weights for policy 1, policy_version 65100 (0.0007) +[2023-10-08 14:22:03,828][102897] Updated weights for policy 0, policy_version 65050 (0.0007) +[2023-10-08 14:22:03,838][102898] Updated weights for policy 1, policy_version 65110 (0.0008) +[2023-10-08 14:22:04,213][102898] Updated weights for policy 1, policy_version 65120 (0.0010) +[2023-10-08 14:22:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 133300224. Throughput: 0: 1760.9, 1: 1793.9. Samples: 33330318. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:22:06,876][101941] Avg episode reward: [(0, '8.730'), (1, '8.870')] +[2023-10-08 14:22:07,547][102897] Updated weights for policy 0, policy_version 65060 (0.0007) +[2023-10-08 14:22:07,880][102898] Updated weights for policy 1, policy_version 65130 (0.0007) +[2023-10-08 14:22:07,917][102897] Updated weights for policy 0, policy_version 65070 (0.0007) +[2023-10-08 14:22:08,244][102898] Updated weights for policy 1, policy_version 65140 (0.0007) +[2023-10-08 14:22:08,294][102897] Updated weights for policy 0, policy_version 65080 (0.0009) +[2023-10-08 14:22:08,603][102898] Updated weights for policy 1, policy_version 65150 (0.0007) +[2023-10-08 14:22:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 133365760. Throughput: 0: 1757.8, 1: 1791.7. Samples: 33352596. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:22:11,875][101941] Avg episode reward: [(0, '8.350'), (1, '8.230')] +[2023-10-08 14:22:12,099][102897] Updated weights for policy 0, policy_version 65090 (0.0008) +[2023-10-08 14:22:12,373][102898] Updated weights for policy 1, policy_version 65160 (0.0008) +[2023-10-08 14:22:12,471][102897] Updated weights for policy 0, policy_version 65100 (0.0007) +[2023-10-08 14:22:12,742][102898] Updated weights for policy 1, policy_version 65170 (0.0007) +[2023-10-08 14:22:12,839][102897] Updated weights for policy 0, policy_version 65110 (0.0007) +[2023-10-08 14:22:13,096][102898] Updated weights for policy 1, policy_version 65180 (0.0008) +[2023-10-08 14:22:13,204][102897] Updated weights for policy 0, policy_version 65120 (0.0007) +[2023-10-08 14:22:16,865][102898] Updated weights for policy 1, policy_version 65190 (0.0009) +[2023-10-08 14:22:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 133431296. Throughput: 0: 1787.0, 1: 1801.2. Samples: 33374974. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:22:16,876][101941] Avg episode reward: [(0, '7.940'), (1, '8.150')] +[2023-10-08 14:22:17,077][102897] Updated weights for policy 0, policy_version 65130 (0.0007) +[2023-10-08 14:22:17,230][102898] Updated weights for policy 1, policy_version 65200 (0.0007) +[2023-10-08 14:22:17,454][102897] Updated weights for policy 0, policy_version 65140 (0.0008) +[2023-10-08 14:22:17,591][102898] Updated weights for policy 1, policy_version 65210 (0.0008) +[2023-10-08 14:22:17,809][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000065216_66781184.pth... +[2023-10-08 14:22:17,825][102897] Updated weights for policy 0, policy_version 65150 (0.0009) +[2023-10-08 14:22:17,841][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000063520_65044480.pth +[2023-10-08 14:22:17,891][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000065152_66715648.pth... +[2023-10-08 14:22:17,931][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000063456_64978944.pth +[2023-10-08 14:22:21,562][102898] Updated weights for policy 1, policy_version 65220 (0.0009) +[2023-10-08 14:22:21,662][102897] Updated weights for policy 0, policy_version 65160 (0.0009) +[2023-10-08 14:22:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 133496832. Throughput: 0: 1756.5, 1: 1789.4. Samples: 33384386. Policy #0 lag: (min: 26.0, avg: 27.4, max: 52.0) +[2023-10-08 14:22:21,876][101941] Avg episode reward: [(0, '8.230'), (1, '8.900')] +[2023-10-08 14:22:21,927][102898] Updated weights for policy 1, policy_version 65230 (0.0008) +[2023-10-08 14:22:22,025][102897] Updated weights for policy 0, policy_version 65170 (0.0008) +[2023-10-08 14:22:22,291][102898] Updated weights for policy 1, policy_version 65240 (0.0007) +[2023-10-08 14:22:22,397][102897] Updated weights for policy 0, policy_version 65180 (0.0008) +[2023-10-08 14:22:25,964][102898] Updated weights for policy 1, policy_version 65250 (0.0008) +[2023-10-08 14:22:26,180][102897] Updated weights for policy 0, policy_version 65190 (0.0008) +[2023-10-08 14:22:26,332][102898] Updated weights for policy 1, policy_version 65260 (0.0008) +[2023-10-08 14:22:26,556][102897] Updated weights for policy 0, policy_version 65200 (0.0007) +[2023-10-08 14:22:26,698][102898] Updated weights for policy 1, policy_version 65270 (0.0009) +[2023-10-08 14:22:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 133562368. Throughput: 0: 1780.8, 1: 1786.4. Samples: 33406568. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:26,876][101941] Avg episode reward: [(0, '8.750'), (1, '9.570')] +[2023-10-08 14:22:26,927][102897] Updated weights for policy 0, policy_version 65210 (0.0007) +[2023-10-08 14:22:27,065][102898] Updated weights for policy 1, policy_version 65280 (0.0009) +[2023-10-08 14:22:30,799][102897] Updated weights for policy 0, policy_version 65220 (0.0008) +[2023-10-08 14:22:30,980][102898] Updated weights for policy 1, policy_version 65290 (0.0007) +[2023-10-08 14:22:31,158][102897] Updated weights for policy 0, policy_version 65230 (0.0008) +[2023-10-08 14:22:31,342][102898] Updated weights for policy 1, policy_version 65300 (0.0007) +[2023-10-08 14:22:31,538][102897] Updated weights for policy 0, policy_version 65240 (0.0008) +[2023-10-08 14:22:31,705][102898] Updated weights for policy 1, policy_version 65310 (0.0009) +[2023-10-08 14:22:31,875][101941] Fps is (10 sec: 19661.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 133693440. Throughput: 0: 1778.9, 1: 1790.8. Samples: 33426746. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:31,875][101941] Avg episode reward: [(0, '8.400'), (1, '9.070')] +[2023-10-08 14:22:35,258][102897] Updated weights for policy 0, policy_version 65250 (0.0008) +[2023-10-08 14:22:35,353][102898] Updated weights for policy 1, policy_version 65320 (0.0008) +[2023-10-08 14:22:35,631][102897] Updated weights for policy 0, policy_version 65260 (0.0009) +[2023-10-08 14:22:35,723][102898] Updated weights for policy 1, policy_version 65330 (0.0007) +[2023-10-08 14:22:35,990][102897] Updated weights for policy 0, policy_version 65270 (0.0008) +[2023-10-08 14:22:36,086][102898] Updated weights for policy 1, policy_version 65340 (0.0008) +[2023-10-08 14:22:36,368][102897] Updated weights for policy 0, policy_version 65280 (0.0008) +[2023-10-08 14:22:36,875][101941] Fps is (10 sec: 19661.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 133758976. Throughput: 0: 1778.7, 1: 1782.0. Samples: 33438584. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:36,875][101941] Avg episode reward: [(0, '9.130'), (1, '9.330')] +[2023-10-08 14:22:39,806][102898] Updated weights for policy 1, policy_version 65350 (0.0007) +[2023-10-08 14:22:40,054][102897] Updated weights for policy 0, policy_version 65290 (0.0007) +[2023-10-08 14:22:40,180][102898] Updated weights for policy 1, policy_version 65360 (0.0007) +[2023-10-08 14:22:40,423][102897] Updated weights for policy 0, policy_version 65300 (0.0008) +[2023-10-08 14:22:40,542][102898] Updated weights for policy 1, policy_version 65370 (0.0008) +[2023-10-08 14:22:40,793][102897] Updated weights for policy 0, policy_version 65310 (0.0008) +[2023-10-08 14:22:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 133824512. Throughput: 0: 1791.1, 1: 1791.8. Samples: 33459366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:41,876][101941] Avg episode reward: [(0, '8.970'), (1, '9.760')] +[2023-10-08 14:22:44,429][102898] Updated weights for policy 1, policy_version 65380 (0.0008) +[2023-10-08 14:22:44,741][102897] Updated weights for policy 0, policy_version 65320 (0.0008) +[2023-10-08 14:22:44,797][102898] Updated weights for policy 1, policy_version 65390 (0.0007) +[2023-10-08 14:22:45,108][102897] Updated weights for policy 0, policy_version 65330 (0.0009) +[2023-10-08 14:22:45,158][102898] Updated weights for policy 1, policy_version 65400 (0.0010) +[2023-10-08 14:22:45,481][102897] Updated weights for policy 0, policy_version 65340 (0.0008) +[2023-10-08 14:22:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 133890048. Throughput: 0: 1772.7, 1: 1771.7. Samples: 33480094. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:46,875][101941] Avg episode reward: [(0, '8.400'), (1, '9.160')] +[2023-10-08 14:22:49,145][102898] Updated weights for policy 1, policy_version 65410 (0.0009) +[2023-10-08 14:22:49,267][102897] Updated weights for policy 0, policy_version 65350 (0.0009) +[2023-10-08 14:22:49,506][102898] Updated weights for policy 1, policy_version 65420 (0.0008) +[2023-10-08 14:22:49,626][102897] Updated weights for policy 0, policy_version 65360 (0.0008) +[2023-10-08 14:22:49,879][102898] Updated weights for policy 1, policy_version 65430 (0.0008) +[2023-10-08 14:22:50,003][102897] Updated weights for policy 0, policy_version 65370 (0.0008) +[2023-10-08 14:22:50,244][102898] Updated weights for policy 1, policy_version 65440 (0.0007) +[2023-10-08 14:22:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 133955584. Throughput: 0: 1795.6, 1: 1791.9. Samples: 33491752. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:51,876][101941] Avg episode reward: [(0, '8.290'), (1, '9.710')] +[2023-10-08 14:22:53,920][102897] Updated weights for policy 0, policy_version 65380 (0.0009) +[2023-10-08 14:22:54,118][102898] Updated weights for policy 1, policy_version 65450 (0.0007) +[2023-10-08 14:22:54,281][102897] Updated weights for policy 0, policy_version 65390 (0.0009) +[2023-10-08 14:22:54,493][102898] Updated weights for policy 1, policy_version 65460 (0.0008) +[2023-10-08 14:22:54,651][102897] Updated weights for policy 0, policy_version 65400 (0.0009) +[2023-10-08 14:22:54,855][102898] Updated weights for policy 1, policy_version 65470 (0.0007) +[2023-10-08 14:22:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 134021120. Throughput: 0: 1766.6, 1: 1767.3. Samples: 33511620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:22:56,876][101941] Avg episode reward: [(0, '8.150'), (1, '9.420')] +[2023-10-08 14:22:58,537][102897] Updated weights for policy 0, policy_version 65410 (0.0009) +[2023-10-08 14:22:58,657][102898] Updated weights for policy 1, policy_version 65480 (0.0007) +[2023-10-08 14:22:58,914][102897] Updated weights for policy 0, policy_version 65420 (0.0007) +[2023-10-08 14:22:59,029][102898] Updated weights for policy 1, policy_version 65490 (0.0008) +[2023-10-08 14:22:59,287][102897] Updated weights for policy 0, policy_version 65430 (0.0008) +[2023-10-08 14:22:59,392][102898] Updated weights for policy 1, policy_version 65500 (0.0007) +[2023-10-08 14:22:59,652][102897] Updated weights for policy 0, policy_version 65440 (0.0007) +[2023-10-08 14:23:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 134086656. Throughput: 0: 1761.6, 1: 1769.6. Samples: 33533878. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:23:01,876][101941] Avg episode reward: [(0, '8.710'), (1, '9.680')] +[2023-10-08 14:23:03,154][102898] Updated weights for policy 1, policy_version 65510 (0.0008) +[2023-10-08 14:23:03,460][102897] Updated weights for policy 0, policy_version 65450 (0.0009) +[2023-10-08 14:23:03,517][102898] Updated weights for policy 1, policy_version 65520 (0.0007) +[2023-10-08 14:23:03,825][102897] Updated weights for policy 0, policy_version 65460 (0.0009) +[2023-10-08 14:23:03,891][102898] Updated weights for policy 1, policy_version 65530 (0.0008) +[2023-10-08 14:23:04,179][102897] Updated weights for policy 0, policy_version 65470 (0.0008) +[2023-10-08 14:23:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 134152192. Throughput: 0: 1764.0, 1: 1774.1. Samples: 33543598. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:06,875][101941] Avg episode reward: [(0, '8.320'), (1, '8.940')] +[2023-10-08 14:23:07,633][102898] Updated weights for policy 1, policy_version 65540 (0.0008) +[2023-10-08 14:23:08,003][102898] Updated weights for policy 1, policy_version 65550 (0.0008) +[2023-10-08 14:23:08,017][102897] Updated weights for policy 0, policy_version 65480 (0.0007) +[2023-10-08 14:23:08,363][102898] Updated weights for policy 1, policy_version 65560 (0.0009) +[2023-10-08 14:23:08,389][102897] Updated weights for policy 0, policy_version 65490 (0.0007) +[2023-10-08 14:23:08,759][102897] Updated weights for policy 0, policy_version 65500 (0.0008) +[2023-10-08 14:23:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 134217728. Throughput: 0: 1760.8, 1: 1779.7. Samples: 33565888. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:11,876][101941] Avg episode reward: [(0, '8.200'), (1, '8.660')] +[2023-10-08 14:23:12,107][102898] Updated weights for policy 1, policy_version 65570 (0.0010) +[2023-10-08 14:23:12,430][102897] Updated weights for policy 0, policy_version 65510 (0.0009) +[2023-10-08 14:23:12,467][102898] Updated weights for policy 1, policy_version 65580 (0.0009) +[2023-10-08 14:23:12,806][102897] Updated weights for policy 0, policy_version 65520 (0.0008) +[2023-10-08 14:23:12,834][102898] Updated weights for policy 1, policy_version 65590 (0.0009) +[2023-10-08 14:23:13,169][102897] Updated weights for policy 0, policy_version 65530 (0.0008) +[2023-10-08 14:23:13,197][102898] Updated weights for policy 1, policy_version 65600 (0.0007) +[2023-10-08 14:23:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 134283264. Throughput: 0: 1780.3, 1: 1808.2. Samples: 33588226. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:16,876][101941] Avg episode reward: [(0, '7.650'), (1, '7.680')] +[2023-10-08 14:23:16,897][102898] Updated weights for policy 1, policy_version 65610 (0.0007) +[2023-10-08 14:23:16,941][102897] Updated weights for policy 0, policy_version 65540 (0.0008) +[2023-10-08 14:23:17,269][102898] Updated weights for policy 1, policy_version 65620 (0.0008) +[2023-10-08 14:23:17,319][102897] Updated weights for policy 0, policy_version 65550 (0.0008) +[2023-10-08 14:23:17,627][102898] Updated weights for policy 1, policy_version 65630 (0.0007) +[2023-10-08 14:23:17,693][102897] Updated weights for policy 0, policy_version 65560 (0.0008) +[2023-10-08 14:23:21,408][102898] Updated weights for policy 1, policy_version 65640 (0.0008) +[2023-10-08 14:23:21,481][102897] Updated weights for policy 0, policy_version 65570 (0.0009) +[2023-10-08 14:23:21,778][102898] Updated weights for policy 1, policy_version 65650 (0.0008) +[2023-10-08 14:23:21,858][102897] Updated weights for policy 0, policy_version 65580 (0.0008) +[2023-10-08 14:23:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 134348800. Throughput: 0: 1757.9, 1: 1783.4. Samples: 33597940. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:21,875][101941] Avg episode reward: [(0, '8.150'), (1, '7.190')] +[2023-10-08 14:23:22,140][102898] Updated weights for policy 1, policy_version 65660 (0.0009) +[2023-10-08 14:23:22,238][102897] Updated weights for policy 0, policy_version 65590 (0.0008) +[2023-10-08 14:23:22,609][102897] Updated weights for policy 0, policy_version 65600 (0.0007) +[2023-10-08 14:23:26,027][102898] Updated weights for policy 1, policy_version 65670 (0.0007) +[2023-10-08 14:23:26,392][102898] Updated weights for policy 1, policy_version 65680 (0.0007) +[2023-10-08 14:23:26,437][102897] Updated weights for policy 0, policy_version 65610 (0.0008) +[2023-10-08 14:23:26,762][102898] Updated weights for policy 1, policy_version 65690 (0.0009) +[2023-10-08 14:23:26,806][102897] Updated weights for policy 0, policy_version 65620 (0.0007) +[2023-10-08 14:23:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 134414336. Throughput: 0: 1769.9, 1: 1801.4. Samples: 33620076. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:26,876][101941] Avg episode reward: [(0, '7.930'), (1, '7.930')] +[2023-10-08 14:23:27,179][102897] Updated weights for policy 0, policy_version 65630 (0.0008) +[2023-10-08 14:23:30,636][102898] Updated weights for policy 1, policy_version 65700 (0.0008) +[2023-10-08 14:23:30,945][102897] Updated weights for policy 0, policy_version 65640 (0.0009) +[2023-10-08 14:23:30,998][102898] Updated weights for policy 1, policy_version 65710 (0.0009) +[2023-10-08 14:23:31,311][102897] Updated weights for policy 0, policy_version 65650 (0.0009) +[2023-10-08 14:23:31,363][102898] Updated weights for policy 1, policy_version 65720 (0.0009) +[2023-10-08 14:23:31,675][102897] Updated weights for policy 0, policy_version 65660 (0.0010) +[2023-10-08 14:23:31,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 134545408. Throughput: 0: 1771.9, 1: 1790.3. Samples: 33640390. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:31,875][101941] Avg episode reward: [(0, '8.270'), (1, '8.350')] +[2023-10-08 14:23:35,087][102898] Updated weights for policy 1, policy_version 65730 (0.0007) +[2023-10-08 14:23:35,354][102897] Updated weights for policy 0, policy_version 65670 (0.0009) +[2023-10-08 14:23:35,454][102898] Updated weights for policy 1, policy_version 65740 (0.0007) +[2023-10-08 14:23:35,731][102897] Updated weights for policy 0, policy_version 65680 (0.0009) +[2023-10-08 14:23:35,828][102898] Updated weights for policy 1, policy_version 65750 (0.0007) +[2023-10-08 14:23:36,092][102897] Updated weights for policy 0, policy_version 65690 (0.0008) +[2023-10-08 14:23:36,188][102898] Updated weights for policy 1, policy_version 65760 (0.0008) +[2023-10-08 14:23:36,875][101941] Fps is (10 sec: 19661.1, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 134610944. Throughput: 0: 1773.2, 1: 1792.5. Samples: 33652206. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:36,876][101941] Avg episode reward: [(0, '8.890'), (1, '8.980')] +[2023-10-08 14:23:39,980][102897] Updated weights for policy 0, policy_version 65700 (0.0009) +[2023-10-08 14:23:40,049][102898] Updated weights for policy 1, policy_version 65770 (0.0008) +[2023-10-08 14:23:40,352][102897] Updated weights for policy 0, policy_version 65710 (0.0007) +[2023-10-08 14:23:40,409][102898] Updated weights for policy 1, policy_version 65780 (0.0007) +[2023-10-08 14:23:40,710][102897] Updated weights for policy 0, policy_version 65720 (0.0008) +[2023-10-08 14:23:40,775][102898] Updated weights for policy 1, policy_version 65790 (0.0009) +[2023-10-08 14:23:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 134676480. Throughput: 0: 1782.3, 1: 1796.9. Samples: 33672684. Policy #0 lag: (min: 0.0, avg: 21.8, max: 32.0) +[2023-10-08 14:23:41,875][101941] Avg episode reward: [(0, '9.340'), (1, '9.640')] +[2023-10-08 14:23:44,349][102897] Updated weights for policy 0, policy_version 65730 (0.0010) +[2023-10-08 14:23:44,661][102898] Updated weights for policy 1, policy_version 65800 (0.0009) +[2023-10-08 14:23:44,723][102897] Updated weights for policy 0, policy_version 65740 (0.0008) +[2023-10-08 14:23:45,047][102898] Updated weights for policy 1, policy_version 65810 (0.0009) +[2023-10-08 14:23:45,095][102897] Updated weights for policy 0, policy_version 65750 (0.0009) +[2023-10-08 14:23:45,415][102898] Updated weights for policy 1, policy_version 65820 (0.0007) +[2023-10-08 14:23:45,459][102897] Updated weights for policy 0, policy_version 65760 (0.0008) +[2023-10-08 14:23:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 134742016. Throughput: 0: 1772.3, 1: 1778.2. Samples: 33693650. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:23:46,875][101941] Avg episode reward: [(0, '8.490'), (1, '9.250')] +[2023-10-08 14:23:49,106][102898] Updated weights for policy 1, policy_version 65830 (0.0007) +[2023-10-08 14:23:49,371][102897] Updated weights for policy 0, policy_version 65770 (0.0007) +[2023-10-08 14:23:49,475][102898] Updated weights for policy 1, policy_version 65840 (0.0008) +[2023-10-08 14:23:49,738][102897] Updated weights for policy 0, policy_version 65780 (0.0009) +[2023-10-08 14:23:49,843][102898] Updated weights for policy 1, policy_version 65850 (0.0007) +[2023-10-08 14:23:50,110][102897] Updated weights for policy 0, policy_version 65790 (0.0008) +[2023-10-08 14:23:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 134807552. Throughput: 0: 1794.3, 1: 1788.6. Samples: 33704828. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:23:51,876][101941] Avg episode reward: [(0, '7.850'), (1, '8.750')] +[2023-10-08 14:23:53,671][102898] Updated weights for policy 1, policy_version 65860 (0.0007) +[2023-10-08 14:23:53,805][102897] Updated weights for policy 0, policy_version 65800 (0.0007) +[2023-10-08 14:23:54,038][102898] Updated weights for policy 1, policy_version 65870 (0.0010) +[2023-10-08 14:23:54,182][102897] Updated weights for policy 0, policy_version 65810 (0.0007) +[2023-10-08 14:23:54,395][102898] Updated weights for policy 1, policy_version 65880 (0.0007) +[2023-10-08 14:23:54,559][102897] Updated weights for policy 0, policy_version 65820 (0.0010) +[2023-10-08 14:23:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 134873088. Throughput: 0: 1774.8, 1: 1769.4. Samples: 33725378. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:23:56,876][101941] Avg episode reward: [(0, '7.900'), (1, '7.960')] +[2023-10-08 14:23:58,314][102897] Updated weights for policy 0, policy_version 65830 (0.0009) +[2023-10-08 14:23:58,370][102898] Updated weights for policy 1, policy_version 65890 (0.0007) +[2023-10-08 14:23:58,691][102897] Updated weights for policy 0, policy_version 65840 (0.0008) +[2023-10-08 14:23:58,727][102898] Updated weights for policy 1, policy_version 65900 (0.0009) +[2023-10-08 14:23:59,064][102897] Updated weights for policy 0, policy_version 65850 (0.0007) +[2023-10-08 14:23:59,096][102898] Updated weights for policy 1, policy_version 65910 (0.0008) +[2023-10-08 14:23:59,457][102898] Updated weights for policy 1, policy_version 65920 (0.0007) +[2023-10-08 14:24:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 134938624. Throughput: 0: 1774.8, 1: 1765.4. Samples: 33747536. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:24:01,876][101941] Avg episode reward: [(0, '8.340'), (1, '8.050')] +[2023-10-08 14:24:02,773][102897] Updated weights for policy 0, policy_version 65860 (0.0007) +[2023-10-08 14:24:03,142][102898] Updated weights for policy 1, policy_version 65930 (0.0007) +[2023-10-08 14:24:03,142][102897] Updated weights for policy 0, policy_version 65870 (0.0008) +[2023-10-08 14:24:03,510][102897] Updated weights for policy 0, policy_version 65880 (0.0009) +[2023-10-08 14:24:03,519][102898] Updated weights for policy 1, policy_version 65940 (0.0008) +[2023-10-08 14:24:03,880][102898] Updated weights for policy 1, policy_version 65950 (0.0009) +[2023-10-08 14:24:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 135004160. Throughput: 0: 1777.2, 1: 1765.9. Samples: 33757380. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:24:06,876][101941] Avg episode reward: [(0, '7.920'), (1, '9.000')] +[2023-10-08 14:24:07,342][102897] Updated weights for policy 0, policy_version 65890 (0.0009) +[2023-10-08 14:24:07,557][102898] Updated weights for policy 1, policy_version 65960 (0.0008) +[2023-10-08 14:24:07,713][102897] Updated weights for policy 0, policy_version 65900 (0.0008) +[2023-10-08 14:24:07,915][102898] Updated weights for policy 1, policy_version 65970 (0.0009) +[2023-10-08 14:24:08,092][102897] Updated weights for policy 0, policy_version 65910 (0.0008) +[2023-10-08 14:24:08,281][102898] Updated weights for policy 1, policy_version 65980 (0.0007) +[2023-10-08 14:24:08,459][102897] Updated weights for policy 0, policy_version 65920 (0.0008) +[2023-10-08 14:24:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 135069696. Throughput: 0: 1783.7, 1: 1769.8. Samples: 33779986. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:24:11,876][101941] Avg episode reward: [(0, '8.250'), (1, '9.410')] +[2023-10-08 14:24:12,126][102898] Updated weights for policy 1, policy_version 65990 (0.0008) +[2023-10-08 14:24:12,188][102897] Updated weights for policy 0, policy_version 65930 (0.0007) +[2023-10-08 14:24:12,493][102898] Updated weights for policy 1, policy_version 66000 (0.0007) +[2023-10-08 14:24:12,564][102897] Updated weights for policy 0, policy_version 65940 (0.0007) +[2023-10-08 14:24:12,865][102898] Updated weights for policy 1, policy_version 66010 (0.0008) +[2023-10-08 14:24:12,921][102897] Updated weights for policy 0, policy_version 65950 (0.0009) +[2023-10-08 14:24:16,567][102898] Updated weights for policy 1, policy_version 66020 (0.0007) +[2023-10-08 14:24:16,820][102897] Updated weights for policy 0, policy_version 65960 (0.0008) +[2023-10-08 14:24:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135135232. Throughput: 0: 1800.0, 1: 1798.1. Samples: 33802302. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:24:16,876][101941] Avg episode reward: [(0, '8.020'), (1, '9.240')] +[2023-10-08 14:24:16,936][102898] Updated weights for policy 1, policy_version 66030 (0.0007) +[2023-10-08 14:24:17,187][102897] Updated weights for policy 0, policy_version 65970 (0.0007) +[2023-10-08 14:24:17,302][102898] Updated weights for policy 1, policy_version 66040 (0.0007) +[2023-10-08 14:24:17,566][102897] Updated weights for policy 0, policy_version 65980 (0.0008) +[2023-10-08 14:24:17,590][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000066048_67633152.pth... +[2023-10-08 14:24:17,623][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000064352_65896448.pth +[2023-10-08 14:24:17,708][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000065984_67567616.pth... +[2023-10-08 14:24:17,737][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000064288_65830912.pth +[2023-10-08 14:24:21,199][102898] Updated weights for policy 1, policy_version 66050 (0.0007) +[2023-10-08 14:24:21,390][102897] Updated weights for policy 0, policy_version 65990 (0.0008) +[2023-10-08 14:24:21,573][102898] Updated weights for policy 1, policy_version 66060 (0.0008) +[2023-10-08 14:24:21,759][102897] Updated weights for policy 0, policy_version 66000 (0.0008) +[2023-10-08 14:24:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 135200768. Throughput: 0: 1774.7, 1: 1769.9. Samples: 33811712. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:24:21,876][101941] Avg episode reward: [(0, '7.820'), (1, '8.870')] +[2023-10-08 14:24:21,939][102898] Updated weights for policy 1, policy_version 66070 (0.0007) +[2023-10-08 14:24:22,122][102897] Updated weights for policy 0, policy_version 66010 (0.0007) +[2023-10-08 14:24:22,304][102898] Updated weights for policy 1, policy_version 66080 (0.0007) +[2023-10-08 14:24:25,919][102897] Updated weights for policy 0, policy_version 66020 (0.0007) +[2023-10-08 14:24:26,080][102898] Updated weights for policy 1, policy_version 66090 (0.0008) +[2023-10-08 14:24:26,290][102897] Updated weights for policy 0, policy_version 66030 (0.0008) +[2023-10-08 14:24:26,442][102898] Updated weights for policy 1, policy_version 66100 (0.0008) +[2023-10-08 14:24:26,659][102897] Updated weights for policy 0, policy_version 66040 (0.0009) +[2023-10-08 14:24:26,804][102898] Updated weights for policy 1, policy_version 66110 (0.0007) +[2023-10-08 14:24:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135266304. Throughput: 0: 1793.7, 1: 1791.1. Samples: 33833998. Policy #0 lag: (min: 31.0, avg: 33.6, max: 63.0) +[2023-10-08 14:24:26,876][101941] Avg episode reward: [(0, '7.960'), (1, '8.890')] +[2023-10-08 14:24:30,518][102897] Updated weights for policy 0, policy_version 66050 (0.0009) +[2023-10-08 14:24:30,565][102898] Updated weights for policy 1, policy_version 66120 (0.0009) +[2023-10-08 14:24:30,890][102897] Updated weights for policy 0, policy_version 66060 (0.0009) +[2023-10-08 14:24:30,929][102898] Updated weights for policy 1, policy_version 66130 (0.0009) +[2023-10-08 14:24:31,255][102897] Updated weights for policy 0, policy_version 66070 (0.0009) +[2023-10-08 14:24:31,294][102898] Updated weights for policy 1, policy_version 66140 (0.0008) +[2023-10-08 14:24:31,620][102897] Updated weights for policy 0, policy_version 66080 (0.0011) +[2023-10-08 14:24:31,875][101941] Fps is (10 sec: 19660.6, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 135397376. Throughput: 0: 1787.1, 1: 1772.0. Samples: 33853810. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:24:31,876][101941] Avg episode reward: [(0, '7.940'), (1, '8.620')] +[2023-10-08 14:24:35,060][102898] Updated weights for policy 1, policy_version 66150 (0.0009) +[2023-10-08 14:24:35,425][102898] Updated weights for policy 1, policy_version 66160 (0.0009) +[2023-10-08 14:24:35,516][102897] Updated weights for policy 0, policy_version 66090 (0.0008) +[2023-10-08 14:24:35,794][102898] Updated weights for policy 1, policy_version 66170 (0.0007) +[2023-10-08 14:24:35,890][102897] Updated weights for policy 0, policy_version 66100 (0.0008) +[2023-10-08 14:24:36,267][102897] Updated weights for policy 0, policy_version 66110 (0.0009) +[2023-10-08 14:24:36,875][101941] Fps is (10 sec: 19661.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 135462912. Throughput: 0: 1788.1, 1: 1790.3. Samples: 33865856. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:24:36,875][101941] Avg episode reward: [(0, '7.700'), (1, '8.610')] +[2023-10-08 14:24:39,565][102898] Updated weights for policy 1, policy_version 66180 (0.0009) +[2023-10-08 14:24:39,934][102898] Updated weights for policy 1, policy_version 66190 (0.0008) +[2023-10-08 14:24:40,043][102897] Updated weights for policy 0, policy_version 66120 (0.0008) +[2023-10-08 14:24:40,304][102898] Updated weights for policy 1, policy_version 66200 (0.0008) +[2023-10-08 14:24:40,411][102897] Updated weights for policy 0, policy_version 66130 (0.0008) +[2023-10-08 14:24:40,788][102897] Updated weights for policy 0, policy_version 66140 (0.0008) +[2023-10-08 14:24:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 135528448. Throughput: 0: 1789.8, 1: 1780.5. Samples: 33886040. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:24:41,876][101941] Avg episode reward: [(0, '7.600'), (1, '8.640')] +[2023-10-08 14:24:43,986][102898] Updated weights for policy 1, policy_version 66210 (0.0008) +[2023-10-08 14:24:44,348][102898] Updated weights for policy 1, policy_version 66220 (0.0010) +[2023-10-08 14:24:44,524][102897] Updated weights for policy 0, policy_version 66150 (0.0009) +[2023-10-08 14:24:44,714][102898] Updated weights for policy 1, policy_version 66230 (0.0008) +[2023-10-08 14:24:44,890][102897] Updated weights for policy 0, policy_version 66160 (0.0007) +[2023-10-08 14:24:45,081][102898] Updated weights for policy 1, policy_version 66240 (0.0008) +[2023-10-08 14:24:45,256][102897] Updated weights for policy 0, policy_version 66170 (0.0008) +[2023-10-08 14:24:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 135593984. Throughput: 0: 1775.7, 1: 1777.7. Samples: 33907440. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:24:46,875][101941] Avg episode reward: [(0, '7.900'), (1, '9.270')] +[2023-10-08 14:24:48,910][102898] Updated weights for policy 1, policy_version 66250 (0.0008) +[2023-10-08 14:24:48,971][102897] Updated weights for policy 0, policy_version 66180 (0.0009) +[2023-10-08 14:24:49,271][102898] Updated weights for policy 1, policy_version 66260 (0.0008) +[2023-10-08 14:24:49,350][102897] Updated weights for policy 0, policy_version 66190 (0.0007) +[2023-10-08 14:24:49,641][102898] Updated weights for policy 1, policy_version 66270 (0.0008) +[2023-10-08 14:24:49,719][102897] Updated weights for policy 0, policy_version 66200 (0.0007) +[2023-10-08 14:24:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135659520. Throughput: 0: 1793.2, 1: 1783.6. Samples: 33918338. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:24:51,875][101941] Avg episode reward: [(0, '8.260'), (1, '9.900')] +[2023-10-08 14:24:53,430][102897] Updated weights for policy 0, policy_version 66210 (0.0007) +[2023-10-08 14:24:53,441][102898] Updated weights for policy 1, policy_version 66280 (0.0008) +[2023-10-08 14:24:53,793][102897] Updated weights for policy 0, policy_version 66220 (0.0007) +[2023-10-08 14:24:53,801][102898] Updated weights for policy 1, policy_version 66290 (0.0008) +[2023-10-08 14:24:54,161][102897] Updated weights for policy 0, policy_version 66230 (0.0007) +[2023-10-08 14:24:54,165][102898] Updated weights for policy 1, policy_version 66300 (0.0008) +[2023-10-08 14:24:54,543][102897] Updated weights for policy 0, policy_version 66240 (0.0009) +[2023-10-08 14:24:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135725056. Throughput: 0: 1767.3, 1: 1772.6. Samples: 33939280. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:24:56,875][101941] Avg episode reward: [(0, '9.010'), (1, '9.780')] +[2023-10-08 14:24:58,029][102898] Updated weights for policy 1, policy_version 66310 (0.0008) +[2023-10-08 14:24:58,201][102897] Updated weights for policy 0, policy_version 66250 (0.0009) +[2023-10-08 14:24:58,402][102898] Updated weights for policy 1, policy_version 66320 (0.0008) +[2023-10-08 14:24:58,574][102897] Updated weights for policy 0, policy_version 66260 (0.0007) +[2023-10-08 14:24:58,760][102898] Updated weights for policy 1, policy_version 66330 (0.0009) +[2023-10-08 14:24:58,942][102897] Updated weights for policy 0, policy_version 66270 (0.0008) +[2023-10-08 14:25:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135790592. Throughput: 0: 1768.3, 1: 1773.0. Samples: 33961662. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:25:01,876][101941] Avg episode reward: [(0, '8.990'), (1, '9.200')] +[2023-10-08 14:25:02,627][102898] Updated weights for policy 1, policy_version 66340 (0.0007) +[2023-10-08 14:25:02,906][102897] Updated weights for policy 0, policy_version 66280 (0.0008) +[2023-10-08 14:25:02,996][102898] Updated weights for policy 1, policy_version 66350 (0.0008) +[2023-10-08 14:25:03,265][102897] Updated weights for policy 0, policy_version 66290 (0.0008) +[2023-10-08 14:25:03,353][102898] Updated weights for policy 1, policy_version 66360 (0.0007) +[2023-10-08 14:25:03,629][102897] Updated weights for policy 0, policy_version 66300 (0.0007) +[2023-10-08 14:25:06,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 135856128. Throughput: 0: 1769.9, 1: 1777.5. Samples: 33971342. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:25:06,876][101941] Avg episode reward: [(0, '7.800'), (1, '8.800')] +[2023-10-08 14:25:07,119][102898] Updated weights for policy 1, policy_version 66370 (0.0007) +[2023-10-08 14:25:07,483][102898] Updated weights for policy 1, policy_version 66380 (0.0007) +[2023-10-08 14:25:07,507][102897] Updated weights for policy 0, policy_version 66310 (0.0008) +[2023-10-08 14:25:07,861][102898] Updated weights for policy 1, policy_version 66390 (0.0007) +[2023-10-08 14:25:07,881][102897] Updated weights for policy 0, policy_version 66320 (0.0007) +[2023-10-08 14:25:08,221][102898] Updated weights for policy 1, policy_version 66400 (0.0008) +[2023-10-08 14:25:08,246][102897] Updated weights for policy 0, policy_version 66330 (0.0007) +[2023-10-08 14:25:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135921664. Throughput: 0: 1765.6, 1: 1778.7. Samples: 33993494. Policy #0 lag: (min: 31.0, avg: 33.9, max: 63.0) +[2023-10-08 14:25:11,876][101941] Avg episode reward: [(0, '7.790'), (1, '8.720')] +[2023-10-08 14:25:11,901][102897] Updated weights for policy 0, policy_version 66340 (0.0008) +[2023-10-08 14:25:12,027][102898] Updated weights for policy 1, policy_version 66410 (0.0007) +[2023-10-08 14:25:12,278][102897] Updated weights for policy 0, policy_version 66350 (0.0007) +[2023-10-08 14:25:12,386][102898] Updated weights for policy 1, policy_version 66420 (0.0007) +[2023-10-08 14:25:12,656][102897] Updated weights for policy 0, policy_version 66360 (0.0007) +[2023-10-08 14:25:12,758][102898] Updated weights for policy 1, policy_version 66430 (0.0008) +[2023-10-08 14:25:16,468][102897] Updated weights for policy 0, policy_version 66370 (0.0007) +[2023-10-08 14:25:16,595][102898] Updated weights for policy 1, policy_version 66440 (0.0009) +[2023-10-08 14:25:16,844][102897] Updated weights for policy 0, policy_version 66380 (0.0008) +[2023-10-08 14:25:16,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 135987200. Throughput: 0: 1788.5, 1: 1805.8. Samples: 34015554. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:16,875][101941] Avg episode reward: [(0, '8.320'), (1, '8.600')] +[2023-10-08 14:25:16,970][102898] Updated weights for policy 1, policy_version 66450 (0.0009) +[2023-10-08 14:25:17,206][102897] Updated weights for policy 0, policy_version 66390 (0.0007) +[2023-10-08 14:25:17,342][102898] Updated weights for policy 1, policy_version 66460 (0.0007) +[2023-10-08 14:25:17,580][102897] Updated weights for policy 0, policy_version 66400 (0.0008) +[2023-10-08 14:25:21,045][102898] Updated weights for policy 1, policy_version 66470 (0.0008) +[2023-10-08 14:25:21,404][102898] Updated weights for policy 1, policy_version 66480 (0.0009) +[2023-10-08 14:25:21,435][102897] Updated weights for policy 0, policy_version 66410 (0.0007) +[2023-10-08 14:25:21,769][102898] Updated weights for policy 1, policy_version 66490 (0.0010) +[2023-10-08 14:25:21,803][102897] Updated weights for policy 0, policy_version 66420 (0.0010) +[2023-10-08 14:25:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 136052736. Throughput: 0: 1767.1, 1: 1779.6. Samples: 34025460. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:21,875][101941] Avg episode reward: [(0, '7.940'), (1, '8.870')] +[2023-10-08 14:25:22,175][102897] Updated weights for policy 0, policy_version 66430 (0.0008) +[2023-10-08 14:25:25,689][102898] Updated weights for policy 1, policy_version 66500 (0.0009) +[2023-10-08 14:25:25,954][102897] Updated weights for policy 0, policy_version 66440 (0.0008) +[2023-10-08 14:25:26,061][102898] Updated weights for policy 1, policy_version 66510 (0.0007) +[2023-10-08 14:25:26,325][102897] Updated weights for policy 0, policy_version 66450 (0.0007) +[2023-10-08 14:25:26,430][102898] Updated weights for policy 1, policy_version 66520 (0.0009) +[2023-10-08 14:25:26,702][102897] Updated weights for policy 0, policy_version 66460 (0.0009) +[2023-10-08 14:25:26,875][101941] Fps is (10 sec: 19660.8, 60 sec: 15291.8, 300 sec: 14440.1). Total num frames: 136183808. Throughput: 0: 1785.0, 1: 1802.2. Samples: 34047462. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:26,875][101941] Avg episode reward: [(0, '7.840'), (1, '8.930')] +[2023-10-08 14:25:30,179][102898] Updated weights for policy 1, policy_version 66530 (0.0009) +[2023-10-08 14:25:30,545][102898] Updated weights for policy 1, policy_version 66540 (0.0007) +[2023-10-08 14:25:30,548][102897] Updated weights for policy 0, policy_version 66470 (0.0007) +[2023-10-08 14:25:30,911][102898] Updated weights for policy 1, policy_version 66550 (0.0007) +[2023-10-08 14:25:30,922][102897] Updated weights for policy 0, policy_version 66480 (0.0008) +[2023-10-08 14:25:31,268][102898] Updated weights for policy 1, policy_version 66560 (0.0008) +[2023-10-08 14:25:31,290][102897] Updated weights for policy 0, policy_version 66490 (0.0007) +[2023-10-08 14:25:31,875][101941] Fps is (10 sec: 19660.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 136249344. Throughput: 0: 1771.2, 1: 1773.8. Samples: 34066968. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:31,876][101941] Avg episode reward: [(0, '8.200'), (1, '9.860')] +[2023-10-08 14:25:34,930][102897] Updated weights for policy 0, policy_version 66500 (0.0008) +[2023-10-08 14:25:35,016][102898] Updated weights for policy 1, policy_version 66570 (0.0009) +[2023-10-08 14:25:35,308][102897] Updated weights for policy 0, policy_version 66510 (0.0008) +[2023-10-08 14:25:35,389][102898] Updated weights for policy 1, policy_version 66580 (0.0010) +[2023-10-08 14:25:35,679][102897] Updated weights for policy 0, policy_version 66520 (0.0008) +[2023-10-08 14:25:35,745][102898] Updated weights for policy 1, policy_version 66590 (0.0008) +[2023-10-08 14:25:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 136314880. Throughput: 0: 1785.2, 1: 1799.8. Samples: 34079664. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:36,876][101941] Avg episode reward: [(0, '7.040'), (1, '10.100')] +[2023-10-08 14:25:39,470][102897] Updated weights for policy 0, policy_version 66530 (0.0007) +[2023-10-08 14:25:39,584][102898] Updated weights for policy 1, policy_version 66600 (0.0008) +[2023-10-08 14:25:39,833][102897] Updated weights for policy 0, policy_version 66540 (0.0007) +[2023-10-08 14:25:39,958][102898] Updated weights for policy 1, policy_version 66610 (0.0007) +[2023-10-08 14:25:40,208][102897] Updated weights for policy 0, policy_version 66550 (0.0007) +[2023-10-08 14:25:40,320][102898] Updated weights for policy 1, policy_version 66620 (0.0009) +[2023-10-08 14:25:40,577][102897] Updated weights for policy 0, policy_version 66560 (0.0008) +[2023-10-08 14:25:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 136380416. Throughput: 0: 1781.1, 1: 1776.8. Samples: 34099386. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:41,875][101941] Avg episode reward: [(0, '6.130'), (1, '10.040')] +[2023-10-08 14:25:44,123][102898] Updated weights for policy 1, policy_version 66630 (0.0008) +[2023-10-08 14:25:44,347][102897] Updated weights for policy 0, policy_version 66570 (0.0008) +[2023-10-08 14:25:44,495][102898] Updated weights for policy 1, policy_version 66640 (0.0007) +[2023-10-08 14:25:44,709][102897] Updated weights for policy 0, policy_version 66580 (0.0007) +[2023-10-08 14:25:44,862][102898] Updated weights for policy 1, policy_version 66650 (0.0009) +[2023-10-08 14:25:45,082][102897] Updated weights for policy 0, policy_version 66590 (0.0007) +[2023-10-08 14:25:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 136445952. Throughput: 0: 1773.4, 1: 1772.3. Samples: 34121218. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:46,875][101941] Avg episode reward: [(0, '7.300'), (1, '10.170')] +[2023-10-08 14:25:48,653][102898] Updated weights for policy 1, policy_version 66660 (0.0008) +[2023-10-08 14:25:48,805][102897] Updated weights for policy 0, policy_version 66600 (0.0009) +[2023-10-08 14:25:49,020][102898] Updated weights for policy 1, policy_version 66670 (0.0011) +[2023-10-08 14:25:49,175][102897] Updated weights for policy 0, policy_version 66610 (0.0009) +[2023-10-08 14:25:49,389][102898] Updated weights for policy 1, policy_version 66680 (0.0007) +[2023-10-08 14:25:49,557][102897] Updated weights for policy 0, policy_version 66620 (0.0008) +[2023-10-08 14:25:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 136511488. Throughput: 0: 1787.6, 1: 1777.9. Samples: 34131790. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:51,876][101941] Avg episode reward: [(0, '7.570'), (1, '10.190')] +[2023-10-08 14:25:53,027][102898] Updated weights for policy 1, policy_version 66690 (0.0007) +[2023-10-08 14:25:53,391][102898] Updated weights for policy 1, policy_version 66700 (0.0008) +[2023-10-08 14:25:53,396][102897] Updated weights for policy 0, policy_version 66630 (0.0007) +[2023-10-08 14:25:53,756][102898] Updated weights for policy 1, policy_version 66710 (0.0008) +[2023-10-08 14:25:53,762][102897] Updated weights for policy 0, policy_version 66640 (0.0008) +[2023-10-08 14:25:54,121][102898] Updated weights for policy 1, policy_version 66720 (0.0008) +[2023-10-08 14:25:54,131][102897] Updated weights for policy 0, policy_version 66650 (0.0008) +[2023-10-08 14:25:56,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 136577024. Throughput: 0: 1778.0, 1: 1773.4. Samples: 34153310. Policy #0 lag: (min: 31.0, avg: 32.2, max: 54.0) +[2023-10-08 14:25:56,876][101941] Avg episode reward: [(0, '6.410'), (1, '9.490')] +[2023-10-08 14:25:57,935][102898] Updated weights for policy 1, policy_version 66730 (0.0007) +[2023-10-08 14:25:57,970][102897] Updated weights for policy 0, policy_version 66660 (0.0010) +[2023-10-08 14:25:58,295][102898] Updated weights for policy 1, policy_version 66740 (0.0008) +[2023-10-08 14:25:58,341][102897] Updated weights for policy 0, policy_version 66670 (0.0008) +[2023-10-08 14:25:58,658][102898] Updated weights for policy 1, policy_version 66750 (0.0007) +[2023-10-08 14:25:58,715][102897] Updated weights for policy 0, policy_version 66680 (0.0007) +[2023-10-08 14:26:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 136642560. Throughput: 0: 1770.0, 1: 1785.3. Samples: 34175544. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:01,876][101941] Avg episode reward: [(0, '7.460'), (1, '9.640')] +[2023-10-08 14:26:02,492][102898] Updated weights for policy 1, policy_version 66760 (0.0009) +[2023-10-08 14:26:02,577][102897] Updated weights for policy 0, policy_version 66690 (0.0008) +[2023-10-08 14:26:02,859][102898] Updated weights for policy 1, policy_version 66770 (0.0008) +[2023-10-08 14:26:02,956][102897] Updated weights for policy 0, policy_version 66700 (0.0008) +[2023-10-08 14:26:03,216][102898] Updated weights for policy 1, policy_version 66780 (0.0008) +[2023-10-08 14:26:03,324][102897] Updated weights for policy 0, policy_version 66710 (0.0008) +[2023-10-08 14:26:03,700][102897] Updated weights for policy 0, policy_version 66720 (0.0007) +[2023-10-08 14:26:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 136708096. Throughput: 0: 1771.5, 1: 1775.1. Samples: 34185060. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:06,876][101941] Avg episode reward: [(0, '7.850'), (1, '9.080')] +[2023-10-08 14:26:06,919][102898] Updated weights for policy 1, policy_version 66790 (0.0009) +[2023-10-08 14:26:07,285][102898] Updated weights for policy 1, policy_version 66800 (0.0007) +[2023-10-08 14:26:07,594][102897] Updated weights for policy 0, policy_version 66730 (0.0008) +[2023-10-08 14:26:07,649][102898] Updated weights for policy 1, policy_version 66810 (0.0008) +[2023-10-08 14:26:07,977][102897] Updated weights for policy 0, policy_version 66740 (0.0009) +[2023-10-08 14:26:08,348][102897] Updated weights for policy 0, policy_version 66750 (0.0008) +[2023-10-08 14:26:11,430][102898] Updated weights for policy 1, policy_version 66820 (0.0009) +[2023-10-08 14:26:11,797][102898] Updated weights for policy 1, policy_version 66830 (0.0009) +[2023-10-08 14:26:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 136773632. Throughput: 0: 1770.1, 1: 1783.0. Samples: 34207352. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:11,875][101941] Avg episode reward: [(0, '7.670'), (1, '9.100')] +[2023-10-08 14:26:12,001][102897] Updated weights for policy 0, policy_version 66760 (0.0008) +[2023-10-08 14:26:12,160][102898] Updated weights for policy 1, policy_version 66840 (0.0008) +[2023-10-08 14:26:12,375][102897] Updated weights for policy 0, policy_version 66770 (0.0008) +[2023-10-08 14:26:12,748][102897] Updated weights for policy 0, policy_version 66780 (0.0007) +[2023-10-08 14:26:15,972][102898] Updated weights for policy 1, policy_version 66850 (0.0010) +[2023-10-08 14:26:16,341][102898] Updated weights for policy 1, policy_version 66860 (0.0010) +[2023-10-08 14:26:16,607][102897] Updated weights for policy 0, policy_version 66790 (0.0008) +[2023-10-08 14:26:16,702][102898] Updated weights for policy 1, policy_version 66870 (0.0007) +[2023-10-08 14:26:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 136839168. Throughput: 0: 1797.5, 1: 1799.7. Samples: 34228842. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:16,875][101941] Avg episode reward: [(0, '7.850'), (1, '8.830')] +[2023-10-08 14:26:16,979][102897] Updated weights for policy 0, policy_version 66800 (0.0007) +[2023-10-08 14:26:17,063][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000066880_68485120.pth... +[2023-10-08 14:26:17,067][102898] Updated weights for policy 1, policy_version 66880 (0.0007) +[2023-10-08 14:26:17,097][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000065216_66781184.pth +[2023-10-08 14:26:17,101][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000066880_68485120.pth +[2023-10-08 14:26:17,345][102897] Updated weights for policy 0, policy_version 66810 (0.0008) +[2023-10-08 14:26:17,564][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000066816_68419584.pth... +[2023-10-08 14:26:17,593][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000065152_66715648.pth +[2023-10-08 14:26:17,597][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000066816_68419584.pth +[2023-10-08 14:26:20,882][102898] Updated weights for policy 1, policy_version 66890 (0.0008) +[2023-10-08 14:26:21,193][102897] Updated weights for policy 0, policy_version 66820 (0.0007) +[2023-10-08 14:26:21,254][102898] Updated weights for policy 1, policy_version 66900 (0.0008) +[2023-10-08 14:26:21,554][102897] Updated weights for policy 0, policy_version 66830 (0.0007) +[2023-10-08 14:26:21,616][102898] Updated weights for policy 1, policy_version 66910 (0.0007) +[2023-10-08 14:26:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 136937472. Throughput: 0: 1763.6, 1: 1783.6. Samples: 34239288. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:21,876][101941] Avg episode reward: [(0, '7.110'), (1, '8.760')] +[2023-10-08 14:26:21,920][102897] Updated weights for policy 0, policy_version 66840 (0.0009) +[2023-10-08 14:26:25,274][102898] Updated weights for policy 1, policy_version 66920 (0.0007) +[2023-10-08 14:26:25,566][102897] Updated weights for policy 0, policy_version 66850 (0.0010) +[2023-10-08 14:26:25,643][102898] Updated weights for policy 1, policy_version 66930 (0.0008) +[2023-10-08 14:26:25,929][102897] Updated weights for policy 0, policy_version 66860 (0.0009) +[2023-10-08 14:26:26,011][102898] Updated weights for policy 1, policy_version 66940 (0.0007) +[2023-10-08 14:26:26,296][102897] Updated weights for policy 0, policy_version 66870 (0.0010) +[2023-10-08 14:26:26,668][102897] Updated weights for policy 0, policy_version 66880 (0.0011) +[2023-10-08 14:26:26,875][101941] Fps is (10 sec: 19660.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 137035776. Throughput: 0: 1793.8, 1: 1807.9. Samples: 34261464. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:26,876][101941] Avg episode reward: [(0, '7.660'), (1, '9.000')] +[2023-10-08 14:26:29,643][102898] Updated weights for policy 1, policy_version 66950 (0.0009) +[2023-10-08 14:26:30,019][102898] Updated weights for policy 1, policy_version 66960 (0.0008) +[2023-10-08 14:26:30,381][102898] Updated weights for policy 1, policy_version 66970 (0.0007) +[2023-10-08 14:26:30,459][102897] Updated weights for policy 0, policy_version 66890 (0.0007) +[2023-10-08 14:26:30,826][102897] Updated weights for policy 0, policy_version 66900 (0.0008) +[2023-10-08 14:26:31,192][102897] Updated weights for policy 0, policy_version 66910 (0.0009) +[2023-10-08 14:26:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 137101312. Throughput: 0: 1768.0, 1: 1792.9. Samples: 34281456. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:31,876][101941] Avg episode reward: [(0, '8.050'), (1, '9.200')] +[2023-10-08 14:26:33,988][102898] Updated weights for policy 1, policy_version 66980 (0.0007) +[2023-10-08 14:26:34,354][102898] Updated weights for policy 1, policy_version 66990 (0.0008) +[2023-10-08 14:26:34,717][102898] Updated weights for policy 1, policy_version 67000 (0.0007) +[2023-10-08 14:26:34,984][102897] Updated weights for policy 0, policy_version 66920 (0.0008) +[2023-10-08 14:26:35,351][102897] Updated weights for policy 0, policy_version 66930 (0.0011) +[2023-10-08 14:26:35,722][102897] Updated weights for policy 0, policy_version 66940 (0.0011) +[2023-10-08 14:26:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137166848. Throughput: 0: 1787.7, 1: 1804.5. Samples: 34293440. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:36,876][101941] Avg episode reward: [(0, '8.300'), (1, '9.510')] +[2023-10-08 14:26:38,519][102898] Updated weights for policy 1, policy_version 67010 (0.0008) +[2023-10-08 14:26:38,892][102898] Updated weights for policy 1, policy_version 67020 (0.0008) +[2023-10-08 14:26:39,257][102898] Updated weights for policy 1, policy_version 67030 (0.0010) +[2023-10-08 14:26:39,521][102897] Updated weights for policy 0, policy_version 66950 (0.0007) +[2023-10-08 14:26:39,621][102898] Updated weights for policy 1, policy_version 67040 (0.0008) +[2023-10-08 14:26:39,886][102897] Updated weights for policy 0, policy_version 66960 (0.0007) +[2023-10-08 14:26:40,265][102897] Updated weights for policy 0, policy_version 66970 (0.0008) +[2023-10-08 14:26:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137232384. Throughput: 0: 1773.0, 1: 1794.7. Samples: 34313856. Policy #0 lag: (min: 22.0, avg: 22.0, max: 22.0) +[2023-10-08 14:26:41,876][101941] Avg episode reward: [(0, '8.270'), (1, '10.100')] +[2023-10-08 14:26:43,340][102898] Updated weights for policy 1, policy_version 67050 (0.0008) +[2023-10-08 14:26:43,710][102898] Updated weights for policy 1, policy_version 67060 (0.0010) +[2023-10-08 14:26:44,078][102898] Updated weights for policy 1, policy_version 67070 (0.0010) +[2023-10-08 14:26:44,153][102897] Updated weights for policy 0, policy_version 66980 (0.0007) +[2023-10-08 14:26:44,518][102897] Updated weights for policy 0, policy_version 66990 (0.0008) +[2023-10-08 14:26:44,893][102897] Updated weights for policy 0, policy_version 67000 (0.0008) +[2023-10-08 14:26:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137297920. Throughput: 0: 1772.9, 1: 1791.7. Samples: 34335948. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:26:46,875][101941] Avg episode reward: [(0, '8.000'), (1, '10.290')] +[2023-10-08 14:26:48,031][102898] Updated weights for policy 1, policy_version 67080 (0.0008) +[2023-10-08 14:26:48,406][102898] Updated weights for policy 1, policy_version 67090 (0.0008) +[2023-10-08 14:26:48,688][102897] Updated weights for policy 0, policy_version 67010 (0.0009) +[2023-10-08 14:26:48,785][102898] Updated weights for policy 1, policy_version 67100 (0.0009) +[2023-10-08 14:26:49,063][102897] Updated weights for policy 0, policy_version 67020 (0.0009) +[2023-10-08 14:26:49,435][102897] Updated weights for policy 0, policy_version 67030 (0.0008) +[2023-10-08 14:26:49,794][102897] Updated weights for policy 0, policy_version 67040 (0.0009) +[2023-10-08 14:26:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137363456. Throughput: 0: 1781.6, 1: 1795.2. Samples: 34346014. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:26:51,876][101941] Avg episode reward: [(0, '7.880'), (1, '9.350')] +[2023-10-08 14:26:52,390][102898] Updated weights for policy 1, policy_version 67110 (0.0010) +[2023-10-08 14:26:52,753][102898] Updated weights for policy 1, policy_version 67120 (0.0009) +[2023-10-08 14:26:53,124][102898] Updated weights for policy 1, policy_version 67130 (0.0009) +[2023-10-08 14:26:53,600][102897] Updated weights for policy 0, policy_version 67050 (0.0007) +[2023-10-08 14:26:53,968][102897] Updated weights for policy 0, policy_version 67060 (0.0007) +[2023-10-08 14:26:54,337][102897] Updated weights for policy 0, policy_version 67070 (0.0007) +[2023-10-08 14:26:56,847][102898] Updated weights for policy 1, policy_version 67140 (0.0008) +[2023-10-08 14:26:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137428992. Throughput: 0: 1768.8, 1: 1794.9. Samples: 34367718. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:26:56,876][101941] Avg episode reward: [(0, '7.660'), (1, '9.830')] +[2023-10-08 14:26:57,222][102898] Updated weights for policy 1, policy_version 67150 (0.0008) +[2023-10-08 14:26:57,582][102898] Updated weights for policy 1, policy_version 67160 (0.0009) +[2023-10-08 14:26:58,138][102897] Updated weights for policy 0, policy_version 67080 (0.0007) +[2023-10-08 14:26:58,513][102897] Updated weights for policy 0, policy_version 67090 (0.0007) +[2023-10-08 14:26:58,889][102897] Updated weights for policy 0, policy_version 67100 (0.0007) +[2023-10-08 14:27:01,443][102898] Updated weights for policy 1, policy_version 67170 (0.0008) +[2023-10-08 14:27:01,813][102898] Updated weights for policy 1, policy_version 67180 (0.0008) +[2023-10-08 14:27:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137494528. Throughput: 0: 1773.5, 1: 1806.8. Samples: 34389952. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:27:01,876][101941] Avg episode reward: [(0, '7.400'), (1, '9.940')] +[2023-10-08 14:27:02,186][102898] Updated weights for policy 1, policy_version 67190 (0.0007) +[2023-10-08 14:27:02,500][102897] Updated weights for policy 0, policy_version 67110 (0.0008) +[2023-10-08 14:27:02,553][102898] Updated weights for policy 1, policy_version 67200 (0.0007) +[2023-10-08 14:27:02,869][102897] Updated weights for policy 0, policy_version 67120 (0.0007) +[2023-10-08 14:27:03,232][102897] Updated weights for policy 0, policy_version 67130 (0.0008) +[2023-10-08 14:27:06,314][102898] Updated weights for policy 1, policy_version 67210 (0.0008) +[2023-10-08 14:27:06,675][102898] Updated weights for policy 1, policy_version 67220 (0.0007) +[2023-10-08 14:27:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137560064. Throughput: 0: 1774.2, 1: 1792.8. Samples: 34399804. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:27:06,875][101941] Avg episode reward: [(0, '7.570'), (1, '9.590')] +[2023-10-08 14:27:06,944][102897] Updated weights for policy 0, policy_version 67140 (0.0007) +[2023-10-08 14:27:07,040][102898] Updated weights for policy 1, policy_version 67230 (0.0008) +[2023-10-08 14:27:07,305][102897] Updated weights for policy 0, policy_version 67150 (0.0008) +[2023-10-08 14:27:07,675][102897] Updated weights for policy 0, policy_version 67160 (0.0010) +[2023-10-08 14:27:10,923][102898] Updated weights for policy 1, policy_version 67240 (0.0009) +[2023-10-08 14:27:11,297][102898] Updated weights for policy 1, policy_version 67250 (0.0009) +[2023-10-08 14:27:11,559][102897] Updated weights for policy 0, policy_version 67170 (0.0008) +[2023-10-08 14:27:11,669][102898] Updated weights for policy 1, policy_version 67260 (0.0008) +[2023-10-08 14:27:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 137658368. Throughput: 0: 1769.0, 1: 1797.3. Samples: 34421944. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:27:11,875][101941] Avg episode reward: [(0, '7.080'), (1, '9.090')] +[2023-10-08 14:27:11,929][102897] Updated weights for policy 0, policy_version 67180 (0.0010) +[2023-10-08 14:27:12,299][102897] Updated weights for policy 0, policy_version 67190 (0.0010) +[2023-10-08 14:27:12,677][102897] Updated weights for policy 0, policy_version 67200 (0.0008) +[2023-10-08 14:27:15,319][102898] Updated weights for policy 1, policy_version 67270 (0.0008) +[2023-10-08 14:27:15,687][102898] Updated weights for policy 1, policy_version 67280 (0.0008) +[2023-10-08 14:27:16,058][102898] Updated weights for policy 1, policy_version 67290 (0.0010) +[2023-10-08 14:27:16,527][102897] Updated weights for policy 0, policy_version 67210 (0.0009) +[2023-10-08 14:27:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 137723904. Throughput: 0: 1797.8, 1: 1786.2. Samples: 34442734. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:27:16,875][101941] Avg episode reward: [(0, '7.730'), (1, '9.560')] +[2023-10-08 14:27:16,887][102897] Updated weights for policy 0, policy_version 67220 (0.0008) +[2023-10-08 14:27:17,246][102897] Updated weights for policy 0, policy_version 67230 (0.0009) +[2023-10-08 14:27:19,849][102898] Updated weights for policy 1, policy_version 67300 (0.0009) +[2023-10-08 14:27:20,216][102898] Updated weights for policy 1, policy_version 67310 (0.0010) +[2023-10-08 14:27:20,583][102898] Updated weights for policy 1, policy_version 67320 (0.0010) +[2023-10-08 14:27:21,022][102897] Updated weights for policy 0, policy_version 67240 (0.0010) +[2023-10-08 14:27:21,398][102897] Updated weights for policy 0, policy_version 67250 (0.0011) +[2023-10-08 14:27:21,774][102897] Updated weights for policy 0, policy_version 67260 (0.0010) +[2023-10-08 14:27:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 137789440. Throughput: 0: 1770.9, 1: 1798.8. Samples: 34454076. Policy #0 lag: (min: 6.0, avg: 14.0, max: 38.0) +[2023-10-08 14:27:21,875][101941] Avg episode reward: [(0, '7.680'), (1, '9.510')] +[2023-10-08 14:27:24,608][102898] Updated weights for policy 1, policy_version 67330 (0.0010) +[2023-10-08 14:27:24,975][102898] Updated weights for policy 1, policy_version 67340 (0.0010) +[2023-10-08 14:27:25,351][102898] Updated weights for policy 1, policy_version 67350 (0.0009) +[2023-10-08 14:27:25,599][102897] Updated weights for policy 0, policy_version 67270 (0.0010) +[2023-10-08 14:27:25,717][102898] Updated weights for policy 1, policy_version 67360 (0.0007) +[2023-10-08 14:27:25,967][102897] Updated weights for policy 0, policy_version 67280 (0.0008) +[2023-10-08 14:27:26,341][102897] Updated weights for policy 0, policy_version 67290 (0.0007) +[2023-10-08 14:27:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137887744. Throughput: 0: 1796.7, 1: 1782.8. Samples: 34474934. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:26,876][101941] Avg episode reward: [(0, '8.000'), (1, '8.840')] +[2023-10-08 14:27:29,441][102898] Updated weights for policy 1, policy_version 67370 (0.0008) +[2023-10-08 14:27:29,806][102898] Updated weights for policy 1, policy_version 67380 (0.0008) +[2023-10-08 14:27:30,083][102897] Updated weights for policy 0, policy_version 67300 (0.0008) +[2023-10-08 14:27:30,176][102898] Updated weights for policy 1, policy_version 67390 (0.0010) +[2023-10-08 14:27:30,463][102897] Updated weights for policy 0, policy_version 67310 (0.0009) +[2023-10-08 14:27:30,824][102897] Updated weights for policy 0, policy_version 67320 (0.0009) +[2023-10-08 14:27:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 137953280. Throughput: 0: 1772.9, 1: 1772.5. Samples: 34495492. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:31,875][101941] Avg episode reward: [(0, '7.400'), (1, '8.540')] +[2023-10-08 14:27:34,018][102898] Updated weights for policy 1, policy_version 67400 (0.0008) +[2023-10-08 14:27:34,387][102898] Updated weights for policy 1, policy_version 67410 (0.0007) +[2023-10-08 14:27:34,466][102897] Updated weights for policy 0, policy_version 67330 (0.0008) +[2023-10-08 14:27:34,749][102898] Updated weights for policy 1, policy_version 67420 (0.0008) +[2023-10-08 14:27:34,830][102897] Updated weights for policy 0, policy_version 67340 (0.0009) +[2023-10-08 14:27:35,207][102897] Updated weights for policy 0, policy_version 67350 (0.0009) +[2023-10-08 14:27:35,571][102897] Updated weights for policy 0, policy_version 67360 (0.0008) +[2023-10-08 14:27:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 138018816. Throughput: 0: 1801.3, 1: 1787.2. Samples: 34507498. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:36,876][101941] Avg episode reward: [(0, '7.740'), (1, '9.050')] +[2023-10-08 14:27:38,594][102898] Updated weights for policy 1, policy_version 67430 (0.0008) +[2023-10-08 14:27:38,964][102898] Updated weights for policy 1, policy_version 67440 (0.0010) +[2023-10-08 14:27:39,315][102897] Updated weights for policy 0, policy_version 67370 (0.0008) +[2023-10-08 14:27:39,328][102898] Updated weights for policy 1, policy_version 67450 (0.0007) +[2023-10-08 14:27:39,678][102897] Updated weights for policy 0, policy_version 67380 (0.0008) +[2023-10-08 14:27:40,050][102897] Updated weights for policy 0, policy_version 67390 (0.0009) +[2023-10-08 14:27:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 138084352. Throughput: 0: 1785.7, 1: 1770.8. Samples: 34527762. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:41,876][101941] Avg episode reward: [(0, '8.040'), (1, '9.970')] +[2023-10-08 14:27:43,001][102898] Updated weights for policy 1, policy_version 67460 (0.0007) +[2023-10-08 14:27:43,368][102898] Updated weights for policy 1, policy_version 67470 (0.0008) +[2023-10-08 14:27:43,723][102898] Updated weights for policy 1, policy_version 67480 (0.0008) +[2023-10-08 14:27:43,856][102897] Updated weights for policy 0, policy_version 67400 (0.0008) +[2023-10-08 14:27:44,221][102897] Updated weights for policy 0, policy_version 67410 (0.0009) +[2023-10-08 14:27:44,604][102897] Updated weights for policy 0, policy_version 67420 (0.0011) +[2023-10-08 14:27:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 138149888. Throughput: 0: 1782.0, 1: 1781.4. Samples: 34550304. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:46,876][101941] Avg episode reward: [(0, '8.080'), (1, '9.620')] +[2023-10-08 14:27:47,498][102898] Updated weights for policy 1, policy_version 67490 (0.0007) +[2023-10-08 14:27:47,861][102898] Updated weights for policy 1, policy_version 67500 (0.0009) +[2023-10-08 14:27:48,230][102898] Updated weights for policy 1, policy_version 67510 (0.0007) +[2023-10-08 14:27:48,288][102897] Updated weights for policy 0, policy_version 67430 (0.0008) +[2023-10-08 14:27:48,594][102898] Updated weights for policy 1, policy_version 67520 (0.0007) +[2023-10-08 14:27:48,646][102897] Updated weights for policy 0, policy_version 67440 (0.0010) +[2023-10-08 14:27:49,019][102897] Updated weights for policy 0, policy_version 67450 (0.0010) +[2023-10-08 14:27:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 138215424. Throughput: 0: 1783.6, 1: 1777.0. Samples: 34560030. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:51,876][101941] Avg episode reward: [(0, '8.380'), (1, '9.230')] +[2023-10-08 14:27:52,463][102898] Updated weights for policy 1, policy_version 67530 (0.0007) +[2023-10-08 14:27:52,822][102898] Updated weights for policy 1, policy_version 67540 (0.0008) +[2023-10-08 14:27:52,825][102897] Updated weights for policy 0, policy_version 67460 (0.0008) +[2023-10-08 14:27:53,187][102898] Updated weights for policy 1, policy_version 67550 (0.0008) +[2023-10-08 14:27:53,199][102897] Updated weights for policy 0, policy_version 67470 (0.0008) +[2023-10-08 14:27:53,567][102897] Updated weights for policy 0, policy_version 67480 (0.0011) +[2023-10-08 14:27:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 138280960. Throughput: 0: 1787.1, 1: 1775.0. Samples: 34582236. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:27:56,875][101941] Avg episode reward: [(0, '8.180'), (1, '8.950')] +[2023-10-08 14:27:57,016][102898] Updated weights for policy 1, policy_version 67560 (0.0009) +[2023-10-08 14:27:57,380][102898] Updated weights for policy 1, policy_version 67570 (0.0009) +[2023-10-08 14:27:57,485][102897] Updated weights for policy 0, policy_version 67490 (0.0008) +[2023-10-08 14:27:57,746][102898] Updated weights for policy 1, policy_version 67580 (0.0009) +[2023-10-08 14:27:57,859][102897] Updated weights for policy 0, policy_version 67500 (0.0007) +[2023-10-08 14:27:58,231][102897] Updated weights for policy 0, policy_version 67510 (0.0008) +[2023-10-08 14:27:58,606][102897] Updated weights for policy 0, policy_version 67520 (0.0008) +[2023-10-08 14:28:01,500][102898] Updated weights for policy 1, policy_version 67590 (0.0010) +[2023-10-08 14:28:01,873][102898] Updated weights for policy 1, policy_version 67600 (0.0008) +[2023-10-08 14:28:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 138346496. Throughput: 0: 1787.1, 1: 1799.9. Samples: 34604150. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:28:01,876][101941] Avg episode reward: [(0, '7.910'), (1, '9.080')] +[2023-10-08 14:28:02,243][102898] Updated weights for policy 1, policy_version 67610 (0.0007) +[2023-10-08 14:28:02,506][102897] Updated weights for policy 0, policy_version 67530 (0.0008) +[2023-10-08 14:28:02,868][102897] Updated weights for policy 0, policy_version 67540 (0.0009) +[2023-10-08 14:28:03,239][102897] Updated weights for policy 0, policy_version 67550 (0.0007) +[2023-10-08 14:28:06,022][102898] Updated weights for policy 1, policy_version 67620 (0.0008) +[2023-10-08 14:28:06,384][102898] Updated weights for policy 1, policy_version 67630 (0.0009) +[2023-10-08 14:28:06,750][102898] Updated weights for policy 1, policy_version 67640 (0.0009) +[2023-10-08 14:28:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 138412032. Throughput: 0: 1781.7, 1: 1777.2. Samples: 34614226. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:28:06,876][101941] Avg episode reward: [(0, '7.880'), (1, '8.650')] +[2023-10-08 14:28:06,976][102897] Updated weights for policy 0, policy_version 67560 (0.0008) +[2023-10-08 14:28:07,340][102897] Updated weights for policy 0, policy_version 67570 (0.0009) +[2023-10-08 14:28:07,721][102897] Updated weights for policy 0, policy_version 67580 (0.0011) +[2023-10-08 14:28:10,482][102898] Updated weights for policy 1, policy_version 67650 (0.0008) +[2023-10-08 14:28:10,847][102898] Updated weights for policy 1, policy_version 67660 (0.0009) +[2023-10-08 14:28:11,204][102898] Updated weights for policy 1, policy_version 67670 (0.0010) +[2023-10-08 14:28:11,558][102897] Updated weights for policy 0, policy_version 67590 (0.0007) +[2023-10-08 14:28:11,577][102898] Updated weights for policy 1, policy_version 67680 (0.0009) +[2023-10-08 14:28:11,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 138510336. Throughput: 0: 1782.2, 1: 1806.4. Samples: 34636424. Policy #0 lag: (min: 31.0, avg: 35.5, max: 63.0) +[2023-10-08 14:28:11,876][101941] Avg episode reward: [(0, '8.560'), (1, '9.000')] +[2023-10-08 14:28:11,930][102897] Updated weights for policy 0, policy_version 67600 (0.0012) +[2023-10-08 14:28:12,296][102897] Updated weights for policy 0, policy_version 67610 (0.0008) +[2023-10-08 14:28:15,375][102898] Updated weights for policy 1, policy_version 67690 (0.0008) +[2023-10-08 14:28:15,733][102898] Updated weights for policy 1, policy_version 67700 (0.0009) +[2023-10-08 14:28:16,097][102898] Updated weights for policy 1, policy_version 67710 (0.0008) +[2023-10-08 14:28:16,161][102897] Updated weights for policy 0, policy_version 67620 (0.0009) +[2023-10-08 14:28:16,529][102897] Updated weights for policy 0, policy_version 67630 (0.0008) +[2023-10-08 14:28:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 138575872. Throughput: 0: 1803.2, 1: 1786.8. Samples: 34657040. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:16,876][101941] Avg episode reward: [(0, '8.120'), (1, '9.210')] +[2023-10-08 14:28:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000067712_69337088.pth... +[2023-10-08 14:28:16,905][102897] Updated weights for policy 0, policy_version 67640 (0.0007) +[2023-10-08 14:28:16,919][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000066048_67633152.pth +[2023-10-08 14:28:17,191][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000067648_69271552.pth... +[2023-10-08 14:28:17,228][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000065984_67567616.pth +[2023-10-08 14:28:19,836][102898] Updated weights for policy 1, policy_version 67720 (0.0009) +[2023-10-08 14:28:20,215][102898] Updated weights for policy 1, policy_version 67730 (0.0009) +[2023-10-08 14:28:20,565][102897] Updated weights for policy 0, policy_version 67650 (0.0007) +[2023-10-08 14:28:20,579][102898] Updated weights for policy 1, policy_version 67740 (0.0008) +[2023-10-08 14:28:20,933][102897] Updated weights for policy 0, policy_version 67660 (0.0009) +[2023-10-08 14:28:21,318][102897] Updated weights for policy 0, policy_version 67670 (0.0009) +[2023-10-08 14:28:21,684][102897] Updated weights for policy 0, policy_version 67680 (0.0007) +[2023-10-08 14:28:21,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 138674176. Throughput: 0: 1779.7, 1: 1807.1. Samples: 34668902. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:21,876][101941] Avg episode reward: [(0, '7.430'), (1, '9.180')] +[2023-10-08 14:28:24,355][102898] Updated weights for policy 1, policy_version 67750 (0.0008) +[2023-10-08 14:28:24,722][102898] Updated weights for policy 1, policy_version 67760 (0.0009) +[2023-10-08 14:28:25,088][102898] Updated weights for policy 1, policy_version 67770 (0.0007) +[2023-10-08 14:28:25,292][102897] Updated weights for policy 0, policy_version 67690 (0.0008) +[2023-10-08 14:28:25,664][102897] Updated weights for policy 0, policy_version 67700 (0.0009) +[2023-10-08 14:28:26,044][102897] Updated weights for policy 0, policy_version 67710 (0.0008) +[2023-10-08 14:28:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 138739712. Throughput: 0: 1800.7, 1: 1780.8. Samples: 34688928. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:26,876][101941] Avg episode reward: [(0, '7.920'), (1, '9.000')] +[2023-10-08 14:28:28,940][102898] Updated weights for policy 1, policy_version 67780 (0.0009) +[2023-10-08 14:28:29,305][102898] Updated weights for policy 1, policy_version 67790 (0.0008) +[2023-10-08 14:28:29,679][102898] Updated weights for policy 1, policy_version 67800 (0.0007) +[2023-10-08 14:28:29,838][102897] Updated weights for policy 0, policy_version 67720 (0.0009) +[2023-10-08 14:28:30,218][102897] Updated weights for policy 0, policy_version 67730 (0.0008) +[2023-10-08 14:28:30,601][102897] Updated weights for policy 0, policy_version 67740 (0.0009) +[2023-10-08 14:28:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 138805248. Throughput: 0: 1782.4, 1: 1776.7. Samples: 34710462. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:31,876][101941] Avg episode reward: [(0, '8.350'), (1, '9.550')] +[2023-10-08 14:28:33,225][102898] Updated weights for policy 1, policy_version 67810 (0.0007) +[2023-10-08 14:28:33,594][102898] Updated weights for policy 1, policy_version 67820 (0.0008) +[2023-10-08 14:28:33,964][102898] Updated weights for policy 1, policy_version 67830 (0.0009) +[2023-10-08 14:28:34,298][102897] Updated weights for policy 0, policy_version 67750 (0.0008) +[2023-10-08 14:28:34,325][102898] Updated weights for policy 1, policy_version 67840 (0.0008) +[2023-10-08 14:28:34,671][102897] Updated weights for policy 0, policy_version 67760 (0.0007) +[2023-10-08 14:28:35,036][102897] Updated weights for policy 0, policy_version 67770 (0.0007) +[2023-10-08 14:28:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 138870784. Throughput: 0: 1807.8, 1: 1777.6. Samples: 34721372. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:36,876][101941] Avg episode reward: [(0, '8.260'), (1, '9.590')] +[2023-10-08 14:28:38,117][102898] Updated weights for policy 1, policy_version 67850 (0.0007) +[2023-10-08 14:28:38,484][102898] Updated weights for policy 1, policy_version 67860 (0.0009) +[2023-10-08 14:28:38,853][102898] Updated weights for policy 1, policy_version 67870 (0.0009) +[2023-10-08 14:28:38,901][102897] Updated weights for policy 0, policy_version 67780 (0.0008) +[2023-10-08 14:28:39,270][102897] Updated weights for policy 0, policy_version 67790 (0.0007) +[2023-10-08 14:28:39,641][102897] Updated weights for policy 0, policy_version 67800 (0.0008) +[2023-10-08 14:28:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 138936320. Throughput: 0: 1781.0, 1: 1786.1. Samples: 34742756. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:41,876][101941] Avg episode reward: [(0, '7.760'), (1, '9.630')] +[2023-10-08 14:28:42,615][102898] Updated weights for policy 1, policy_version 67880 (0.0008) +[2023-10-08 14:28:42,978][102898] Updated weights for policy 1, policy_version 67890 (0.0009) +[2023-10-08 14:28:43,310][102897] Updated weights for policy 0, policy_version 67810 (0.0007) +[2023-10-08 14:28:43,345][102898] Updated weights for policy 1, policy_version 67900 (0.0009) +[2023-10-08 14:28:43,679][102897] Updated weights for policy 0, policy_version 67820 (0.0007) +[2023-10-08 14:28:44,056][102897] Updated weights for policy 0, policy_version 67830 (0.0011) +[2023-10-08 14:28:44,434][102897] Updated weights for policy 0, policy_version 67840 (0.0010) +[2023-10-08 14:28:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 139001856. Throughput: 0: 1781.3, 1: 1796.0. Samples: 34765130. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:46,876][101941] Avg episode reward: [(0, '7.570'), (1, '8.230')] +[2023-10-08 14:28:47,113][102898] Updated weights for policy 1, policy_version 67910 (0.0008) +[2023-10-08 14:28:47,477][102898] Updated weights for policy 1, policy_version 67920 (0.0008) +[2023-10-08 14:28:47,841][102898] Updated weights for policy 1, policy_version 67930 (0.0008) +[2023-10-08 14:28:48,196][102897] Updated weights for policy 0, policy_version 67850 (0.0008) +[2023-10-08 14:28:48,564][102897] Updated weights for policy 0, policy_version 67860 (0.0007) +[2023-10-08 14:28:48,931][102897] Updated weights for policy 0, policy_version 67870 (0.0007) +[2023-10-08 14:28:51,656][102898] Updated weights for policy 1, policy_version 67940 (0.0009) +[2023-10-08 14:28:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139067392. Throughput: 0: 1783.7, 1: 1787.5. Samples: 34774928. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:51,876][101941] Avg episode reward: [(0, '7.680'), (1, '7.810')] +[2023-10-08 14:28:52,033][102898] Updated weights for policy 1, policy_version 67950 (0.0008) +[2023-10-08 14:28:52,394][102898] Updated weights for policy 1, policy_version 67960 (0.0008) +[2023-10-08 14:28:52,673][102897] Updated weights for policy 0, policy_version 67880 (0.0007) +[2023-10-08 14:28:53,055][102897] Updated weights for policy 0, policy_version 67890 (0.0007) +[2023-10-08 14:28:53,428][102897] Updated weights for policy 0, policy_version 67900 (0.0008) +[2023-10-08 14:28:56,181][102898] Updated weights for policy 1, policy_version 67970 (0.0008) +[2023-10-08 14:28:56,555][102898] Updated weights for policy 1, policy_version 67980 (0.0007) +[2023-10-08 14:28:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139132928. Throughput: 0: 1787.1, 1: 1784.0. Samples: 34797122. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:28:56,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.430')] +[2023-10-08 14:28:56,910][102898] Updated weights for policy 1, policy_version 67990 (0.0008) +[2023-10-08 14:28:57,112][102897] Updated weights for policy 0, policy_version 67910 (0.0008) +[2023-10-08 14:28:57,270][102898] Updated weights for policy 1, policy_version 68000 (0.0008) +[2023-10-08 14:28:57,486][102897] Updated weights for policy 0, policy_version 67920 (0.0008) +[2023-10-08 14:28:57,857][102897] Updated weights for policy 0, policy_version 67930 (0.0008) +[2023-10-08 14:29:01,065][102898] Updated weights for policy 1, policy_version 68010 (0.0009) +[2023-10-08 14:29:01,429][102898] Updated weights for policy 1, policy_version 68020 (0.0009) +[2023-10-08 14:29:01,564][102897] Updated weights for policy 0, policy_version 67940 (0.0008) +[2023-10-08 14:29:01,796][102898] Updated weights for policy 1, policy_version 68030 (0.0008) +[2023-10-08 14:29:01,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 139231232. Throughput: 0: 1793.9, 1: 1793.0. Samples: 34818448. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:01,876][101941] Avg episode reward: [(0, '7.350'), (1, '8.950')] +[2023-10-08 14:29:01,932][102897] Updated weights for policy 0, policy_version 67950 (0.0008) +[2023-10-08 14:29:02,303][102897] Updated weights for policy 0, policy_version 67960 (0.0007) +[2023-10-08 14:29:05,888][102898] Updated weights for policy 1, policy_version 68040 (0.0009) +[2023-10-08 14:29:05,981][102897] Updated weights for policy 0, policy_version 67970 (0.0008) +[2023-10-08 14:29:06,244][102898] Updated weights for policy 1, policy_version 68050 (0.0007) +[2023-10-08 14:29:06,343][102897] Updated weights for policy 0, policy_version 67980 (0.0007) +[2023-10-08 14:29:06,606][102898] Updated weights for policy 1, policy_version 68060 (0.0009) +[2023-10-08 14:29:06,721][102897] Updated weights for policy 0, policy_version 67990 (0.0009) +[2023-10-08 14:29:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 139296768. Throughput: 0: 1779.4, 1: 1777.4. Samples: 34828958. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:06,876][101941] Avg episode reward: [(0, '7.630'), (1, '9.490')] +[2023-10-08 14:29:07,092][102897] Updated weights for policy 0, policy_version 68000 (0.0009) +[2023-10-08 14:29:10,403][102898] Updated weights for policy 1, policy_version 68070 (0.0009) +[2023-10-08 14:29:10,770][102898] Updated weights for policy 1, policy_version 68080 (0.0008) +[2023-10-08 14:29:10,930][102897] Updated weights for policy 0, policy_version 68010 (0.0008) +[2023-10-08 14:29:11,136][102898] Updated weights for policy 1, policy_version 68090 (0.0007) +[2023-10-08 14:29:11,303][102897] Updated weights for policy 0, policy_version 68020 (0.0008) +[2023-10-08 14:29:11,670][102897] Updated weights for policy 0, policy_version 68030 (0.0007) +[2023-10-08 14:29:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 139395072. Throughput: 0: 1791.8, 1: 1804.8. Samples: 34850774. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:11,876][101941] Avg episode reward: [(0, '8.470'), (1, '9.820')] +[2023-10-08 14:29:14,880][102898] Updated weights for policy 1, policy_version 68100 (0.0009) +[2023-10-08 14:29:15,247][102898] Updated weights for policy 1, policy_version 68110 (0.0011) +[2023-10-08 14:29:15,509][102897] Updated weights for policy 0, policy_version 68040 (0.0009) +[2023-10-08 14:29:15,611][102898] Updated weights for policy 1, policy_version 68120 (0.0007) +[2023-10-08 14:29:15,883][102897] Updated weights for policy 0, policy_version 68050 (0.0008) +[2023-10-08 14:29:16,260][102897] Updated weights for policy 0, policy_version 68060 (0.0008) +[2023-10-08 14:29:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 139460608. Throughput: 0: 1778.9, 1: 1777.7. Samples: 34870510. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:16,875][101941] Avg episode reward: [(0, '7.760'), (1, '8.470')] +[2023-10-08 14:29:19,450][102898] Updated weights for policy 1, policy_version 68130 (0.0008) +[2023-10-08 14:29:19,815][102898] Updated weights for policy 1, policy_version 68140 (0.0007) +[2023-10-08 14:29:19,847][102897] Updated weights for policy 0, policy_version 68070 (0.0009) +[2023-10-08 14:29:20,182][102898] Updated weights for policy 1, policy_version 68150 (0.0008) +[2023-10-08 14:29:20,215][102897] Updated weights for policy 0, policy_version 68080 (0.0008) +[2023-10-08 14:29:20,543][102898] Updated weights for policy 1, policy_version 68160 (0.0010) +[2023-10-08 14:29:20,579][102897] Updated weights for policy 0, policy_version 68090 (0.0007) +[2023-10-08 14:29:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 139526144. Throughput: 0: 1789.8, 1: 1805.1. Samples: 34883142. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:21,875][101941] Avg episode reward: [(0, '7.760'), (1, '8.760')] +[2023-10-08 14:29:24,302][102898] Updated weights for policy 1, policy_version 68170 (0.0010) +[2023-10-08 14:29:24,360][102897] Updated weights for policy 0, policy_version 68100 (0.0009) +[2023-10-08 14:29:24,666][102898] Updated weights for policy 1, policy_version 68180 (0.0007) +[2023-10-08 14:29:24,739][102897] Updated weights for policy 0, policy_version 68110 (0.0008) +[2023-10-08 14:29:25,030][102898] Updated weights for policy 1, policy_version 68190 (0.0008) +[2023-10-08 14:29:25,099][102897] Updated weights for policy 0, policy_version 68120 (0.0008) +[2023-10-08 14:29:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139591680. Throughput: 0: 1780.8, 1: 1771.8. Samples: 34902626. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:26,876][101941] Avg episode reward: [(0, '9.080'), (1, '9.150')] +[2023-10-08 14:29:28,806][102898] Updated weights for policy 1, policy_version 68200 (0.0009) +[2023-10-08 14:29:29,085][102897] Updated weights for policy 0, policy_version 68130 (0.0008) +[2023-10-08 14:29:29,168][102898] Updated weights for policy 1, policy_version 68210 (0.0009) +[2023-10-08 14:29:29,455][102897] Updated weights for policy 0, policy_version 68140 (0.0009) +[2023-10-08 14:29:29,534][102898] Updated weights for policy 1, policy_version 68220 (0.0009) +[2023-10-08 14:29:29,837][102897] Updated weights for policy 0, policy_version 68150 (0.0010) +[2023-10-08 14:29:30,197][102897] Updated weights for policy 0, policy_version 68160 (0.0008) +[2023-10-08 14:29:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 139657216. Throughput: 0: 1780.5, 1: 1762.5. Samples: 34924564. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:31,876][101941] Avg episode reward: [(0, '8.790'), (1, '9.080')] +[2023-10-08 14:29:33,471][102898] Updated weights for policy 1, policy_version 68230 (0.0008) +[2023-10-08 14:29:33,833][102898] Updated weights for policy 1, policy_version 68240 (0.0007) +[2023-10-08 14:29:34,011][102897] Updated weights for policy 0, policy_version 68170 (0.0009) +[2023-10-08 14:29:34,203][102898] Updated weights for policy 1, policy_version 68250 (0.0007) +[2023-10-08 14:29:34,391][102897] Updated weights for policy 0, policy_version 68180 (0.0009) +[2023-10-08 14:29:34,763][102897] Updated weights for policy 0, policy_version 68190 (0.0010) +[2023-10-08 14:29:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139722752. Throughput: 0: 1787.8, 1: 1762.3. Samples: 34934684. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:36,876][101941] Avg episode reward: [(0, '8.220'), (1, '9.540')] +[2023-10-08 14:29:37,947][102898] Updated weights for policy 1, policy_version 68260 (0.0009) +[2023-10-08 14:29:38,320][102898] Updated weights for policy 1, policy_version 68270 (0.0008) +[2023-10-08 14:29:38,467][102897] Updated weights for policy 0, policy_version 68200 (0.0009) +[2023-10-08 14:29:38,689][102898] Updated weights for policy 1, policy_version 68280 (0.0009) +[2023-10-08 14:29:38,830][102897] Updated weights for policy 0, policy_version 68210 (0.0008) +[2023-10-08 14:29:39,200][102897] Updated weights for policy 0, policy_version 68220 (0.0008) +[2023-10-08 14:29:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139788288. Throughput: 0: 1772.4, 1: 1766.0. Samples: 34956350. Policy #0 lag: (min: 31.0, avg: 38.7, max: 63.0) +[2023-10-08 14:29:41,876][101941] Avg episode reward: [(0, '8.350'), (1, '9.280')] +[2023-10-08 14:29:42,450][102898] Updated weights for policy 1, policy_version 68290 (0.0007) +[2023-10-08 14:29:42,814][102898] Updated weights for policy 1, policy_version 68300 (0.0007) +[2023-10-08 14:29:42,997][102897] Updated weights for policy 0, policy_version 68230 (0.0009) +[2023-10-08 14:29:43,180][102898] Updated weights for policy 1, policy_version 68310 (0.0007) +[2023-10-08 14:29:43,361][102897] Updated weights for policy 0, policy_version 68240 (0.0007) +[2023-10-08 14:29:43,539][102898] Updated weights for policy 1, policy_version 68320 (0.0009) +[2023-10-08 14:29:43,733][102897] Updated weights for policy 0, policy_version 68250 (0.0007) +[2023-10-08 14:29:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139853824. Throughput: 0: 1773.7, 1: 1787.9. Samples: 34978720. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:29:46,875][101941] Avg episode reward: [(0, '8.090'), (1, '9.010')] +[2023-10-08 14:29:47,089][102898] Updated weights for policy 1, policy_version 68330 (0.0010) +[2023-10-08 14:29:47,453][102898] Updated weights for policy 1, policy_version 68340 (0.0010) +[2023-10-08 14:29:47,569][102897] Updated weights for policy 0, policy_version 68260 (0.0008) +[2023-10-08 14:29:47,823][102898] Updated weights for policy 1, policy_version 68350 (0.0009) +[2023-10-08 14:29:47,936][102897] Updated weights for policy 0, policy_version 68270 (0.0007) +[2023-10-08 14:29:48,303][102897] Updated weights for policy 0, policy_version 68280 (0.0009) +[2023-10-08 14:29:51,598][102898] Updated weights for policy 1, policy_version 68360 (0.0007) +[2023-10-08 14:29:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 139919360. Throughput: 0: 1773.1, 1: 1772.0. Samples: 34988490. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:29:51,876][101941] Avg episode reward: [(0, '6.960'), (1, '9.030')] +[2023-10-08 14:29:51,965][102898] Updated weights for policy 1, policy_version 68370 (0.0008) +[2023-10-08 14:29:51,970][102897] Updated weights for policy 0, policy_version 68290 (0.0008) +[2023-10-08 14:29:52,334][102898] Updated weights for policy 1, policy_version 68380 (0.0009) +[2023-10-08 14:29:52,335][102897] Updated weights for policy 0, policy_version 68300 (0.0008) +[2023-10-08 14:29:52,709][102897] Updated weights for policy 0, policy_version 68310 (0.0008) +[2023-10-08 14:29:53,073][102897] Updated weights for policy 0, policy_version 68320 (0.0008) +[2023-10-08 14:29:56,356][102898] Updated weights for policy 1, policy_version 68390 (0.0009) +[2023-10-08 14:29:56,714][102898] Updated weights for policy 1, policy_version 68400 (0.0007) +[2023-10-08 14:29:56,873][102897] Updated weights for policy 0, policy_version 68330 (0.0007) +[2023-10-08 14:29:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 139984896. Throughput: 0: 1770.2, 1: 1779.1. Samples: 35010492. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:29:56,876][101941] Avg episode reward: [(0, '7.590'), (1, '9.030')] +[2023-10-08 14:29:57,087][102898] Updated weights for policy 1, policy_version 68410 (0.0007) +[2023-10-08 14:29:57,244][102897] Updated weights for policy 0, policy_version 68340 (0.0007) +[2023-10-08 14:29:57,611][102897] Updated weights for policy 0, policy_version 68350 (0.0011) +[2023-10-08 14:30:00,783][102898] Updated weights for policy 1, policy_version 68420 (0.0008) +[2023-10-08 14:30:01,154][102898] Updated weights for policy 1, policy_version 68430 (0.0010) +[2023-10-08 14:30:01,507][102898] Updated weights for policy 1, policy_version 68440 (0.0007) +[2023-10-08 14:30:01,636][102897] Updated weights for policy 0, policy_version 68360 (0.0007) +[2023-10-08 14:30:01,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 140083200. Throughput: 0: 1796.7, 1: 1782.7. Samples: 35031580. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:30:01,875][101941] Avg episode reward: [(0, '8.050'), (1, '8.930')] +[2023-10-08 14:30:02,002][102897] Updated weights for policy 0, policy_version 68370 (0.0007) +[2023-10-08 14:30:02,377][102897] Updated weights for policy 0, policy_version 68380 (0.0008) +[2023-10-08 14:30:05,258][102898] Updated weights for policy 1, policy_version 68450 (0.0008) +[2023-10-08 14:30:05,629][102898] Updated weights for policy 1, policy_version 68460 (0.0008) +[2023-10-08 14:30:05,986][102898] Updated weights for policy 1, policy_version 68470 (0.0008) +[2023-10-08 14:30:06,026][102897] Updated weights for policy 0, policy_version 68390 (0.0008) +[2023-10-08 14:30:06,350][102898] Updated weights for policy 1, policy_version 68480 (0.0007) +[2023-10-08 14:30:06,401][102897] Updated weights for policy 0, policy_version 68400 (0.0008) +[2023-10-08 14:30:06,766][102897] Updated weights for policy 0, policy_version 68410 (0.0010) +[2023-10-08 14:30:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 140148736. Throughput: 0: 1762.5, 1: 1776.9. Samples: 35042416. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:30:06,876][101941] Avg episode reward: [(0, '7.520'), (1, '8.960')] +[2023-10-08 14:30:10,108][102898] Updated weights for policy 1, policy_version 68490 (0.0010) +[2023-10-08 14:30:10,469][102898] Updated weights for policy 1, policy_version 68500 (0.0009) +[2023-10-08 14:30:10,560][102897] Updated weights for policy 0, policy_version 68420 (0.0008) +[2023-10-08 14:30:10,830][102898] Updated weights for policy 1, policy_version 68510 (0.0007) +[2023-10-08 14:30:10,931][102897] Updated weights for policy 0, policy_version 68430 (0.0008) +[2023-10-08 14:30:11,303][102897] Updated weights for policy 0, policy_version 68440 (0.0008) +[2023-10-08 14:30:11,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 140247040. Throughput: 0: 1801.0, 1: 1789.0. Samples: 35064176. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:30:11,876][101941] Avg episode reward: [(0, '7.590'), (1, '8.670')] +[2023-10-08 14:30:14,591][102898] Updated weights for policy 1, policy_version 68520 (0.0008) +[2023-10-08 14:30:14,965][102898] Updated weights for policy 1, policy_version 68530 (0.0007) +[2023-10-08 14:30:15,106][102897] Updated weights for policy 0, policy_version 68450 (0.0009) +[2023-10-08 14:30:15,334][102898] Updated weights for policy 1, policy_version 68540 (0.0009) +[2023-10-08 14:30:15,476][102897] Updated weights for policy 0, policy_version 68460 (0.0007) +[2023-10-08 14:30:15,854][102897] Updated weights for policy 0, policy_version 68470 (0.0009) +[2023-10-08 14:30:16,223][102897] Updated weights for policy 0, policy_version 68480 (0.0010) +[2023-10-08 14:30:16,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 140312576. Throughput: 0: 1774.1, 1: 1782.3. Samples: 35084600. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:30:16,875][101941] Avg episode reward: [(0, '8.010'), (1, '9.010')] +[2023-10-08 14:30:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000068480_70123520.pth... +[2023-10-08 14:30:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000068544_70189056.pth... +[2023-10-08 14:30:16,918][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000066880_68485120.pth +[2023-10-08 14:30:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000066816_68419584.pth +[2023-10-08 14:30:19,045][102898] Updated weights for policy 1, policy_version 68550 (0.0010) +[2023-10-08 14:30:19,410][102898] Updated weights for policy 1, policy_version 68560 (0.0009) +[2023-10-08 14:30:19,775][102898] Updated weights for policy 1, policy_version 68570 (0.0009) +[2023-10-08 14:30:19,971][102897] Updated weights for policy 0, policy_version 68490 (0.0007) +[2023-10-08 14:30:20,336][102897] Updated weights for policy 0, policy_version 68500 (0.0009) +[2023-10-08 14:30:20,706][102897] Updated weights for policy 0, policy_version 68510 (0.0010) +[2023-10-08 14:30:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 140378112. Throughput: 0: 1798.0, 1: 1798.5. Samples: 35096530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:30:21,876][101941] Avg episode reward: [(0, '7.950'), (1, '8.720')] +[2023-10-08 14:30:23,644][102898] Updated weights for policy 1, policy_version 68580 (0.0009) +[2023-10-08 14:30:24,013][102898] Updated weights for policy 1, policy_version 68590 (0.0009) +[2023-10-08 14:30:24,382][102898] Updated weights for policy 1, policy_version 68600 (0.0008) +[2023-10-08 14:30:24,496][102897] Updated weights for policy 0, policy_version 68520 (0.0008) +[2023-10-08 14:30:24,868][102897] Updated weights for policy 0, policy_version 68530 (0.0007) +[2023-10-08 14:30:25,238][102897] Updated weights for policy 0, policy_version 68540 (0.0008) +[2023-10-08 14:30:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 140443648. Throughput: 0: 1784.7, 1: 1779.9. Samples: 35116758. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:30:26,876][101941] Avg episode reward: [(0, '7.980'), (1, '8.780')] +[2023-10-08 14:30:28,277][102898] Updated weights for policy 1, policy_version 68610 (0.0007) +[2023-10-08 14:30:28,639][102898] Updated weights for policy 1, policy_version 68620 (0.0007) +[2023-10-08 14:30:29,001][102898] Updated weights for policy 1, policy_version 68630 (0.0008) +[2023-10-08 14:30:29,038][102897] Updated weights for policy 0, policy_version 68550 (0.0007) +[2023-10-08 14:30:29,371][102898] Updated weights for policy 1, policy_version 68640 (0.0007) +[2023-10-08 14:30:29,406][102897] Updated weights for policy 0, policy_version 68560 (0.0009) +[2023-10-08 14:30:29,774][102897] Updated weights for policy 0, policy_version 68570 (0.0008) +[2023-10-08 14:30:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 140509184. Throughput: 0: 1782.7, 1: 1776.0. Samples: 35138860. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:30:31,876][101941] Avg episode reward: [(0, '8.090'), (1, '9.270')] +[2023-10-08 14:30:33,247][102898] Updated weights for policy 1, policy_version 68650 (0.0008) +[2023-10-08 14:30:33,526][102897] Updated weights for policy 0, policy_version 68580 (0.0009) +[2023-10-08 14:30:33,602][102898] Updated weights for policy 1, policy_version 68660 (0.0007) +[2023-10-08 14:30:33,890][102897] Updated weights for policy 0, policy_version 68590 (0.0009) +[2023-10-08 14:30:33,966][102898] Updated weights for policy 1, policy_version 68670 (0.0009) +[2023-10-08 14:30:34,261][102897] Updated weights for policy 0, policy_version 68600 (0.0008) +[2023-10-08 14:30:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 140574720. Throughput: 0: 1791.9, 1: 1773.8. Samples: 35148946. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:30:36,876][101941] Avg episode reward: [(0, '8.280'), (1, '9.280')] +[2023-10-08 14:30:37,742][102898] Updated weights for policy 1, policy_version 68680 (0.0008) +[2023-10-08 14:30:38,092][102897] Updated weights for policy 0, policy_version 68610 (0.0007) +[2023-10-08 14:30:38,119][102898] Updated weights for policy 1, policy_version 68690 (0.0008) +[2023-10-08 14:30:38,458][102897] Updated weights for policy 0, policy_version 68620 (0.0007) +[2023-10-08 14:30:38,479][102898] Updated weights for policy 1, policy_version 68700 (0.0007) +[2023-10-08 14:30:38,833][102897] Updated weights for policy 0, policy_version 68630 (0.0009) +[2023-10-08 14:30:39,200][102897] Updated weights for policy 0, policy_version 68640 (0.0007) +[2023-10-08 14:30:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 140640256. Throughput: 0: 1791.6, 1: 1773.2. Samples: 35170908. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:30:41,875][101941] Avg episode reward: [(0, '8.320'), (1, '9.080')] +[2023-10-08 14:30:42,375][102898] Updated weights for policy 1, policy_version 68710 (0.0008) +[2023-10-08 14:30:42,748][102898] Updated weights for policy 1, policy_version 68720 (0.0010) +[2023-10-08 14:30:43,092][102897] Updated weights for policy 0, policy_version 68650 (0.0008) +[2023-10-08 14:30:43,122][102898] Updated weights for policy 1, policy_version 68730 (0.0008) +[2023-10-08 14:30:43,449][102897] Updated weights for policy 0, policy_version 68660 (0.0007) +[2023-10-08 14:30:43,813][102897] Updated weights for policy 0, policy_version 68670 (0.0009) +[2023-10-08 14:30:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 140705792. Throughput: 0: 1798.0, 1: 1790.9. Samples: 35193078. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:30:46,875][101941] Avg episode reward: [(0, '8.090'), (1, '8.730')] +[2023-10-08 14:30:46,879][102898] Updated weights for policy 1, policy_version 68740 (0.0009) +[2023-10-08 14:30:47,252][102898] Updated weights for policy 1, policy_version 68750 (0.0009) +[2023-10-08 14:30:47,532][102897] Updated weights for policy 0, policy_version 68680 (0.0007) +[2023-10-08 14:30:47,611][102898] Updated weights for policy 1, policy_version 68760 (0.0007) +[2023-10-08 14:30:47,899][102897] Updated weights for policy 0, policy_version 68690 (0.0010) +[2023-10-08 14:30:48,263][102897] Updated weights for policy 0, policy_version 68700 (0.0008) +[2023-10-08 14:30:51,395][102898] Updated weights for policy 1, policy_version 68770 (0.0008) +[2023-10-08 14:30:51,765][102898] Updated weights for policy 1, policy_version 68780 (0.0008) +[2023-10-08 14:30:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 140771328. Throughput: 0: 1793.9, 1: 1769.6. Samples: 35202770. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:30:51,875][101941] Avg episode reward: [(0, '7.580'), (1, '9.580')] +[2023-10-08 14:30:52,139][102898] Updated weights for policy 1, policy_version 68790 (0.0009) +[2023-10-08 14:30:52,171][102897] Updated weights for policy 0, policy_version 68710 (0.0008) +[2023-10-08 14:30:52,494][102898] Updated weights for policy 1, policy_version 68800 (0.0008) +[2023-10-08 14:30:52,540][102897] Updated weights for policy 0, policy_version 68720 (0.0008) +[2023-10-08 14:30:52,915][102897] Updated weights for policy 0, policy_version 68730 (0.0007) +[2023-10-08 14:30:56,447][102898] Updated weights for policy 1, policy_version 68810 (0.0009) +[2023-10-08 14:30:56,682][102897] Updated weights for policy 0, policy_version 68740 (0.0008) +[2023-10-08 14:30:56,815][102898] Updated weights for policy 1, policy_version 68820 (0.0008) +[2023-10-08 14:30:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 140836864. Throughput: 0: 1785.7, 1: 1787.6. Samples: 35224974. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:30:56,875][101941] Avg episode reward: [(0, '7.870'), (1, '9.780')] +[2023-10-08 14:30:57,041][102897] Updated weights for policy 0, policy_version 68750 (0.0007) +[2023-10-08 14:30:57,173][102898] Updated weights for policy 1, policy_version 68830 (0.0007) +[2023-10-08 14:30:57,415][102897] Updated weights for policy 0, policy_version 68760 (0.0007) +[2023-10-08 14:31:00,875][102898] Updated weights for policy 1, policy_version 68840 (0.0010) +[2023-10-08 14:31:01,237][102898] Updated weights for policy 1, policy_version 68850 (0.0008) +[2023-10-08 14:31:01,274][102897] Updated weights for policy 0, policy_version 68770 (0.0007) +[2023-10-08 14:31:01,600][102898] Updated weights for policy 1, policy_version 68860 (0.0007) +[2023-10-08 14:31:01,642][102897] Updated weights for policy 0, policy_version 68780 (0.0008) +[2023-10-08 14:31:01,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 140935168. Throughput: 0: 1806.9, 1: 1774.2. Samples: 35245748. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:31:01,876][101941] Avg episode reward: [(0, '7.750'), (1, '8.940')] +[2023-10-08 14:31:02,003][102897] Updated weights for policy 0, policy_version 68790 (0.0010) +[2023-10-08 14:31:02,373][102897] Updated weights for policy 0, policy_version 68800 (0.0010) +[2023-10-08 14:31:05,375][102898] Updated weights for policy 1, policy_version 68870 (0.0009) +[2023-10-08 14:31:05,748][102898] Updated weights for policy 1, policy_version 68880 (0.0009) +[2023-10-08 14:31:05,978][102897] Updated weights for policy 0, policy_version 68810 (0.0008) +[2023-10-08 14:31:06,105][102898] Updated weights for policy 1, policy_version 68890 (0.0007) +[2023-10-08 14:31:06,342][102897] Updated weights for policy 0, policy_version 68820 (0.0007) +[2023-10-08 14:31:06,721][102897] Updated weights for policy 0, policy_version 68830 (0.0008) +[2023-10-08 14:31:06,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 141033472. Throughput: 0: 1779.9, 1: 1781.7. Samples: 35256802. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:31:06,876][101941] Avg episode reward: [(0, '8.900'), (1, '8.960')] +[2023-10-08 14:31:09,793][102898] Updated weights for policy 1, policy_version 68900 (0.0007) +[2023-10-08 14:31:10,157][102898] Updated weights for policy 1, policy_version 68910 (0.0008) +[2023-10-08 14:31:10,522][102898] Updated weights for policy 1, policy_version 68920 (0.0009) +[2023-10-08 14:31:10,648][102897] Updated weights for policy 0, policy_version 68840 (0.0007) +[2023-10-08 14:31:11,026][102897] Updated weights for policy 0, policy_version 68850 (0.0008) +[2023-10-08 14:31:11,394][102897] Updated weights for policy 0, policy_version 68860 (0.0010) +[2023-10-08 14:31:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 141099008. Throughput: 0: 1801.7, 1: 1779.7. Samples: 35277924. Policy #0 lag: (min: 28.0, avg: 28.0, max: 28.0) +[2023-10-08 14:31:11,876][101941] Avg episode reward: [(0, '8.350'), (1, '9.530')] +[2023-10-08 14:31:14,307][102898] Updated weights for policy 1, policy_version 68930 (0.0009) +[2023-10-08 14:31:14,674][102898] Updated weights for policy 1, policy_version 68940 (0.0008) +[2023-10-08 14:31:14,914][102897] Updated weights for policy 0, policy_version 68870 (0.0008) +[2023-10-08 14:31:15,048][102898] Updated weights for policy 1, policy_version 68950 (0.0009) +[2023-10-08 14:31:15,282][102897] Updated weights for policy 0, policy_version 68880 (0.0007) +[2023-10-08 14:31:15,413][102898] Updated weights for policy 1, policy_version 68960 (0.0007) +[2023-10-08 14:31:15,653][102897] Updated weights for policy 0, policy_version 68890 (0.0008) +[2023-10-08 14:31:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 141164544. Throughput: 0: 1777.1, 1: 1773.6. Samples: 35298642. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:16,876][101941] Avg episode reward: [(0, '7.610'), (1, '9.840')] +[2023-10-08 14:31:19,164][102898] Updated weights for policy 1, policy_version 68970 (0.0009) +[2023-10-08 14:31:19,360][102897] Updated weights for policy 0, policy_version 68900 (0.0007) +[2023-10-08 14:31:19,535][102898] Updated weights for policy 1, policy_version 68980 (0.0007) +[2023-10-08 14:31:19,735][102897] Updated weights for policy 0, policy_version 68910 (0.0008) +[2023-10-08 14:31:19,895][102898] Updated weights for policy 1, policy_version 68990 (0.0008) +[2023-10-08 14:31:20,099][102897] Updated weights for policy 0, policy_version 68920 (0.0007) +[2023-10-08 14:31:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 141230080. Throughput: 0: 1797.7, 1: 1786.1. Samples: 35310212. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:21,875][101941] Avg episode reward: [(0, '8.240'), (1, '8.820')] +[2023-10-08 14:31:23,715][102898] Updated weights for policy 1, policy_version 69000 (0.0009) +[2023-10-08 14:31:23,921][102897] Updated weights for policy 0, policy_version 68930 (0.0007) +[2023-10-08 14:31:24,083][102898] Updated weights for policy 1, policy_version 69010 (0.0007) +[2023-10-08 14:31:24,279][102897] Updated weights for policy 0, policy_version 68940 (0.0007) +[2023-10-08 14:31:24,447][102898] Updated weights for policy 1, policy_version 69020 (0.0007) +[2023-10-08 14:31:24,657][102897] Updated weights for policy 0, policy_version 68950 (0.0007) +[2023-10-08 14:31:25,023][102897] Updated weights for policy 0, policy_version 68960 (0.0008) +[2023-10-08 14:31:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 141295616. Throughput: 0: 1770.0, 1: 1773.7. Samples: 35330376. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:26,876][101941] Avg episode reward: [(0, '8.240'), (1, '7.970')] +[2023-10-08 14:31:28,373][102898] Updated weights for policy 1, policy_version 69030 (0.0009) +[2023-10-08 14:31:28,756][102898] Updated weights for policy 1, policy_version 69040 (0.0009) +[2023-10-08 14:31:28,842][102897] Updated weights for policy 0, policy_version 68970 (0.0007) +[2023-10-08 14:31:29,124][102898] Updated weights for policy 1, policy_version 69050 (0.0010) +[2023-10-08 14:31:29,214][102897] Updated weights for policy 0, policy_version 68980 (0.0007) +[2023-10-08 14:31:29,581][102897] Updated weights for policy 0, policy_version 68990 (0.0007) +[2023-10-08 14:31:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 141361152. Throughput: 0: 1766.9, 1: 1771.7. Samples: 35352316. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:31,876][101941] Avg episode reward: [(0, '8.480'), (1, '8.800')] +[2023-10-08 14:31:32,901][102898] Updated weights for policy 1, policy_version 69060 (0.0010) +[2023-10-08 14:31:33,257][102898] Updated weights for policy 1, policy_version 69070 (0.0009) +[2023-10-08 14:31:33,374][102897] Updated weights for policy 0, policy_version 69000 (0.0007) +[2023-10-08 14:31:33,619][102898] Updated weights for policy 1, policy_version 69080 (0.0008) +[2023-10-08 14:31:33,751][102897] Updated weights for policy 0, policy_version 69010 (0.0007) +[2023-10-08 14:31:34,119][102897] Updated weights for policy 0, policy_version 69020 (0.0009) +[2023-10-08 14:31:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 141426688. Throughput: 0: 1770.6, 1: 1769.4. Samples: 35362070. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:36,876][101941] Avg episode reward: [(0, '8.620'), (1, '10.030')] +[2023-10-08 14:31:37,555][102898] Updated weights for policy 1, policy_version 69090 (0.0009) +[2023-10-08 14:31:37,786][102897] Updated weights for policy 0, policy_version 69030 (0.0008) +[2023-10-08 14:31:37,913][102898] Updated weights for policy 1, policy_version 69100 (0.0008) +[2023-10-08 14:31:38,158][102897] Updated weights for policy 0, policy_version 69040 (0.0008) +[2023-10-08 14:31:38,285][102898] Updated weights for policy 1, policy_version 69110 (0.0009) +[2023-10-08 14:31:38,530][102897] Updated weights for policy 0, policy_version 69050 (0.0007) +[2023-10-08 14:31:38,643][102898] Updated weights for policy 1, policy_version 69120 (0.0009) +[2023-10-08 14:31:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 141492224. Throughput: 0: 1775.0, 1: 1768.2. Samples: 35384418. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:41,876][101941] Avg episode reward: [(0, '8.630'), (1, '9.340')] +[2023-10-08 14:31:42,389][102897] Updated weights for policy 0, policy_version 69060 (0.0007) +[2023-10-08 14:31:42,504][102898] Updated weights for policy 1, policy_version 69130 (0.0007) +[2023-10-08 14:31:42,758][102897] Updated weights for policy 0, policy_version 69070 (0.0008) +[2023-10-08 14:31:42,867][102898] Updated weights for policy 1, policy_version 69140 (0.0007) +[2023-10-08 14:31:43,134][102897] Updated weights for policy 0, policy_version 69080 (0.0007) +[2023-10-08 14:31:43,227][102898] Updated weights for policy 1, policy_version 69150 (0.0007) +[2023-10-08 14:31:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 141557760. Throughput: 0: 1778.4, 1: 1790.8. Samples: 35406358. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:46,875][101941] Avg episode reward: [(0, '7.760'), (1, '8.590')] +[2023-10-08 14:31:46,984][102897] Updated weights for policy 0, policy_version 69090 (0.0009) +[2023-10-08 14:31:47,032][102898] Updated weights for policy 1, policy_version 69160 (0.0007) +[2023-10-08 14:31:47,352][102897] Updated weights for policy 0, policy_version 69100 (0.0007) +[2023-10-08 14:31:47,399][102898] Updated weights for policy 1, policy_version 69170 (0.0007) +[2023-10-08 14:31:47,720][102897] Updated weights for policy 0, policy_version 69110 (0.0009) +[2023-10-08 14:31:47,761][102898] Updated weights for policy 1, policy_version 69180 (0.0008) +[2023-10-08 14:31:48,087][102897] Updated weights for policy 0, policy_version 69120 (0.0009) +[2023-10-08 14:31:51,558][102898] Updated weights for policy 1, policy_version 69190 (0.0008) +[2023-10-08 14:31:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 141623296. Throughput: 0: 1769.5, 1: 1767.5. Samples: 35415966. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:51,875][101941] Avg episode reward: [(0, '8.390'), (1, '9.120')] +[2023-10-08 14:31:51,923][102898] Updated weights for policy 1, policy_version 69200 (0.0007) +[2023-10-08 14:31:51,958][102897] Updated weights for policy 0, policy_version 69130 (0.0008) +[2023-10-08 14:31:52,293][102898] Updated weights for policy 1, policy_version 69210 (0.0007) +[2023-10-08 14:31:52,324][102897] Updated weights for policy 0, policy_version 69140 (0.0009) +[2023-10-08 14:31:52,691][102897] Updated weights for policy 0, policy_version 69150 (0.0008) +[2023-10-08 14:31:56,084][102898] Updated weights for policy 1, policy_version 69220 (0.0008) +[2023-10-08 14:31:56,403][102897] Updated weights for policy 0, policy_version 69160 (0.0008) +[2023-10-08 14:31:56,444][102898] Updated weights for policy 1, policy_version 69230 (0.0008) +[2023-10-08 14:31:56,771][102897] Updated weights for policy 0, policy_version 69170 (0.0008) +[2023-10-08 14:31:56,811][102898] Updated weights for policy 1, policy_version 69240 (0.0008) +[2023-10-08 14:31:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 141688832. Throughput: 0: 1777.5, 1: 1785.1. Samples: 35438240. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:31:56,876][101941] Avg episode reward: [(0, '8.800'), (1, '9.520')] +[2023-10-08 14:31:57,132][102897] Updated weights for policy 0, policy_version 69180 (0.0008) +[2023-10-08 14:32:00,577][102898] Updated weights for policy 1, policy_version 69250 (0.0009) +[2023-10-08 14:32:00,954][102898] Updated weights for policy 1, policy_version 69260 (0.0009) +[2023-10-08 14:32:00,955][102897] Updated weights for policy 0, policy_version 69190 (0.0008) +[2023-10-08 14:32:01,319][102897] Updated weights for policy 0, policy_version 69200 (0.0010) +[2023-10-08 14:32:01,322][102898] Updated weights for policy 1, policy_version 69270 (0.0008) +[2023-10-08 14:32:01,682][102898] Updated weights for policy 1, policy_version 69280 (0.0007) +[2023-10-08 14:32:01,699][102897] Updated weights for policy 0, policy_version 69210 (0.0008) +[2023-10-08 14:32:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 141787136. Throughput: 0: 1782.7, 1: 1768.5. Samples: 35458446. Policy #0 lag: (min: 31.0, avg: 38.2, max: 63.0) +[2023-10-08 14:32:01,876][101941] Avg episode reward: [(0, '8.640'), (1, '10.100')] +[2023-10-08 14:32:05,420][102898] Updated weights for policy 1, policy_version 69290 (0.0008) +[2023-10-08 14:32:05,588][102897] Updated weights for policy 0, policy_version 69220 (0.0009) +[2023-10-08 14:32:05,783][102898] Updated weights for policy 1, policy_version 69300 (0.0008) +[2023-10-08 14:32:05,964][102897] Updated weights for policy 0, policy_version 69230 (0.0008) +[2023-10-08 14:32:06,150][102898] Updated weights for policy 1, policy_version 69310 (0.0008) +[2023-10-08 14:32:06,330][102897] Updated weights for policy 0, policy_version 69240 (0.0007) +[2023-10-08 14:32:06,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 141885440. Throughput: 0: 1770.6, 1: 1782.6. Samples: 35470106. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:06,876][101941] Avg episode reward: [(0, '8.450'), (1, '10.030')] +[2023-10-08 14:32:09,990][102898] Updated weights for policy 1, policy_version 69320 (0.0008) +[2023-10-08 14:32:10,120][102897] Updated weights for policy 0, policy_version 69250 (0.0008) +[2023-10-08 14:32:10,353][102898] Updated weights for policy 1, policy_version 69330 (0.0008) +[2023-10-08 14:32:10,492][102897] Updated weights for policy 0, policy_version 69260 (0.0008) +[2023-10-08 14:32:10,714][102898] Updated weights for policy 1, policy_version 69340 (0.0007) +[2023-10-08 14:32:10,865][102897] Updated weights for policy 0, policy_version 69270 (0.0009) +[2023-10-08 14:32:11,232][102897] Updated weights for policy 0, policy_version 69280 (0.0008) +[2023-10-08 14:32:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 141950976. Throughput: 0: 1788.5, 1: 1786.2. Samples: 35491240. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:11,876][101941] Avg episode reward: [(0, '8.480'), (1, '9.090')] +[2023-10-08 14:32:14,437][102898] Updated weights for policy 1, policy_version 69350 (0.0009) +[2023-10-08 14:32:14,816][102898] Updated weights for policy 1, policy_version 69360 (0.0007) +[2023-10-08 14:32:14,986][102897] Updated weights for policy 0, policy_version 69290 (0.0008) +[2023-10-08 14:32:15,182][102898] Updated weights for policy 1, policy_version 69370 (0.0007) +[2023-10-08 14:32:15,344][102897] Updated weights for policy 0, policy_version 69300 (0.0009) +[2023-10-08 14:32:15,714][102897] Updated weights for policy 0, policy_version 69310 (0.0009) +[2023-10-08 14:32:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 142016512. Throughput: 0: 1771.7, 1: 1775.4. Samples: 35511938. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:16,876][101941] Avg episode reward: [(0, '8.490'), (1, '8.320')] +[2023-10-08 14:32:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000069376_71041024.pth... +[2023-10-08 14:32:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000069312_70975488.pth... +[2023-10-08 14:32:16,919][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000067648_69271552.pth +[2023-10-08 14:32:16,927][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000067712_69337088.pth +[2023-10-08 14:32:18,807][102898] Updated weights for policy 1, policy_version 69380 (0.0008) +[2023-10-08 14:32:19,179][102898] Updated weights for policy 1, policy_version 69390 (0.0010) +[2023-10-08 14:32:19,540][102898] Updated weights for policy 1, policy_version 69400 (0.0007) +[2023-10-08 14:32:19,628][102897] Updated weights for policy 0, policy_version 69320 (0.0009) +[2023-10-08 14:32:20,002][102897] Updated weights for policy 0, policy_version 69330 (0.0008) +[2023-10-08 14:32:20,377][102897] Updated weights for policy 0, policy_version 69340 (0.0009) +[2023-10-08 14:32:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142082048. Throughput: 0: 1794.5, 1: 1795.7. Samples: 35523626. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:21,876][101941] Avg episode reward: [(0, '8.320'), (1, '8.950')] +[2023-10-08 14:32:23,320][102898] Updated weights for policy 1, policy_version 69410 (0.0007) +[2023-10-08 14:32:23,686][102898] Updated weights for policy 1, policy_version 69420 (0.0008) +[2023-10-08 14:32:24,060][102898] Updated weights for policy 1, policy_version 69430 (0.0010) +[2023-10-08 14:32:24,125][102897] Updated weights for policy 0, policy_version 69350 (0.0009) +[2023-10-08 14:32:24,423][102898] Updated weights for policy 1, policy_version 69440 (0.0007) +[2023-10-08 14:32:24,504][102897] Updated weights for policy 0, policy_version 69360 (0.0007) +[2023-10-08 14:32:24,873][102897] Updated weights for policy 0, policy_version 69370 (0.0009) +[2023-10-08 14:32:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 142147584. Throughput: 0: 1759.3, 1: 1786.1. Samples: 35543962. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:26,876][101941] Avg episode reward: [(0, '7.560'), (1, '9.580')] +[2023-10-08 14:32:28,247][102898] Updated weights for policy 1, policy_version 69450 (0.0007) +[2023-10-08 14:32:28,616][102898] Updated weights for policy 1, policy_version 69460 (0.0007) +[2023-10-08 14:32:28,617][102897] Updated weights for policy 0, policy_version 69380 (0.0008) +[2023-10-08 14:32:28,980][102898] Updated weights for policy 1, policy_version 69470 (0.0007) +[2023-10-08 14:32:28,985][102897] Updated weights for policy 0, policy_version 69390 (0.0009) +[2023-10-08 14:32:29,354][102897] Updated weights for policy 0, policy_version 69400 (0.0010) +[2023-10-08 14:32:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142213120. Throughput: 0: 1761.2, 1: 1786.0. Samples: 35565984. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:31,876][101941] Avg episode reward: [(0, '8.270'), (1, '10.010')] +[2023-10-08 14:32:32,723][102898] Updated weights for policy 1, policy_version 69480 (0.0009) +[2023-10-08 14:32:33,091][102898] Updated weights for policy 1, policy_version 69490 (0.0007) +[2023-10-08 14:32:33,157][102897] Updated weights for policy 0, policy_version 69410 (0.0009) +[2023-10-08 14:32:33,462][102898] Updated weights for policy 1, policy_version 69500 (0.0008) +[2023-10-08 14:32:33,538][102897] Updated weights for policy 0, policy_version 69420 (0.0007) +[2023-10-08 14:32:33,908][102897] Updated weights for policy 0, policy_version 69430 (0.0007) +[2023-10-08 14:32:34,273][102897] Updated weights for policy 0, policy_version 69440 (0.0008) +[2023-10-08 14:32:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142278656. Throughput: 0: 1765.1, 1: 1785.6. Samples: 35575746. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:36,876][101941] Avg episode reward: [(0, '8.330'), (1, '9.430')] +[2023-10-08 14:32:37,221][102898] Updated weights for policy 1, policy_version 69510 (0.0008) +[2023-10-08 14:32:37,601][102898] Updated weights for policy 1, policy_version 69520 (0.0009) +[2023-10-08 14:32:37,960][102898] Updated weights for policy 1, policy_version 69530 (0.0009) +[2023-10-08 14:32:38,073][102897] Updated weights for policy 0, policy_version 69450 (0.0007) +[2023-10-08 14:32:38,444][102897] Updated weights for policy 0, policy_version 69460 (0.0008) +[2023-10-08 14:32:38,823][102897] Updated weights for policy 0, policy_version 69470 (0.0008) +[2023-10-08 14:32:41,729][102898] Updated weights for policy 1, policy_version 69540 (0.0009) +[2023-10-08 14:32:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142344192. Throughput: 0: 1760.1, 1: 1787.6. Samples: 35597888. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:41,876][101941] Avg episode reward: [(0, '8.620'), (1, '9.690')] +[2023-10-08 14:32:42,090][102898] Updated weights for policy 1, policy_version 69550 (0.0009) +[2023-10-08 14:32:42,455][102898] Updated weights for policy 1, policy_version 69560 (0.0009) +[2023-10-08 14:32:42,704][102897] Updated weights for policy 0, policy_version 69480 (0.0008) +[2023-10-08 14:32:43,070][102897] Updated weights for policy 0, policy_version 69490 (0.0009) +[2023-10-08 14:32:43,447][102897] Updated weights for policy 0, policy_version 69500 (0.0009) +[2023-10-08 14:32:46,109][102898] Updated weights for policy 1, policy_version 69570 (0.0008) +[2023-10-08 14:32:46,478][102898] Updated weights for policy 1, policy_version 69580 (0.0007) +[2023-10-08 14:32:46,845][102898] Updated weights for policy 1, policy_version 69590 (0.0008) +[2023-10-08 14:32:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142409728. Throughput: 0: 1781.4, 1: 1805.1. Samples: 35619838. Policy #0 lag: (min: 24.0, avg: 52.5, max: 56.0) +[2023-10-08 14:32:46,875][101941] Avg episode reward: [(0, '8.570'), (1, '10.140')] +[2023-10-08 14:32:47,116][102897] Updated weights for policy 0, policy_version 69510 (0.0009) +[2023-10-08 14:32:47,211][102898] Updated weights for policy 1, policy_version 69600 (0.0008) +[2023-10-08 14:32:47,484][102897] Updated weights for policy 0, policy_version 69520 (0.0007) +[2023-10-08 14:32:47,865][102897] Updated weights for policy 0, policy_version 69530 (0.0009) +[2023-10-08 14:32:50,958][102898] Updated weights for policy 1, policy_version 69610 (0.0008) +[2023-10-08 14:32:51,324][102898] Updated weights for policy 1, policy_version 69620 (0.0010) +[2023-10-08 14:32:51,691][102898] Updated weights for policy 1, policy_version 69630 (0.0010) +[2023-10-08 14:32:51,723][102897] Updated weights for policy 0, policy_version 69540 (0.0008) +[2023-10-08 14:32:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 142508032. Throughput: 0: 1764.5, 1: 1792.4. Samples: 35630162. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:32:51,875][101941] Avg episode reward: [(0, '7.920'), (1, '10.190')] +[2023-10-08 14:32:52,083][102897] Updated weights for policy 0, policy_version 69550 (0.0007) +[2023-10-08 14:32:52,453][102897] Updated weights for policy 0, policy_version 69560 (0.0007) +[2023-10-08 14:32:55,453][102898] Updated weights for policy 1, policy_version 69640 (0.0009) +[2023-10-08 14:32:55,820][102898] Updated weights for policy 1, policy_version 69650 (0.0010) +[2023-10-08 14:32:56,119][102897] Updated weights for policy 0, policy_version 69570 (0.0007) +[2023-10-08 14:32:56,180][102898] Updated weights for policy 1, policy_version 69660 (0.0007) +[2023-10-08 14:32:56,487][102897] Updated weights for policy 0, policy_version 69580 (0.0008) +[2023-10-08 14:32:56,865][102897] Updated weights for policy 0, policy_version 69590 (0.0008) +[2023-10-08 14:32:56,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 142573568. Throughput: 0: 1777.2, 1: 1797.9. Samples: 35652118. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:32:56,876][101941] Avg episode reward: [(0, '7.770'), (1, '10.020')] +[2023-10-08 14:32:57,227][102897] Updated weights for policy 0, policy_version 69600 (0.0008) +[2023-10-08 14:32:59,980][102898] Updated weights for policy 1, policy_version 69670 (0.0007) +[2023-10-08 14:33:00,367][102898] Updated weights for policy 1, policy_version 69680 (0.0008) +[2023-10-08 14:33:00,737][102898] Updated weights for policy 1, policy_version 69690 (0.0007) +[2023-10-08 14:33:01,057][102897] Updated weights for policy 0, policy_version 69610 (0.0007) +[2023-10-08 14:33:01,424][102897] Updated weights for policy 0, policy_version 69620 (0.0008) +[2023-10-08 14:33:01,794][102897] Updated weights for policy 0, policy_version 69630 (0.0010) +[2023-10-08 14:33:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 142671872. Throughput: 0: 1777.8, 1: 1792.7. Samples: 35672610. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:01,876][101941] Avg episode reward: [(0, '7.490'), (1, '8.610')] +[2023-10-08 14:33:04,450][102898] Updated weights for policy 1, policy_version 69700 (0.0009) +[2023-10-08 14:33:04,818][102898] Updated weights for policy 1, policy_version 69710 (0.0008) +[2023-10-08 14:33:05,188][102898] Updated weights for policy 1, policy_version 69720 (0.0008) +[2023-10-08 14:33:05,631][102897] Updated weights for policy 0, policy_version 69640 (0.0009) +[2023-10-08 14:33:06,016][102897] Updated weights for policy 0, policy_version 69650 (0.0008) +[2023-10-08 14:33:06,394][102897] Updated weights for policy 0, policy_version 69660 (0.0009) +[2023-10-08 14:33:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 142737408. Throughput: 0: 1768.7, 1: 1801.1. Samples: 35684268. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:06,876][101941] Avg episode reward: [(0, '7.810'), (1, '8.830')] +[2023-10-08 14:33:08,750][102898] Updated weights for policy 1, policy_version 69730 (0.0010) +[2023-10-08 14:33:09,110][102898] Updated weights for policy 1, policy_version 69740 (0.0010) +[2023-10-08 14:33:09,480][102898] Updated weights for policy 1, policy_version 69750 (0.0008) +[2023-10-08 14:33:09,849][102898] Updated weights for policy 1, policy_version 69760 (0.0009) +[2023-10-08 14:33:10,169][102897] Updated weights for policy 0, policy_version 69670 (0.0008) +[2023-10-08 14:33:10,544][102897] Updated weights for policy 0, policy_version 69680 (0.0007) +[2023-10-08 14:33:10,922][102897] Updated weights for policy 0, policy_version 69690 (0.0008) +[2023-10-08 14:33:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 142802944. Throughput: 0: 1789.7, 1: 1786.5. Samples: 35704892. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:11,876][101941] Avg episode reward: [(0, '8.130'), (1, '9.450')] +[2023-10-08 14:33:13,676][102898] Updated weights for policy 1, policy_version 69770 (0.0010) +[2023-10-08 14:33:14,035][102898] Updated weights for policy 1, policy_version 69780 (0.0010) +[2023-10-08 14:33:14,397][102898] Updated weights for policy 1, policy_version 69790 (0.0010) +[2023-10-08 14:33:14,794][102897] Updated weights for policy 0, policy_version 69700 (0.0010) +[2023-10-08 14:33:15,164][102897] Updated weights for policy 0, policy_version 69710 (0.0008) +[2023-10-08 14:33:15,538][102897] Updated weights for policy 0, policy_version 69720 (0.0010) +[2023-10-08 14:33:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 142868480. Throughput: 0: 1773.7, 1: 1787.5. Samples: 35726242. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:16,876][101941] Avg episode reward: [(0, '7.890'), (1, '10.170')] +[2023-10-08 14:33:18,277][102898] Updated weights for policy 1, policy_version 69800 (0.0008) +[2023-10-08 14:33:18,635][102898] Updated weights for policy 1, policy_version 69810 (0.0008) +[2023-10-08 14:33:18,998][102898] Updated weights for policy 1, policy_version 69820 (0.0007) +[2023-10-08 14:33:19,296][102897] Updated weights for policy 0, policy_version 69730 (0.0008) +[2023-10-08 14:33:19,670][102897] Updated weights for policy 0, policy_version 69740 (0.0007) +[2023-10-08 14:33:20,039][102897] Updated weights for policy 0, policy_version 69750 (0.0010) +[2023-10-08 14:33:20,419][102897] Updated weights for policy 0, policy_version 69760 (0.0009) +[2023-10-08 14:33:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142934016. Throughput: 0: 1802.5, 1: 1785.1. Samples: 35737186. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:21,875][101941] Avg episode reward: [(0, '8.250'), (1, '8.790')] +[2023-10-08 14:33:22,746][102898] Updated weights for policy 1, policy_version 69830 (0.0010) +[2023-10-08 14:33:23,114][102898] Updated weights for policy 1, policy_version 69840 (0.0008) +[2023-10-08 14:33:23,477][102898] Updated weights for policy 1, policy_version 69850 (0.0009) +[2023-10-08 14:33:24,320][102897] Updated weights for policy 0, policy_version 69770 (0.0011) +[2023-10-08 14:33:24,698][102897] Updated weights for policy 0, policy_version 69780 (0.0010) +[2023-10-08 14:33:25,067][102897] Updated weights for policy 0, policy_version 69790 (0.0008) +[2023-10-08 14:33:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 142999552. Throughput: 0: 1771.6, 1: 1790.4. Samples: 35758180. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:26,876][101941] Avg episode reward: [(0, '8.260'), (1, '8.490')] +[2023-10-08 14:33:27,452][102898] Updated weights for policy 1, policy_version 69860 (0.0008) +[2023-10-08 14:33:27,821][102898] Updated weights for policy 1, policy_version 69870 (0.0008) +[2023-10-08 14:33:28,179][102898] Updated weights for policy 1, policy_version 69880 (0.0010) +[2023-10-08 14:33:28,773][102897] Updated weights for policy 0, policy_version 69800 (0.0007) +[2023-10-08 14:33:29,141][102897] Updated weights for policy 0, policy_version 69810 (0.0009) +[2023-10-08 14:33:29,516][102897] Updated weights for policy 0, policy_version 69820 (0.0007) +[2023-10-08 14:33:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143065088. Throughput: 0: 1774.9, 1: 1797.3. Samples: 35780588. Policy #0 lag: (min: 31.0, avg: 31.4, max: 45.0) +[2023-10-08 14:33:31,876][101941] Avg episode reward: [(0, '8.120'), (1, '8.440')] +[2023-10-08 14:33:31,985][102898] Updated weights for policy 1, policy_version 69890 (0.0009) +[2023-10-08 14:33:32,360][102898] Updated weights for policy 1, policy_version 69900 (0.0007) +[2023-10-08 14:33:32,723][102898] Updated weights for policy 1, policy_version 69910 (0.0007) +[2023-10-08 14:33:33,087][102898] Updated weights for policy 1, policy_version 69920 (0.0008) +[2023-10-08 14:33:33,245][102897] Updated weights for policy 0, policy_version 69830 (0.0007) +[2023-10-08 14:33:33,616][102897] Updated weights for policy 0, policy_version 69840 (0.0007) +[2023-10-08 14:33:33,987][102897] Updated weights for policy 0, policy_version 69850 (0.0007) +[2023-10-08 14:33:36,806][102898] Updated weights for policy 1, policy_version 69930 (0.0008) +[2023-10-08 14:33:36,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143130624. Throughput: 0: 1772.7, 1: 1783.5. Samples: 35790190. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:33:36,875][101941] Avg episode reward: [(0, '8.060'), (1, '8.580')] +[2023-10-08 14:33:37,175][102898] Updated weights for policy 1, policy_version 69940 (0.0008) +[2023-10-08 14:33:37,539][102898] Updated weights for policy 1, policy_version 69950 (0.0008) +[2023-10-08 14:33:37,684][102897] Updated weights for policy 0, policy_version 69860 (0.0008) +[2023-10-08 14:33:38,050][102897] Updated weights for policy 0, policy_version 69870 (0.0009) +[2023-10-08 14:33:38,424][102897] Updated weights for policy 0, policy_version 69880 (0.0008) +[2023-10-08 14:33:41,185][102898] Updated weights for policy 1, policy_version 69960 (0.0011) +[2023-10-08 14:33:41,558][102898] Updated weights for policy 1, policy_version 69970 (0.0010) +[2023-10-08 14:33:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143196160. Throughput: 0: 1772.5, 1: 1794.7. Samples: 35812644. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:33:41,876][101941] Avg episode reward: [(0, '8.010'), (1, '8.770')] +[2023-10-08 14:33:41,915][102898] Updated weights for policy 1, policy_version 69980 (0.0010) +[2023-10-08 14:33:42,158][102897] Updated weights for policy 0, policy_version 69890 (0.0010) +[2023-10-08 14:33:42,526][102897] Updated weights for policy 0, policy_version 69900 (0.0010) +[2023-10-08 14:33:42,895][102897] Updated weights for policy 0, policy_version 69910 (0.0009) +[2023-10-08 14:33:43,262][102897] Updated weights for policy 0, policy_version 69920 (0.0011) +[2023-10-08 14:33:45,646][102898] Updated weights for policy 1, policy_version 69990 (0.0009) +[2023-10-08 14:33:46,024][102898] Updated weights for policy 1, policy_version 70000 (0.0007) +[2023-10-08 14:33:46,394][102898] Updated weights for policy 1, policy_version 70010 (0.0007) +[2023-10-08 14:33:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 143294464. Throughput: 0: 1790.0, 1: 1791.6. Samples: 35833784. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:33:46,876][101941] Avg episode reward: [(0, '7.810'), (1, '9.870')] +[2023-10-08 14:33:47,089][102897] Updated weights for policy 0, policy_version 69930 (0.0008) +[2023-10-08 14:33:47,472][102897] Updated weights for policy 0, policy_version 69940 (0.0008) +[2023-10-08 14:33:47,837][102897] Updated weights for policy 0, policy_version 69950 (0.0010) +[2023-10-08 14:33:50,087][102898] Updated weights for policy 1, policy_version 70020 (0.0007) +[2023-10-08 14:33:50,462][102898] Updated weights for policy 1, policy_version 70030 (0.0007) +[2023-10-08 14:33:50,826][102898] Updated weights for policy 1, policy_version 70040 (0.0008) +[2023-10-08 14:33:51,710][102897] Updated weights for policy 0, policy_version 69960 (0.0008) +[2023-10-08 14:33:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 143360000. Throughput: 0: 1770.4, 1: 1791.4. Samples: 35844548. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:33:51,875][101941] Avg episode reward: [(0, '6.970'), (1, '9.880')] +[2023-10-08 14:33:52,093][102897] Updated weights for policy 0, policy_version 69970 (0.0008) +[2023-10-08 14:33:52,465][102897] Updated weights for policy 0, policy_version 69980 (0.0007) +[2023-10-08 14:33:54,558][102898] Updated weights for policy 1, policy_version 70050 (0.0008) +[2023-10-08 14:33:54,921][102898] Updated weights for policy 1, policy_version 70060 (0.0007) +[2023-10-08 14:33:55,289][102898] Updated weights for policy 1, policy_version 70070 (0.0009) +[2023-10-08 14:33:55,658][102898] Updated weights for policy 1, policy_version 70080 (0.0008) +[2023-10-08 14:33:56,359][102897] Updated weights for policy 0, policy_version 69990 (0.0008) +[2023-10-08 14:33:56,720][102897] Updated weights for policy 0, policy_version 70000 (0.0007) +[2023-10-08 14:33:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143425536. Throughput: 0: 1784.3, 1: 1792.4. Samples: 35865842. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:33:56,875][101941] Avg episode reward: [(0, '7.990'), (1, '9.300')] +[2023-10-08 14:33:57,095][102897] Updated weights for policy 0, policy_version 70010 (0.0008) +[2023-10-08 14:33:59,349][102898] Updated weights for policy 1, policy_version 70090 (0.0008) +[2023-10-08 14:33:59,719][102898] Updated weights for policy 1, policy_version 70100 (0.0008) +[2023-10-08 14:34:00,085][102898] Updated weights for policy 1, policy_version 70110 (0.0010) +[2023-10-08 14:34:00,754][102897] Updated weights for policy 0, policy_version 70020 (0.0009) +[2023-10-08 14:34:01,135][102897] Updated weights for policy 0, policy_version 70030 (0.0009) +[2023-10-08 14:34:01,509][102897] Updated weights for policy 0, policy_version 70040 (0.0008) +[2023-10-08 14:34:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 143523840. Throughput: 0: 1786.0, 1: 1794.9. Samples: 35887380. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:34:01,876][101941] Avg episode reward: [(0, '8.300'), (1, '8.950')] +[2023-10-08 14:34:03,747][102898] Updated weights for policy 1, policy_version 70120 (0.0008) +[2023-10-08 14:34:04,106][102898] Updated weights for policy 1, policy_version 70130 (0.0008) +[2023-10-08 14:34:04,476][102898] Updated weights for policy 1, policy_version 70140 (0.0008) +[2023-10-08 14:34:05,202][102897] Updated weights for policy 0, policy_version 70050 (0.0009) +[2023-10-08 14:34:05,567][102897] Updated weights for policy 0, policy_version 70060 (0.0008) +[2023-10-08 14:34:05,939][102897] Updated weights for policy 0, policy_version 70070 (0.0007) +[2023-10-08 14:34:06,315][102897] Updated weights for policy 0, policy_version 70080 (0.0008) +[2023-10-08 14:34:06,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143589376. Throughput: 0: 1775.5, 1: 1806.1. Samples: 35898358. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:34:06,876][101941] Avg episode reward: [(0, '8.470'), (1, '9.080')] +[2023-10-08 14:34:08,291][102898] Updated weights for policy 1, policy_version 70150 (0.0008) +[2023-10-08 14:34:08,659][102898] Updated weights for policy 1, policy_version 70160 (0.0007) +[2023-10-08 14:34:09,021][102898] Updated weights for policy 1, policy_version 70170 (0.0010) +[2023-10-08 14:34:10,007][102897] Updated weights for policy 0, policy_version 70090 (0.0009) +[2023-10-08 14:34:10,379][102897] Updated weights for policy 0, policy_version 70100 (0.0009) +[2023-10-08 14:34:10,746][102897] Updated weights for policy 0, policy_version 70110 (0.0008) +[2023-10-08 14:34:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143654912. Throughput: 0: 1792.5, 1: 1800.9. Samples: 35919882. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:34:11,875][101941] Avg episode reward: [(0, '8.480'), (1, '9.220')] +[2023-10-08 14:34:12,630][102898] Updated weights for policy 1, policy_version 70180 (0.0008) +[2023-10-08 14:34:12,993][102898] Updated weights for policy 1, policy_version 70190 (0.0010) +[2023-10-08 14:34:13,366][102898] Updated weights for policy 1, policy_version 70200 (0.0007) +[2023-10-08 14:34:14,392][102897] Updated weights for policy 0, policy_version 70120 (0.0010) +[2023-10-08 14:34:14,775][102897] Updated weights for policy 0, policy_version 70130 (0.0008) +[2023-10-08 14:34:15,147][102897] Updated weights for policy 0, policy_version 70140 (0.0008) +[2023-10-08 14:34:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143720448. Throughput: 0: 1774.7, 1: 1808.0. Samples: 35941810. Policy #0 lag: (min: 31.0, avg: 39.0, max: 63.0) +[2023-10-08 14:34:16,876][101941] Avg episode reward: [(0, '7.520'), (1, '9.680')] +[2023-10-08 14:34:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000070144_71827456.pth... +[2023-10-08 14:34:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000070208_71892992.pth... +[2023-10-08 14:34:16,926][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000068480_70123520.pth +[2023-10-08 14:34:16,928][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000068544_70189056.pth +[2023-10-08 14:34:17,136][102898] Updated weights for policy 1, policy_version 70210 (0.0007) +[2023-10-08 14:34:17,506][102898] Updated weights for policy 1, policy_version 70220 (0.0008) +[2023-10-08 14:34:17,873][102898] Updated weights for policy 1, policy_version 70230 (0.0007) +[2023-10-08 14:34:18,228][102898] Updated weights for policy 1, policy_version 70240 (0.0007) +[2023-10-08 14:34:19,027][102897] Updated weights for policy 0, policy_version 70150 (0.0009) +[2023-10-08 14:34:19,385][102897] Updated weights for policy 0, policy_version 70160 (0.0009) +[2023-10-08 14:34:19,763][102897] Updated weights for policy 0, policy_version 70170 (0.0009) +[2023-10-08 14:34:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 143785984. Throughput: 0: 1793.6, 1: 1810.5. Samples: 35952376. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:21,876][101941] Avg episode reward: [(0, '7.870'), (1, '9.710')] +[2023-10-08 14:34:22,012][102898] Updated weights for policy 1, policy_version 70250 (0.0007) +[2023-10-08 14:34:22,382][102898] Updated weights for policy 1, policy_version 70260 (0.0008) +[2023-10-08 14:34:22,741][102898] Updated weights for policy 1, policy_version 70270 (0.0008) +[2023-10-08 14:34:23,410][102897] Updated weights for policy 0, policy_version 70180 (0.0008) +[2023-10-08 14:34:23,782][102897] Updated weights for policy 0, policy_version 70190 (0.0008) +[2023-10-08 14:34:24,170][102897] Updated weights for policy 0, policy_version 70200 (0.0009) +[2023-10-08 14:34:26,495][102898] Updated weights for policy 1, policy_version 70280 (0.0007) +[2023-10-08 14:34:26,859][102898] Updated weights for policy 1, policy_version 70290 (0.0009) +[2023-10-08 14:34:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 143851520. Throughput: 0: 1781.3, 1: 1804.4. Samples: 35974002. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:26,876][101941] Avg episode reward: [(0, '7.370'), (1, '9.910')] +[2023-10-08 14:34:27,231][102898] Updated weights for policy 1, policy_version 70300 (0.0007) +[2023-10-08 14:34:27,992][102897] Updated weights for policy 0, policy_version 70210 (0.0009) +[2023-10-08 14:34:28,365][102897] Updated weights for policy 0, policy_version 70220 (0.0010) +[2023-10-08 14:34:28,740][102897] Updated weights for policy 0, policy_version 70230 (0.0008) +[2023-10-08 14:34:29,116][102897] Updated weights for policy 0, policy_version 70240 (0.0010) +[2023-10-08 14:34:31,085][102898] Updated weights for policy 1, policy_version 70310 (0.0007) +[2023-10-08 14:34:31,469][102898] Updated weights for policy 1, policy_version 70320 (0.0009) +[2023-10-08 14:34:31,843][102898] Updated weights for policy 1, policy_version 70330 (0.0007) +[2023-10-08 14:34:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 143917056. Throughput: 0: 1783.1, 1: 1810.7. Samples: 35995506. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:31,876][101941] Avg episode reward: [(0, '7.950'), (1, '9.040')] +[2023-10-08 14:34:32,918][102897] Updated weights for policy 0, policy_version 70250 (0.0007) +[2023-10-08 14:34:33,294][102897] Updated weights for policy 0, policy_version 70260 (0.0007) +[2023-10-08 14:34:33,660][102897] Updated weights for policy 0, policy_version 70270 (0.0008) +[2023-10-08 14:34:35,409][102898] Updated weights for policy 1, policy_version 70340 (0.0007) +[2023-10-08 14:34:35,783][102898] Updated weights for policy 1, policy_version 70350 (0.0008) +[2023-10-08 14:34:36,145][102898] Updated weights for policy 1, policy_version 70360 (0.0009) +[2023-10-08 14:34:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 144015360. Throughput: 0: 1788.4, 1: 1802.0. Samples: 36006116. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:36,876][101941] Avg episode reward: [(0, '7.910'), (1, '9.720')] +[2023-10-08 14:34:37,574][102897] Updated weights for policy 0, policy_version 70280 (0.0009) +[2023-10-08 14:34:37,942][102897] Updated weights for policy 0, policy_version 70290 (0.0010) +[2023-10-08 14:34:38,313][102897] Updated weights for policy 0, policy_version 70300 (0.0011) +[2023-10-08 14:34:39,622][102898] Updated weights for policy 1, policy_version 70370 (0.0007) +[2023-10-08 14:34:39,996][102898] Updated weights for policy 1, policy_version 70380 (0.0009) +[2023-10-08 14:34:40,368][102898] Updated weights for policy 1, policy_version 70390 (0.0009) +[2023-10-08 14:34:40,736][102898] Updated weights for policy 1, policy_version 70400 (0.0008) +[2023-10-08 14:34:41,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 144080896. Throughput: 0: 1783.5, 1: 1814.5. Samples: 36027752. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:41,875][101941] Avg episode reward: [(0, '7.870'), (1, '9.850')] +[2023-10-08 14:34:41,881][102897] Updated weights for policy 0, policy_version 70310 (0.0009) +[2023-10-08 14:34:42,244][102897] Updated weights for policy 0, policy_version 70320 (0.0007) +[2023-10-08 14:34:42,610][102897] Updated weights for policy 0, policy_version 70330 (0.0007) +[2023-10-08 14:34:44,516][102898] Updated weights for policy 1, policy_version 70410 (0.0010) +[2023-10-08 14:34:44,888][102898] Updated weights for policy 1, policy_version 70420 (0.0008) +[2023-10-08 14:34:45,249][102898] Updated weights for policy 1, policy_version 70430 (0.0008) +[2023-10-08 14:34:46,387][102897] Updated weights for policy 0, policy_version 70340 (0.0008) +[2023-10-08 14:34:46,761][102897] Updated weights for policy 0, policy_version 70350 (0.0010) +[2023-10-08 14:34:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 144146432. Throughput: 0: 1799.1, 1: 1804.0. Samples: 36049518. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:46,875][101941] Avg episode reward: [(0, '7.830'), (1, '9.760')] +[2023-10-08 14:34:47,130][102897] Updated weights for policy 0, policy_version 70360 (0.0010) +[2023-10-08 14:34:49,190][102898] Updated weights for policy 1, policy_version 70440 (0.0007) +[2023-10-08 14:34:49,563][102898] Updated weights for policy 1, policy_version 70450 (0.0007) +[2023-10-08 14:34:49,925][102898] Updated weights for policy 1, policy_version 70460 (0.0009) +[2023-10-08 14:34:50,910][102897] Updated weights for policy 0, policy_version 70370 (0.0007) +[2023-10-08 14:34:51,275][102897] Updated weights for policy 0, policy_version 70380 (0.0008) +[2023-10-08 14:34:51,652][102897] Updated weights for policy 0, policy_version 70390 (0.0008) +[2023-10-08 14:34:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 144211968. Throughput: 0: 1783.3, 1: 1814.0. Samples: 36060236. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:51,875][101941] Avg episode reward: [(0, '8.560'), (1, '9.700')] +[2023-10-08 14:34:52,014][102897] Updated weights for policy 0, policy_version 70400 (0.0009) +[2023-10-08 14:34:53,567][102898] Updated weights for policy 1, policy_version 70470 (0.0009) +[2023-10-08 14:34:53,930][102898] Updated weights for policy 1, policy_version 70480 (0.0007) +[2023-10-08 14:34:54,300][102898] Updated weights for policy 1, policy_version 70490 (0.0009) +[2023-10-08 14:34:55,823][102897] Updated weights for policy 0, policy_version 70410 (0.0007) +[2023-10-08 14:34:56,193][102897] Updated weights for policy 0, policy_version 70420 (0.0007) +[2023-10-08 14:34:56,563][102897] Updated weights for policy 0, policy_version 70430 (0.0007) +[2023-10-08 14:34:56,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 144310272. Throughput: 0: 1799.3, 1: 1804.7. Samples: 36082062. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:34:56,876][101941] Avg episode reward: [(0, '8.450'), (1, '9.590')] +[2023-10-08 14:34:58,109][102898] Updated weights for policy 1, policy_version 70500 (0.0010) +[2023-10-08 14:34:58,475][102898] Updated weights for policy 1, policy_version 70510 (0.0009) +[2023-10-08 14:34:58,846][102898] Updated weights for policy 1, policy_version 70520 (0.0007) +[2023-10-08 14:35:00,238][102897] Updated weights for policy 0, policy_version 70440 (0.0008) +[2023-10-08 14:35:00,600][102897] Updated weights for policy 0, policy_version 70450 (0.0007) +[2023-10-08 14:35:00,969][102897] Updated weights for policy 0, policy_version 70460 (0.0008) +[2023-10-08 14:35:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 144375808. Throughput: 0: 1791.4, 1: 1795.2. Samples: 36103206. Policy #0 lag: (min: 16.0, avg: 34.9, max: 48.0) +[2023-10-08 14:35:01,876][101941] Avg episode reward: [(0, '8.160'), (1, '8.990')] +[2023-10-08 14:35:02,670][102898] Updated weights for policy 1, policy_version 70530 (0.0008) +[2023-10-08 14:35:03,041][102898] Updated weights for policy 1, policy_version 70540 (0.0007) +[2023-10-08 14:35:03,420][102898] Updated weights for policy 1, policy_version 70550 (0.0010) +[2023-10-08 14:35:03,778][102898] Updated weights for policy 1, policy_version 70560 (0.0008) +[2023-10-08 14:35:04,693][102897] Updated weights for policy 0, policy_version 70470 (0.0010) +[2023-10-08 14:35:05,064][102897] Updated weights for policy 0, policy_version 70480 (0.0010) +[2023-10-08 14:35:05,439][102897] Updated weights for policy 0, policy_version 70490 (0.0010) +[2023-10-08 14:35:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 144441344. Throughput: 0: 1811.9, 1: 1792.8. Samples: 36114588. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:06,876][101941] Avg episode reward: [(0, '8.730'), (1, '9.420')] +[2023-10-08 14:35:07,477][102898] Updated weights for policy 1, policy_version 70570 (0.0007) +[2023-10-08 14:35:07,843][102898] Updated weights for policy 1, policy_version 70580 (0.0007) +[2023-10-08 14:35:08,202][102898] Updated weights for policy 1, policy_version 70590 (0.0007) +[2023-10-08 14:35:09,324][102897] Updated weights for policy 0, policy_version 70500 (0.0009) +[2023-10-08 14:35:09,686][102897] Updated weights for policy 0, policy_version 70510 (0.0007) +[2023-10-08 14:35:10,057][102897] Updated weights for policy 0, policy_version 70520 (0.0007) +[2023-10-08 14:35:11,841][102898] Updated weights for policy 1, policy_version 70600 (0.0009) +[2023-10-08 14:35:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 144506880. Throughput: 0: 1786.9, 1: 1801.3. Samples: 36135472. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:11,876][101941] Avg episode reward: [(0, '8.670'), (1, '10.190')] +[2023-10-08 14:35:12,205][102898] Updated weights for policy 1, policy_version 70610 (0.0010) +[2023-10-08 14:35:12,571][102898] Updated weights for policy 1, policy_version 70620 (0.0009) +[2023-10-08 14:35:13,912][102897] Updated weights for policy 0, policy_version 70530 (0.0008) +[2023-10-08 14:35:14,278][102897] Updated weights for policy 0, policy_version 70540 (0.0008) +[2023-10-08 14:35:14,648][102897] Updated weights for policy 0, policy_version 70550 (0.0008) +[2023-10-08 14:35:15,018][102897] Updated weights for policy 0, policy_version 70560 (0.0009) +[2023-10-08 14:35:16,416][102898] Updated weights for policy 1, policy_version 70630 (0.0008) +[2023-10-08 14:35:16,796][102898] Updated weights for policy 1, policy_version 70640 (0.0007) +[2023-10-08 14:35:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 144572416. Throughput: 0: 1785.8, 1: 1810.5. Samples: 36157338. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:16,875][101941] Avg episode reward: [(0, '8.520'), (1, '10.310')] +[2023-10-08 14:35:17,160][102898] Updated weights for policy 1, policy_version 70650 (0.0007) +[2023-10-08 14:35:18,672][102897] Updated weights for policy 0, policy_version 70570 (0.0008) +[2023-10-08 14:35:19,048][102897] Updated weights for policy 0, policy_version 70580 (0.0007) +[2023-10-08 14:35:19,419][102897] Updated weights for policy 0, policy_version 70590 (0.0007) +[2023-10-08 14:35:20,964][102898] Updated weights for policy 1, policy_version 70660 (0.0009) +[2023-10-08 14:35:21,329][102898] Updated weights for policy 1, policy_version 70670 (0.0009) +[2023-10-08 14:35:21,689][102898] Updated weights for policy 1, policy_version 70680 (0.0009) +[2023-10-08 14:35:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 144637952. Throughput: 0: 1791.9, 1: 1799.6. Samples: 36167734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:21,875][101941] Avg episode reward: [(0, '8.780'), (1, '9.960')] +[2023-10-08 14:35:23,107][102897] Updated weights for policy 0, policy_version 70600 (0.0008) +[2023-10-08 14:35:23,474][102897] Updated weights for policy 0, policy_version 70610 (0.0007) +[2023-10-08 14:35:23,845][102897] Updated weights for policy 0, policy_version 70620 (0.0008) +[2023-10-08 14:35:25,460][102898] Updated weights for policy 1, policy_version 70690 (0.0008) +[2023-10-08 14:35:25,829][102898] Updated weights for policy 1, policy_version 70700 (0.0009) +[2023-10-08 14:35:26,205][102898] Updated weights for policy 1, policy_version 70710 (0.0010) +[2023-10-08 14:35:26,575][102898] Updated weights for policy 1, policy_version 70720 (0.0008) +[2023-10-08 14:35:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 144736256. Throughput: 0: 1796.4, 1: 1809.3. Samples: 36190010. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:26,875][101941] Avg episode reward: [(0, '8.580'), (1, '10.050')] +[2023-10-08 14:35:27,704][102897] Updated weights for policy 0, policy_version 70630 (0.0009) +[2023-10-08 14:35:28,086][102897] Updated weights for policy 0, policy_version 70640 (0.0011) +[2023-10-08 14:35:28,442][102897] Updated weights for policy 0, policy_version 70650 (0.0010) +[2023-10-08 14:35:30,469][102898] Updated weights for policy 1, policy_version 70730 (0.0009) +[2023-10-08 14:35:30,841][102898] Updated weights for policy 1, policy_version 70740 (0.0008) +[2023-10-08 14:35:31,200][102898] Updated weights for policy 1, policy_version 70750 (0.0007) +[2023-10-08 14:35:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 144801792. Throughput: 0: 1795.2, 1: 1792.2. Samples: 36210950. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:31,876][101941] Avg episode reward: [(0, '7.720'), (1, '9.700')] +[2023-10-08 14:35:32,196][102897] Updated weights for policy 0, policy_version 70660 (0.0009) +[2023-10-08 14:35:32,569][102897] Updated weights for policy 0, policy_version 70670 (0.0008) +[2023-10-08 14:35:32,943][102897] Updated weights for policy 0, policy_version 70680 (0.0008) +[2023-10-08 14:35:34,985][102898] Updated weights for policy 1, policy_version 70760 (0.0008) +[2023-10-08 14:35:35,350][102898] Updated weights for policy 1, policy_version 70770 (0.0009) +[2023-10-08 14:35:35,714][102898] Updated weights for policy 1, policy_version 70780 (0.0009) +[2023-10-08 14:35:36,695][102897] Updated weights for policy 0, policy_version 70690 (0.0007) +[2023-10-08 14:35:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 144867328. Throughput: 0: 1789.2, 1: 1805.4. Samples: 36221994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:36,875][101941] Avg episode reward: [(0, '7.610'), (1, '9.210')] +[2023-10-08 14:35:37,071][102897] Updated weights for policy 0, policy_version 70700 (0.0009) +[2023-10-08 14:35:37,440][102897] Updated weights for policy 0, policy_version 70710 (0.0009) +[2023-10-08 14:35:37,807][102897] Updated weights for policy 0, policy_version 70720 (0.0008) +[2023-10-08 14:35:39,376][102898] Updated weights for policy 1, policy_version 70790 (0.0009) +[2023-10-08 14:35:39,747][102898] Updated weights for policy 1, policy_version 70800 (0.0007) +[2023-10-08 14:35:40,110][102898] Updated weights for policy 1, policy_version 70810 (0.0008) +[2023-10-08 14:35:41,576][102897] Updated weights for policy 0, policy_version 70730 (0.0010) +[2023-10-08 14:35:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 144932864. Throughput: 0: 1793.6, 1: 1783.2. Samples: 36243018. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:41,876][101941] Avg episode reward: [(0, '7.850'), (1, '9.610')] +[2023-10-08 14:35:41,952][102897] Updated weights for policy 0, policy_version 70740 (0.0010) +[2023-10-08 14:35:42,310][102897] Updated weights for policy 0, policy_version 70750 (0.0010) +[2023-10-08 14:35:43,940][102898] Updated weights for policy 1, policy_version 70820 (0.0009) +[2023-10-08 14:35:44,318][102898] Updated weights for policy 1, policy_version 70830 (0.0009) +[2023-10-08 14:35:44,689][102898] Updated weights for policy 1, policy_version 70840 (0.0008) +[2023-10-08 14:35:46,212][102897] Updated weights for policy 0, policy_version 70760 (0.0008) +[2023-10-08 14:35:46,589][102897] Updated weights for policy 0, policy_version 70770 (0.0009) +[2023-10-08 14:35:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 144998400. Throughput: 0: 1805.3, 1: 1780.8. Samples: 36264582. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:35:46,876][101941] Avg episode reward: [(0, '8.360'), (1, '9.600')] +[2023-10-08 14:35:46,955][102897] Updated weights for policy 0, policy_version 70780 (0.0008) +[2023-10-08 14:35:48,425][102898] Updated weights for policy 1, policy_version 70850 (0.0007) +[2023-10-08 14:35:48,795][102898] Updated weights for policy 1, policy_version 70860 (0.0009) +[2023-10-08 14:35:49,159][102898] Updated weights for policy 1, policy_version 70870 (0.0011) +[2023-10-08 14:35:49,530][102898] Updated weights for policy 1, policy_version 70880 (0.0009) +[2023-10-08 14:35:50,763][102897] Updated weights for policy 0, policy_version 70790 (0.0009) +[2023-10-08 14:35:51,137][102897] Updated weights for policy 0, policy_version 70800 (0.0009) +[2023-10-08 14:35:51,509][102897] Updated weights for policy 0, policy_version 70810 (0.0007) +[2023-10-08 14:35:51,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 145096704. Throughput: 0: 1781.0, 1: 1784.5. Samples: 36275034. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:35:51,876][101941] Avg episode reward: [(0, '8.130'), (1, '9.410')] +[2023-10-08 14:35:53,160][102898] Updated weights for policy 1, policy_version 70890 (0.0008) +[2023-10-08 14:35:53,527][102898] Updated weights for policy 1, policy_version 70900 (0.0011) +[2023-10-08 14:35:53,897][102898] Updated weights for policy 1, policy_version 70910 (0.0008) +[2023-10-08 14:35:55,208][102897] Updated weights for policy 0, policy_version 70820 (0.0008) +[2023-10-08 14:35:55,566][102897] Updated weights for policy 0, policy_version 70830 (0.0007) +[2023-10-08 14:35:55,946][102897] Updated weights for policy 0, policy_version 70840 (0.0008) +[2023-10-08 14:35:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 145162240. Throughput: 0: 1810.7, 1: 1779.3. Samples: 36297022. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:35:56,876][101941] Avg episode reward: [(0, '8.410'), (1, '9.400')] +[2023-10-08 14:35:57,743][102898] Updated weights for policy 1, policy_version 70920 (0.0008) +[2023-10-08 14:35:58,106][102898] Updated weights for policy 1, policy_version 70930 (0.0009) +[2023-10-08 14:35:58,475][102898] Updated weights for policy 1, policy_version 70940 (0.0010) +[2023-10-08 14:35:59,627][102897] Updated weights for policy 0, policy_version 70850 (0.0008) +[2023-10-08 14:35:59,998][102897] Updated weights for policy 0, policy_version 70860 (0.0009) +[2023-10-08 14:36:00,361][102897] Updated weights for policy 0, policy_version 70870 (0.0009) +[2023-10-08 14:36:00,727][102897] Updated weights for policy 0, policy_version 70880 (0.0011) +[2023-10-08 14:36:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 145227776. Throughput: 0: 1791.3, 1: 1788.0. Samples: 36318406. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:01,876][101941] Avg episode reward: [(0, '8.370'), (1, '9.860')] +[2023-10-08 14:36:02,327][102898] Updated weights for policy 1, policy_version 70950 (0.0008) +[2023-10-08 14:36:02,712][102898] Updated weights for policy 1, policy_version 70960 (0.0008) +[2023-10-08 14:36:03,072][102898] Updated weights for policy 1, policy_version 70970 (0.0009) +[2023-10-08 14:36:04,346][102897] Updated weights for policy 0, policy_version 70890 (0.0008) +[2023-10-08 14:36:04,717][102897] Updated weights for policy 0, policy_version 70900 (0.0008) +[2023-10-08 14:36:05,084][102897] Updated weights for policy 0, policy_version 70910 (0.0008) +[2023-10-08 14:36:06,722][102898] Updated weights for policy 1, policy_version 70980 (0.0007) +[2023-10-08 14:36:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 145293312. Throughput: 0: 1810.4, 1: 1780.6. Samples: 36329326. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:06,876][101941] Avg episode reward: [(0, '8.100'), (1, '9.590')] +[2023-10-08 14:36:07,090][102898] Updated weights for policy 1, policy_version 70990 (0.0009) +[2023-10-08 14:36:07,452][102898] Updated weights for policy 1, policy_version 71000 (0.0009) +[2023-10-08 14:36:09,026][102897] Updated weights for policy 0, policy_version 70920 (0.0008) +[2023-10-08 14:36:09,383][102897] Updated weights for policy 0, policy_version 70930 (0.0008) +[2023-10-08 14:36:09,757][102897] Updated weights for policy 0, policy_version 70940 (0.0008) +[2023-10-08 14:36:11,257][102898] Updated weights for policy 1, policy_version 71010 (0.0008) +[2023-10-08 14:36:11,617][102898] Updated weights for policy 1, policy_version 71020 (0.0008) +[2023-10-08 14:36:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 145358848. Throughput: 0: 1783.9, 1: 1790.1. Samples: 36350838. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:11,876][101941] Avg episode reward: [(0, '8.370'), (1, '9.580')] +[2023-10-08 14:36:11,977][102898] Updated weights for policy 1, policy_version 71030 (0.0008) +[2023-10-08 14:36:12,347][102898] Updated weights for policy 1, policy_version 71040 (0.0009) +[2023-10-08 14:36:13,497][102897] Updated weights for policy 0, policy_version 70950 (0.0008) +[2023-10-08 14:36:13,882][102897] Updated weights for policy 0, policy_version 70960 (0.0008) +[2023-10-08 14:36:14,254][102897] Updated weights for policy 0, policy_version 70970 (0.0008) +[2023-10-08 14:36:16,069][102898] Updated weights for policy 1, policy_version 71050 (0.0007) +[2023-10-08 14:36:16,428][102898] Updated weights for policy 1, policy_version 71060 (0.0007) +[2023-10-08 14:36:16,792][102898] Updated weights for policy 1, policy_version 71070 (0.0008) +[2023-10-08 14:36:16,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 145457152. Throughput: 0: 1792.1, 1: 1797.3. Samples: 36372474. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:16,876][101941] Avg episode reward: [(0, '9.150'), (1, '9.370')] +[2023-10-08 14:36:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000070976_72679424.pth... +[2023-10-08 14:36:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000071072_72777728.pth... +[2023-10-08 14:36:16,928][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000069376_71041024.pth +[2023-10-08 14:36:16,929][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000069312_70975488.pth +[2023-10-08 14:36:17,839][102897] Updated weights for policy 0, policy_version 70980 (0.0009) +[2023-10-08 14:36:18,200][102897] Updated weights for policy 0, policy_version 70990 (0.0010) +[2023-10-08 14:36:18,571][102897] Updated weights for policy 0, policy_version 71000 (0.0010) +[2023-10-08 14:36:20,481][102898] Updated weights for policy 1, policy_version 71080 (0.0008) +[2023-10-08 14:36:20,849][102898] Updated weights for policy 1, policy_version 71090 (0.0008) +[2023-10-08 14:36:21,212][102898] Updated weights for policy 1, policy_version 71100 (0.0008) +[2023-10-08 14:36:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 145522688. Throughput: 0: 1793.8, 1: 1788.6. Samples: 36383202. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:21,876][101941] Avg episode reward: [(0, '8.880'), (1, '9.990')] +[2023-10-08 14:36:22,348][102897] Updated weights for policy 0, policy_version 71010 (0.0011) +[2023-10-08 14:36:22,724][102897] Updated weights for policy 0, policy_version 71020 (0.0007) +[2023-10-08 14:36:23,088][102897] Updated weights for policy 0, policy_version 71030 (0.0007) +[2023-10-08 14:36:23,467][102897] Updated weights for policy 0, policy_version 71040 (0.0009) +[2023-10-08 14:36:25,090][102898] Updated weights for policy 1, policy_version 71110 (0.0010) +[2023-10-08 14:36:25,455][102898] Updated weights for policy 1, policy_version 71120 (0.0008) +[2023-10-08 14:36:25,814][102898] Updated weights for policy 1, policy_version 71130 (0.0011) +[2023-10-08 14:36:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 145588224. Throughput: 0: 1790.2, 1: 1809.6. Samples: 36405010. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:26,876][101941] Avg episode reward: [(0, '8.490'), (1, '10.120')] +[2023-10-08 14:36:27,286][102897] Updated weights for policy 0, policy_version 71050 (0.0009) +[2023-10-08 14:36:27,662][102897] Updated weights for policy 0, policy_version 71060 (0.0008) +[2023-10-08 14:36:28,032][102897] Updated weights for policy 0, policy_version 71070 (0.0008) +[2023-10-08 14:36:29,600][102898] Updated weights for policy 1, policy_version 71140 (0.0008) +[2023-10-08 14:36:29,964][102898] Updated weights for policy 1, policy_version 71150 (0.0007) +[2023-10-08 14:36:30,330][102898] Updated weights for policy 1, policy_version 71160 (0.0008) +[2023-10-08 14:36:31,801][102897] Updated weights for policy 0, policy_version 71080 (0.0008) +[2023-10-08 14:36:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 145653760. Throughput: 0: 1798.8, 1: 1796.1. Samples: 36426354. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:31,875][101941] Avg episode reward: [(0, '8.090'), (1, '8.610')] +[2023-10-08 14:36:32,168][102897] Updated weights for policy 0, policy_version 71090 (0.0008) +[2023-10-08 14:36:32,537][102897] Updated weights for policy 0, policy_version 71100 (0.0007) +[2023-10-08 14:36:33,895][102898] Updated weights for policy 1, policy_version 71170 (0.0008) +[2023-10-08 14:36:34,264][102898] Updated weights for policy 1, policy_version 71180 (0.0008) +[2023-10-08 14:36:34,627][102898] Updated weights for policy 1, policy_version 71190 (0.0008) +[2023-10-08 14:36:34,998][102898] Updated weights for policy 1, policy_version 71200 (0.0007) +[2023-10-08 14:36:36,149][102897] Updated weights for policy 0, policy_version 71110 (0.0007) +[2023-10-08 14:36:36,522][102897] Updated weights for policy 0, policy_version 71120 (0.0009) +[2023-10-08 14:36:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 145719296. Throughput: 0: 1790.6, 1: 1811.1. Samples: 36437112. Policy #0 lag: (min: 26.0, avg: 42.4, max: 58.0) +[2023-10-08 14:36:36,876][101941] Avg episode reward: [(0, '8.150'), (1, '9.200')] +[2023-10-08 14:36:36,885][102897] Updated weights for policy 0, policy_version 71130 (0.0011) +[2023-10-08 14:36:38,766][102898] Updated weights for policy 1, policy_version 71210 (0.0009) +[2023-10-08 14:36:39,122][102898] Updated weights for policy 1, policy_version 71220 (0.0008) +[2023-10-08 14:36:39,492][102898] Updated weights for policy 1, policy_version 71230 (0.0008) +[2023-10-08 14:36:40,616][102897] Updated weights for policy 0, policy_version 71140 (0.0008) +[2023-10-08 14:36:40,986][102897] Updated weights for policy 0, policy_version 71150 (0.0008) +[2023-10-08 14:36:41,359][102897] Updated weights for policy 0, policy_version 71160 (0.0009) +[2023-10-08 14:36:41,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 145817600. Throughput: 0: 1799.7, 1: 1790.8. Samples: 36458594. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:36:41,876][101941] Avg episode reward: [(0, '8.430'), (1, '9.150')] +[2023-10-08 14:36:43,382][102898] Updated weights for policy 1, policy_version 71240 (0.0008) +[2023-10-08 14:36:43,748][102898] Updated weights for policy 1, policy_version 71250 (0.0008) +[2023-10-08 14:36:44,121][102898] Updated weights for policy 1, policy_version 71260 (0.0007) +[2023-10-08 14:36:45,228][102897] Updated weights for policy 0, policy_version 71170 (0.0008) +[2023-10-08 14:36:45,596][102897] Updated weights for policy 0, policy_version 71180 (0.0007) +[2023-10-08 14:36:45,973][102897] Updated weights for policy 0, policy_version 71190 (0.0009) +[2023-10-08 14:36:46,339][102897] Updated weights for policy 0, policy_version 71200 (0.0008) +[2023-10-08 14:36:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 145883136. Throughput: 0: 1785.9, 1: 1801.6. Samples: 36479844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:36:46,876][101941] Avg episode reward: [(0, '8.990'), (1, '8.930')] +[2023-10-08 14:36:47,825][102898] Updated weights for policy 1, policy_version 71270 (0.0008) +[2023-10-08 14:36:48,207][102898] Updated weights for policy 1, policy_version 71280 (0.0010) +[2023-10-08 14:36:48,569][102898] Updated weights for policy 1, policy_version 71290 (0.0007) +[2023-10-08 14:36:50,095][102897] Updated weights for policy 0, policy_version 71210 (0.0009) +[2023-10-08 14:36:50,462][102897] Updated weights for policy 0, policy_version 71220 (0.0009) +[2023-10-08 14:36:50,831][102897] Updated weights for policy 0, policy_version 71230 (0.0009) +[2023-10-08 14:36:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 145948672. Throughput: 0: 1790.2, 1: 1797.8. Samples: 36490786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:36:51,876][101941] Avg episode reward: [(0, '8.970'), (1, '10.030')] +[2023-10-08 14:36:52,324][102898] Updated weights for policy 1, policy_version 71300 (0.0008) +[2023-10-08 14:36:52,688][102898] Updated weights for policy 1, policy_version 71310 (0.0010) +[2023-10-08 14:36:53,057][102898] Updated weights for policy 1, policy_version 71320 (0.0009) +[2023-10-08 14:36:54,487][102897] Updated weights for policy 0, policy_version 71240 (0.0008) +[2023-10-08 14:36:54,849][102897] Updated weights for policy 0, policy_version 71250 (0.0008) +[2023-10-08 14:36:55,215][102897] Updated weights for policy 0, policy_version 71260 (0.0009) +[2023-10-08 14:36:56,876][101941] Fps is (10 sec: 13106.3, 60 sec: 14199.3, 300 sec: 14329.0). Total num frames: 146014208. Throughput: 0: 1784.3, 1: 1790.5. Samples: 36511706. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:36:56,876][101941] Avg episode reward: [(0, '7.930'), (1, '9.850')] +[2023-10-08 14:36:56,885][102898] Updated weights for policy 1, policy_version 71330 (0.0008) +[2023-10-08 14:36:57,246][102898] Updated weights for policy 1, policy_version 71340 (0.0008) +[2023-10-08 14:36:57,615][102898] Updated weights for policy 1, policy_version 71350 (0.0007) +[2023-10-08 14:36:57,976][102898] Updated weights for policy 1, policy_version 71360 (0.0008) +[2023-10-08 14:36:59,087][102897] Updated weights for policy 0, policy_version 71270 (0.0009) +[2023-10-08 14:36:59,470][102897] Updated weights for policy 0, policy_version 71280 (0.0009) +[2023-10-08 14:36:59,839][102897] Updated weights for policy 0, policy_version 71290 (0.0008) +[2023-10-08 14:37:01,733][102898] Updated weights for policy 1, policy_version 71370 (0.0008) +[2023-10-08 14:37:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 146079744. Throughput: 0: 1777.2, 1: 1807.4. Samples: 36533778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:01,876][101941] Avg episode reward: [(0, '8.330'), (1, '9.850')] +[2023-10-08 14:37:02,096][102898] Updated weights for policy 1, policy_version 71380 (0.0010) +[2023-10-08 14:37:02,465][102898] Updated weights for policy 1, policy_version 71390 (0.0007) +[2023-10-08 14:37:03,688][102897] Updated weights for policy 0, policy_version 71300 (0.0007) +[2023-10-08 14:37:04,058][102897] Updated weights for policy 0, policy_version 71310 (0.0008) +[2023-10-08 14:37:04,423][102897] Updated weights for policy 0, policy_version 71320 (0.0008) +[2023-10-08 14:37:06,231][102898] Updated weights for policy 1, policy_version 71400 (0.0009) +[2023-10-08 14:37:06,602][102898] Updated weights for policy 1, policy_version 71410 (0.0007) +[2023-10-08 14:37:06,875][101941] Fps is (10 sec: 13108.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 146145280. Throughput: 0: 1786.0, 1: 1788.4. Samples: 36544050. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:06,876][101941] Avg episode reward: [(0, '8.040'), (1, '9.610')] +[2023-10-08 14:37:06,965][102898] Updated weights for policy 1, policy_version 71420 (0.0008) +[2023-10-08 14:37:08,182][102897] Updated weights for policy 0, policy_version 71330 (0.0008) +[2023-10-08 14:37:08,558][102897] Updated weights for policy 0, policy_version 71340 (0.0009) +[2023-10-08 14:37:08,936][102897] Updated weights for policy 0, policy_version 71350 (0.0009) +[2023-10-08 14:37:09,304][102897] Updated weights for policy 0, policy_version 71360 (0.0009) +[2023-10-08 14:37:10,739][102898] Updated weights for policy 1, policy_version 71430 (0.0007) +[2023-10-08 14:37:11,107][102898] Updated weights for policy 1, policy_version 71440 (0.0008) +[2023-10-08 14:37:11,471][102898] Updated weights for policy 1, policy_version 71450 (0.0007) +[2023-10-08 14:37:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 146243584. Throughput: 0: 1776.8, 1: 1801.2. Samples: 36566018. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:11,876][101941] Avg episode reward: [(0, '8.330'), (1, '10.040')] +[2023-10-08 14:37:13,039][102897] Updated weights for policy 0, policy_version 71370 (0.0007) +[2023-10-08 14:37:13,405][102897] Updated weights for policy 0, policy_version 71380 (0.0007) +[2023-10-08 14:37:13,770][102897] Updated weights for policy 0, policy_version 71390 (0.0007) +[2023-10-08 14:37:15,268][102898] Updated weights for policy 1, policy_version 71460 (0.0008) +[2023-10-08 14:37:15,632][102898] Updated weights for policy 1, policy_version 71470 (0.0009) +[2023-10-08 14:37:15,998][102898] Updated weights for policy 1, policy_version 71480 (0.0008) +[2023-10-08 14:37:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 146309120. Throughput: 0: 1786.5, 1: 1786.3. Samples: 36587128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:16,876][101941] Avg episode reward: [(0, '8.400'), (1, '9.150')] +[2023-10-08 14:37:17,431][102897] Updated weights for policy 0, policy_version 71400 (0.0007) +[2023-10-08 14:37:17,816][102897] Updated weights for policy 0, policy_version 71410 (0.0007) +[2023-10-08 14:37:18,175][102897] Updated weights for policy 0, policy_version 71420 (0.0008) +[2023-10-08 14:37:19,868][102898] Updated weights for policy 1, policy_version 71490 (0.0008) +[2023-10-08 14:37:20,227][102898] Updated weights for policy 1, policy_version 71500 (0.0010) +[2023-10-08 14:37:20,601][102898] Updated weights for policy 1, policy_version 71510 (0.0009) +[2023-10-08 14:37:20,970][102898] Updated weights for policy 1, policy_version 71520 (0.0010) +[2023-10-08 14:37:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 146374656. Throughput: 0: 1781.9, 1: 1800.7. Samples: 36598328. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:21,876][101941] Avg episode reward: [(0, '8.060'), (1, '8.970')] +[2023-10-08 14:37:22,044][102897] Updated weights for policy 0, policy_version 71430 (0.0009) +[2023-10-08 14:37:22,413][102897] Updated weights for policy 0, policy_version 71440 (0.0009) +[2023-10-08 14:37:22,787][102897] Updated weights for policy 0, policy_version 71450 (0.0008) +[2023-10-08 14:37:24,642][102898] Updated weights for policy 1, policy_version 71530 (0.0008) +[2023-10-08 14:37:25,021][102898] Updated weights for policy 1, policy_version 71540 (0.0008) +[2023-10-08 14:37:25,382][102898] Updated weights for policy 1, policy_version 71550 (0.0010) +[2023-10-08 14:37:26,683][102897] Updated weights for policy 0, policy_version 71460 (0.0008) +[2023-10-08 14:37:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 146440192. Throughput: 0: 1783.8, 1: 1788.9. Samples: 36619364. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:26,876][101941] Avg episode reward: [(0, '7.950'), (1, '9.610')] +[2023-10-08 14:37:27,054][102897] Updated weights for policy 0, policy_version 71470 (0.0007) +[2023-10-08 14:37:27,418][102897] Updated weights for policy 0, policy_version 71480 (0.0007) +[2023-10-08 14:37:29,073][102898] Updated weights for policy 1, policy_version 71560 (0.0008) +[2023-10-08 14:37:29,438][102898] Updated weights for policy 1, policy_version 71570 (0.0007) +[2023-10-08 14:37:29,808][102898] Updated weights for policy 1, policy_version 71580 (0.0007) +[2023-10-08 14:37:31,278][102897] Updated weights for policy 0, policy_version 71490 (0.0008) +[2023-10-08 14:37:31,650][102897] Updated weights for policy 0, policy_version 71500 (0.0008) +[2023-10-08 14:37:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 146505728. Throughput: 0: 1809.1, 1: 1783.9. Samples: 36641530. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:31,876][101941] Avg episode reward: [(0, '8.020'), (1, '9.250')] +[2023-10-08 14:37:32,018][102897] Updated weights for policy 0, policy_version 71510 (0.0008) +[2023-10-08 14:37:32,390][102897] Updated weights for policy 0, policy_version 71520 (0.0007) +[2023-10-08 14:37:33,631][102898] Updated weights for policy 1, policy_version 71590 (0.0007) +[2023-10-08 14:37:33,999][102898] Updated weights for policy 1, policy_version 71600 (0.0007) +[2023-10-08 14:37:34,374][102898] Updated weights for policy 1, policy_version 71610 (0.0009) +[2023-10-08 14:37:36,033][102897] Updated weights for policy 0, policy_version 71530 (0.0007) +[2023-10-08 14:37:36,395][102897] Updated weights for policy 0, policy_version 71540 (0.0009) +[2023-10-08 14:37:36,772][102897] Updated weights for policy 0, policy_version 71550 (0.0007) +[2023-10-08 14:37:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 146604032. Throughput: 0: 1786.3, 1: 1795.4. Samples: 36651962. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:36,875][101941] Avg episode reward: [(0, '7.740'), (1, '9.570')] +[2023-10-08 14:37:38,073][102898] Updated weights for policy 1, policy_version 71620 (0.0010) +[2023-10-08 14:37:38,438][102898] Updated weights for policy 1, policy_version 71630 (0.0008) +[2023-10-08 14:37:38,802][102898] Updated weights for policy 1, policy_version 71640 (0.0010) +[2023-10-08 14:37:40,594][102897] Updated weights for policy 0, policy_version 71560 (0.0009) +[2023-10-08 14:37:40,961][102897] Updated weights for policy 0, policy_version 71570 (0.0009) +[2023-10-08 14:37:41,328][102897] Updated weights for policy 0, policy_version 71580 (0.0008) +[2023-10-08 14:37:41,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 146669568. Throughput: 0: 1813.0, 1: 1794.7. Samples: 36674052. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:41,876][101941] Avg episode reward: [(0, '8.320'), (1, '9.720')] +[2023-10-08 14:37:42,568][102898] Updated weights for policy 1, policy_version 71650 (0.0009) +[2023-10-08 14:37:42,941][102898] Updated weights for policy 1, policy_version 71660 (0.0008) +[2023-10-08 14:37:43,312][102898] Updated weights for policy 1, policy_version 71670 (0.0007) +[2023-10-08 14:37:43,669][102898] Updated weights for policy 1, policy_version 71680 (0.0008) +[2023-10-08 14:37:44,987][102897] Updated weights for policy 0, policy_version 71590 (0.0008) +[2023-10-08 14:37:45,372][102897] Updated weights for policy 0, policy_version 71600 (0.0010) +[2023-10-08 14:37:45,741][102897] Updated weights for policy 0, policy_version 71610 (0.0011) +[2023-10-08 14:37:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 146735104. Throughput: 0: 1785.1, 1: 1803.8. Samples: 36695278. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:46,875][101941] Avg episode reward: [(0, '9.070'), (1, '9.590')] +[2023-10-08 14:37:47,345][102898] Updated weights for policy 1, policy_version 71690 (0.0009) +[2023-10-08 14:37:47,709][102898] Updated weights for policy 1, policy_version 71700 (0.0008) +[2023-10-08 14:37:48,084][102898] Updated weights for policy 1, policy_version 71710 (0.0009) +[2023-10-08 14:37:49,372][102897] Updated weights for policy 0, policy_version 71620 (0.0009) +[2023-10-08 14:37:49,745][102897] Updated weights for policy 0, policy_version 71630 (0.0009) +[2023-10-08 14:37:50,107][102897] Updated weights for policy 0, policy_version 71640 (0.0008) +[2023-10-08 14:37:51,609][102898] Updated weights for policy 1, policy_version 71720 (0.0010) +[2023-10-08 14:37:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 146800640. Throughput: 0: 1807.9, 1: 1803.6. Samples: 36706566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:51,875][101941] Avg episode reward: [(0, '8.910'), (1, '9.350')] +[2023-10-08 14:37:51,978][102898] Updated weights for policy 1, policy_version 71730 (0.0009) +[2023-10-08 14:37:52,344][102898] Updated weights for policy 1, policy_version 71740 (0.0009) +[2023-10-08 14:37:53,646][102897] Updated weights for policy 0, policy_version 71650 (0.0009) +[2023-10-08 14:37:54,025][102897] Updated weights for policy 0, policy_version 71660 (0.0011) +[2023-10-08 14:37:54,397][102897] Updated weights for policy 0, policy_version 71670 (0.0009) +[2023-10-08 14:37:54,773][102897] Updated weights for policy 0, policy_version 71680 (0.0007) +[2023-10-08 14:37:56,093][102898] Updated weights for policy 1, policy_version 71750 (0.0007) +[2023-10-08 14:37:56,457][102898] Updated weights for policy 1, policy_version 71760 (0.0008) +[2023-10-08 14:37:56,835][102898] Updated weights for policy 1, policy_version 71770 (0.0008) +[2023-10-08 14:37:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.7, 300 sec: 14218.0). Total num frames: 146866176. Throughput: 0: 1797.0, 1: 1804.8. Samples: 36728098. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:37:56,875][101941] Avg episode reward: [(0, '8.790'), (1, '9.780')] +[2023-10-08 14:37:58,414][102897] Updated weights for policy 0, policy_version 71690 (0.0010) +[2023-10-08 14:37:58,791][102897] Updated weights for policy 0, policy_version 71700 (0.0009) +[2023-10-08 14:37:59,151][102897] Updated weights for policy 0, policy_version 71710 (0.0007) +[2023-10-08 14:38:00,748][102898] Updated weights for policy 1, policy_version 71780 (0.0008) +[2023-10-08 14:38:01,120][102898] Updated weights for policy 1, policy_version 71790 (0.0010) +[2023-10-08 14:38:01,484][102898] Updated weights for policy 1, policy_version 71800 (0.0007) +[2023-10-08 14:38:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 146964480. Throughput: 0: 1795.5, 1: 1815.5. Samples: 36749624. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:01,876][101941] Avg episode reward: [(0, '8.960'), (1, '10.430')] +[2023-10-08 14:38:02,916][102897] Updated weights for policy 0, policy_version 71720 (0.0007) +[2023-10-08 14:38:03,287][102897] Updated weights for policy 0, policy_version 71730 (0.0007) +[2023-10-08 14:38:03,664][102897] Updated weights for policy 0, policy_version 71740 (0.0008) +[2023-10-08 14:38:05,059][102898] Updated weights for policy 1, policy_version 71810 (0.0008) +[2023-10-08 14:38:05,416][102898] Updated weights for policy 1, policy_version 71820 (0.0009) +[2023-10-08 14:38:05,782][102898] Updated weights for policy 1, policy_version 71830 (0.0010) +[2023-10-08 14:38:06,152][102898] Updated weights for policy 1, policy_version 71840 (0.0011) +[2023-10-08 14:38:06,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 147030016. Throughput: 0: 1794.4, 1: 1808.5. Samples: 36760462. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:06,876][101941] Avg episode reward: [(0, '8.940'), (1, '10.590')] +[2023-10-08 14:38:07,421][102897] Updated weights for policy 0, policy_version 71750 (0.0009) +[2023-10-08 14:38:07,801][102897] Updated weights for policy 0, policy_version 71760 (0.0009) +[2023-10-08 14:38:08,174][102897] Updated weights for policy 0, policy_version 71770 (0.0008) +[2023-10-08 14:38:09,743][102898] Updated weights for policy 1, policy_version 71850 (0.0011) +[2023-10-08 14:38:10,114][102898] Updated weights for policy 1, policy_version 71860 (0.0011) +[2023-10-08 14:38:10,477][102898] Updated weights for policy 1, policy_version 71870 (0.0011) +[2023-10-08 14:38:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147095552. Throughput: 0: 1792.6, 1: 1813.9. Samples: 36781656. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:11,875][101941] Avg episode reward: [(0, '8.450'), (1, '9.910')] +[2023-10-08 14:38:12,108][102897] Updated weights for policy 0, policy_version 71780 (0.0009) +[2023-10-08 14:38:12,477][102897] Updated weights for policy 0, policy_version 71790 (0.0010) +[2023-10-08 14:38:12,847][102897] Updated weights for policy 0, policy_version 71800 (0.0008) +[2023-10-08 14:38:14,341][102898] Updated weights for policy 1, policy_version 71880 (0.0008) +[2023-10-08 14:38:14,706][102898] Updated weights for policy 1, policy_version 71890 (0.0008) +[2023-10-08 14:38:15,078][102898] Updated weights for policy 1, policy_version 71900 (0.0007) +[2023-10-08 14:38:16,720][102897] Updated weights for policy 0, policy_version 71810 (0.0008) +[2023-10-08 14:38:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147161088. Throughput: 0: 1803.9, 1: 1797.6. Samples: 36803596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:16,875][101941] Avg episode reward: [(0, '8.330'), (1, '9.940')] +[2023-10-08 14:38:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000071904_73629696.pth... +[2023-10-08 14:38:16,919][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000070208_71892992.pth +[2023-10-08 14:38:17,100][102897] Updated weights for policy 0, policy_version 71820 (0.0007) +[2023-10-08 14:38:17,467][102897] Updated weights for policy 0, policy_version 71830 (0.0008) +[2023-10-08 14:38:17,832][102897] Updated weights for policy 0, policy_version 71840 (0.0007) +[2023-10-08 14:38:17,832][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000071840_73564160.pth... +[2023-10-08 14:38:17,869][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000070144_71827456.pth +[2023-10-08 14:38:18,973][102898] Updated weights for policy 1, policy_version 71910 (0.0009) +[2023-10-08 14:38:19,349][102898] Updated weights for policy 1, policy_version 71920 (0.0009) +[2023-10-08 14:38:19,708][102898] Updated weights for policy 1, policy_version 71930 (0.0009) +[2023-10-08 14:38:21,580][102897] Updated weights for policy 0, policy_version 71850 (0.0007) +[2023-10-08 14:38:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147226624. Throughput: 0: 1793.9, 1: 1803.9. Samples: 36813860. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:21,875][101941] Avg episode reward: [(0, '8.750'), (1, '9.610')] +[2023-10-08 14:38:21,944][102897] Updated weights for policy 0, policy_version 71860 (0.0008) +[2023-10-08 14:38:22,318][102897] Updated weights for policy 0, policy_version 71870 (0.0007) +[2023-10-08 14:38:23,529][102898] Updated weights for policy 1, policy_version 71940 (0.0007) +[2023-10-08 14:38:23,894][102898] Updated weights for policy 1, policy_version 71950 (0.0008) +[2023-10-08 14:38:24,255][102898] Updated weights for policy 1, policy_version 71960 (0.0009) +[2023-10-08 14:38:26,051][102897] Updated weights for policy 0, policy_version 71880 (0.0008) +[2023-10-08 14:38:26,431][102897] Updated weights for policy 0, policy_version 71890 (0.0008) +[2023-10-08 14:38:26,793][102897] Updated weights for policy 0, policy_version 71900 (0.0008) +[2023-10-08 14:38:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147292160. Throughput: 0: 1803.6, 1: 1786.7. Samples: 36835614. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:26,875][101941] Avg episode reward: [(0, '8.650'), (1, '9.080')] +[2023-10-08 14:38:28,003][102898] Updated weights for policy 1, policy_version 71970 (0.0009) +[2023-10-08 14:38:28,377][102898] Updated weights for policy 1, policy_version 71980 (0.0009) +[2023-10-08 14:38:28,740][102898] Updated weights for policy 1, policy_version 71990 (0.0009) +[2023-10-08 14:38:29,109][102898] Updated weights for policy 1, policy_version 72000 (0.0009) +[2023-10-08 14:38:30,506][102897] Updated weights for policy 0, policy_version 71910 (0.0008) +[2023-10-08 14:38:30,885][102897] Updated weights for policy 0, policy_version 71920 (0.0010) +[2023-10-08 14:38:31,249][102897] Updated weights for policy 0, policy_version 71930 (0.0009) +[2023-10-08 14:38:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 147390464. Throughput: 0: 1804.2, 1: 1786.9. Samples: 36856880. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:31,876][101941] Avg episode reward: [(0, '8.090'), (1, '9.350')] +[2023-10-08 14:38:32,852][102898] Updated weights for policy 1, policy_version 72010 (0.0008) +[2023-10-08 14:38:33,220][102898] Updated weights for policy 1, policy_version 72020 (0.0007) +[2023-10-08 14:38:33,583][102898] Updated weights for policy 1, policy_version 72030 (0.0007) +[2023-10-08 14:38:34,950][102897] Updated weights for policy 0, policy_version 71940 (0.0009) +[2023-10-08 14:38:35,321][102897] Updated weights for policy 0, policy_version 71950 (0.0008) +[2023-10-08 14:38:35,689][102897] Updated weights for policy 0, policy_version 71960 (0.0008) +[2023-10-08 14:38:36,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 147456000. Throughput: 0: 1802.0, 1: 1785.0. Samples: 36867984. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:36,876][101941] Avg episode reward: [(0, '7.950'), (1, '10.050')] +[2023-10-08 14:38:37,334][102898] Updated weights for policy 1, policy_version 72040 (0.0008) +[2023-10-08 14:38:37,698][102898] Updated weights for policy 1, policy_version 72050 (0.0007) +[2023-10-08 14:38:38,069][102898] Updated weights for policy 1, policy_version 72060 (0.0007) +[2023-10-08 14:38:39,405][102897] Updated weights for policy 0, policy_version 71970 (0.0009) +[2023-10-08 14:38:39,769][102897] Updated weights for policy 0, policy_version 71980 (0.0008) +[2023-10-08 14:38:40,142][102897] Updated weights for policy 0, policy_version 71990 (0.0008) +[2023-10-08 14:38:40,504][102897] Updated weights for policy 0, policy_version 72000 (0.0008) +[2023-10-08 14:38:41,817][102898] Updated weights for policy 1, policy_version 72070 (0.0007) +[2023-10-08 14:38:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147521536. Throughput: 0: 1801.5, 1: 1787.1. Samples: 36889584. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:41,875][101941] Avg episode reward: [(0, '8.160'), (1, '10.080')] +[2023-10-08 14:38:42,187][102898] Updated weights for policy 1, policy_version 72080 (0.0008) +[2023-10-08 14:38:42,557][102898] Updated weights for policy 1, policy_version 72090 (0.0009) +[2023-10-08 14:38:44,274][102897] Updated weights for policy 0, policy_version 72010 (0.0007) +[2023-10-08 14:38:44,643][102897] Updated weights for policy 0, policy_version 72020 (0.0008) +[2023-10-08 14:38:45,013][102897] Updated weights for policy 0, policy_version 72030 (0.0010) +[2023-10-08 14:38:46,296][102898] Updated weights for policy 1, policy_version 72100 (0.0009) +[2023-10-08 14:38:46,667][102898] Updated weights for policy 1, policy_version 72110 (0.0007) +[2023-10-08 14:38:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 147587072. Throughput: 0: 1796.8, 1: 1803.2. Samples: 36911626. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:46,876][101941] Avg episode reward: [(0, '9.010'), (1, '9.980')] +[2023-10-08 14:38:47,033][102898] Updated weights for policy 1, policy_version 72120 (0.0007) +[2023-10-08 14:38:48,668][102897] Updated weights for policy 0, policy_version 72040 (0.0009) +[2023-10-08 14:38:49,041][102897] Updated weights for policy 0, policy_version 72050 (0.0008) +[2023-10-08 14:38:49,409][102897] Updated weights for policy 0, policy_version 72060 (0.0009) +[2023-10-08 14:38:50,891][102898] Updated weights for policy 1, policy_version 72130 (0.0007) +[2023-10-08 14:38:51,262][102898] Updated weights for policy 1, policy_version 72140 (0.0008) +[2023-10-08 14:38:51,625][102898] Updated weights for policy 1, policy_version 72150 (0.0009) +[2023-10-08 14:38:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147652608. Throughput: 0: 1802.1, 1: 1786.5. Samples: 36921946. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:38:51,875][101941] Avg episode reward: [(0, '8.760'), (1, '10.050')] +[2023-10-08 14:38:51,999][102898] Updated weights for policy 1, policy_version 72160 (0.0007) +[2023-10-08 14:38:53,160][102897] Updated weights for policy 0, policy_version 72070 (0.0008) +[2023-10-08 14:38:53,542][102897] Updated weights for policy 0, policy_version 72080 (0.0011) +[2023-10-08 14:38:53,916][102897] Updated weights for policy 0, policy_version 72090 (0.0010) +[2023-10-08 14:38:55,465][102898] Updated weights for policy 1, policy_version 72170 (0.0008) +[2023-10-08 14:38:55,823][102898] Updated weights for policy 1, policy_version 72180 (0.0010) +[2023-10-08 14:38:56,193][102898] Updated weights for policy 1, policy_version 72190 (0.0007) +[2023-10-08 14:38:56,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 147750912. Throughput: 0: 1792.1, 1: 1808.3. Samples: 36943676. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:38:56,875][101941] Avg episode reward: [(0, '8.280'), (1, '10.210')] +[2023-10-08 14:38:57,944][102897] Updated weights for policy 0, policy_version 72100 (0.0009) +[2023-10-08 14:38:58,317][102897] Updated weights for policy 0, policy_version 72110 (0.0007) +[2023-10-08 14:38:58,696][102897] Updated weights for policy 0, policy_version 72120 (0.0008) +[2023-10-08 14:38:59,929][102898] Updated weights for policy 1, policy_version 72200 (0.0010) +[2023-10-08 14:39:00,297][102898] Updated weights for policy 1, policy_version 72210 (0.0008) +[2023-10-08 14:39:00,651][102898] Updated weights for policy 1, policy_version 72220 (0.0010) +[2023-10-08 14:39:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 147816448. Throughput: 0: 1787.5, 1: 1794.8. Samples: 36964800. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:01,876][101941] Avg episode reward: [(0, '8.760'), (1, '9.900')] +[2023-10-08 14:39:02,451][102897] Updated weights for policy 0, policy_version 72130 (0.0009) +[2023-10-08 14:39:02,819][102897] Updated weights for policy 0, policy_version 72140 (0.0007) +[2023-10-08 14:39:03,188][102897] Updated weights for policy 0, policy_version 72150 (0.0008) +[2023-10-08 14:39:03,555][102897] Updated weights for policy 0, policy_version 72160 (0.0007) +[2023-10-08 14:39:04,347][102898] Updated weights for policy 1, policy_version 72230 (0.0009) +[2023-10-08 14:39:04,716][102898] Updated weights for policy 1, policy_version 72240 (0.0007) +[2023-10-08 14:39:05,086][102898] Updated weights for policy 1, policy_version 72250 (0.0007) +[2023-10-08 14:39:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 147881984. Throughput: 0: 1786.9, 1: 1806.8. Samples: 36975580. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:06,876][101941] Avg episode reward: [(0, '8.950'), (1, '9.890')] +[2023-10-08 14:39:07,271][102897] Updated weights for policy 0, policy_version 72170 (0.0008) +[2023-10-08 14:39:07,647][102897] Updated weights for policy 0, policy_version 72180 (0.0008) +[2023-10-08 14:39:08,015][102897] Updated weights for policy 0, policy_version 72190 (0.0008) +[2023-10-08 14:39:08,891][102898] Updated weights for policy 1, policy_version 72260 (0.0008) +[2023-10-08 14:39:09,255][102898] Updated weights for policy 1, policy_version 72270 (0.0009) +[2023-10-08 14:39:09,616][102898] Updated weights for policy 1, policy_version 72280 (0.0009) +[2023-10-08 14:39:11,680][102897] Updated weights for policy 0, policy_version 72200 (0.0009) +[2023-10-08 14:39:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 147947520. Throughput: 0: 1783.9, 1: 1803.9. Samples: 36997062. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:11,877][101941] Avg episode reward: [(0, '9.010'), (1, '9.810')] +[2023-10-08 14:39:12,052][102897] Updated weights for policy 0, policy_version 72210 (0.0010) +[2023-10-08 14:39:12,435][102897] Updated weights for policy 0, policy_version 72220 (0.0009) +[2023-10-08 14:39:13,299][102898] Updated weights for policy 1, policy_version 72290 (0.0009) +[2023-10-08 14:39:13,676][102898] Updated weights for policy 1, policy_version 72300 (0.0008) +[2023-10-08 14:39:14,045][102898] Updated weights for policy 1, policy_version 72310 (0.0007) +[2023-10-08 14:39:14,403][102898] Updated weights for policy 1, policy_version 72320 (0.0008) +[2023-10-08 14:39:16,263][102897] Updated weights for policy 0, policy_version 72230 (0.0009) +[2023-10-08 14:39:16,639][102897] Updated weights for policy 0, policy_version 72240 (0.0009) +[2023-10-08 14:39:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 148013056. Throughput: 0: 1802.8, 1: 1802.1. Samples: 37019100. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:16,876][101941] Avg episode reward: [(0, '7.910'), (1, '9.630')] +[2023-10-08 14:39:17,012][102897] Updated weights for policy 0, policy_version 72250 (0.0007) +[2023-10-08 14:39:18,088][102898] Updated weights for policy 1, policy_version 72330 (0.0008) +[2023-10-08 14:39:18,459][102898] Updated weights for policy 1, policy_version 72340 (0.0007) +[2023-10-08 14:39:18,828][102898] Updated weights for policy 1, policy_version 72350 (0.0009) +[2023-10-08 14:39:20,708][102897] Updated weights for policy 0, policy_version 72260 (0.0008) +[2023-10-08 14:39:21,074][102897] Updated weights for policy 0, policy_version 72270 (0.0008) +[2023-10-08 14:39:21,454][102897] Updated weights for policy 0, policy_version 72280 (0.0009) +[2023-10-08 14:39:21,875][101941] Fps is (10 sec: 16384.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 148111360. Throughput: 0: 1784.4, 1: 1800.9. Samples: 37029320. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:21,875][101941] Avg episode reward: [(0, '7.950'), (1, '9.750')] +[2023-10-08 14:39:22,552][102898] Updated weights for policy 1, policy_version 72360 (0.0007) +[2023-10-08 14:39:22,928][102898] Updated weights for policy 1, policy_version 72370 (0.0007) +[2023-10-08 14:39:23,289][102898] Updated weights for policy 1, policy_version 72380 (0.0009) +[2023-10-08 14:39:25,244][102897] Updated weights for policy 0, policy_version 72290 (0.0008) +[2023-10-08 14:39:25,611][102897] Updated weights for policy 0, policy_version 72300 (0.0008) +[2023-10-08 14:39:25,976][102897] Updated weights for policy 0, policy_version 72310 (0.0009) +[2023-10-08 14:39:26,348][102897] Updated weights for policy 0, policy_version 72320 (0.0008) +[2023-10-08 14:39:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 148176896. Throughput: 0: 1803.7, 1: 1793.5. Samples: 37051458. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:26,875][101941] Avg episode reward: [(0, '7.380'), (1, '9.800')] +[2023-10-08 14:39:27,110][102898] Updated weights for policy 1, policy_version 72390 (0.0009) +[2023-10-08 14:39:27,472][102898] Updated weights for policy 1, policy_version 72400 (0.0008) +[2023-10-08 14:39:27,843][102898] Updated weights for policy 1, policy_version 72410 (0.0008) +[2023-10-08 14:39:29,927][102897] Updated weights for policy 0, policy_version 72330 (0.0007) +[2023-10-08 14:39:30,290][102897] Updated weights for policy 0, policy_version 72340 (0.0009) +[2023-10-08 14:39:30,663][102897] Updated weights for policy 0, policy_version 72350 (0.0010) +[2023-10-08 14:39:31,610][102898] Updated weights for policy 1, policy_version 72420 (0.0008) +[2023-10-08 14:39:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 148242432. Throughput: 0: 1779.8, 1: 1798.6. Samples: 37072656. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:31,875][101941] Avg episode reward: [(0, '7.970'), (1, '9.220')] +[2023-10-08 14:39:31,973][102898] Updated weights for policy 1, policy_version 72430 (0.0009) +[2023-10-08 14:39:32,327][102898] Updated weights for policy 1, policy_version 72440 (0.0010) +[2023-10-08 14:39:34,403][102897] Updated weights for policy 0, policy_version 72360 (0.0009) +[2023-10-08 14:39:34,781][102897] Updated weights for policy 0, policy_version 72370 (0.0007) +[2023-10-08 14:39:35,154][102897] Updated weights for policy 0, policy_version 72380 (0.0009) +[2023-10-08 14:39:36,115][102898] Updated weights for policy 1, policy_version 72450 (0.0008) +[2023-10-08 14:39:36,478][102898] Updated weights for policy 1, policy_version 72460 (0.0008) +[2023-10-08 14:39:36,834][102898] Updated weights for policy 1, policy_version 72470 (0.0008) +[2023-10-08 14:39:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 148307968. Throughput: 0: 1804.8, 1: 1789.0. Samples: 37083670. Policy #0 lag: (min: 14.0, avg: 21.9, max: 46.0) +[2023-10-08 14:39:36,876][101941] Avg episode reward: [(0, '8.150'), (1, '8.970')] +[2023-10-08 14:39:37,195][102898] Updated weights for policy 1, policy_version 72480 (0.0007) +[2023-10-08 14:39:38,760][102897] Updated weights for policy 0, policy_version 72390 (0.0008) +[2023-10-08 14:39:39,133][102897] Updated weights for policy 0, policy_version 72400 (0.0010) +[2023-10-08 14:39:39,509][102897] Updated weights for policy 0, policy_version 72410 (0.0010) +[2023-10-08 14:39:40,926][102898] Updated weights for policy 1, policy_version 72490 (0.0010) +[2023-10-08 14:39:41,288][102898] Updated weights for policy 1, policy_version 72500 (0.0011) +[2023-10-08 14:39:41,659][102898] Updated weights for policy 1, policy_version 72510 (0.0011) +[2023-10-08 14:39:41,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 148406272. Throughput: 0: 1791.6, 1: 1796.6. Samples: 37105144. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:39:41,876][101941] Avg episode reward: [(0, '8.150'), (1, '9.460')] +[2023-10-08 14:39:43,335][102897] Updated weights for policy 0, policy_version 72420 (0.0010) +[2023-10-08 14:39:43,703][102897] Updated weights for policy 0, policy_version 72430 (0.0008) +[2023-10-08 14:39:44,069][102897] Updated weights for policy 0, policy_version 72440 (0.0007) +[2023-10-08 14:39:45,459][102898] Updated weights for policy 1, policy_version 72520 (0.0010) +[2023-10-08 14:39:45,830][102898] Updated weights for policy 1, policy_version 72530 (0.0010) +[2023-10-08 14:39:46,190][102898] Updated weights for policy 1, policy_version 72540 (0.0011) +[2023-10-08 14:39:46,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 148471808. Throughput: 0: 1799.7, 1: 1787.2. Samples: 37126206. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:39:46,875][101941] Avg episode reward: [(0, '8.060'), (1, '9.100')] +[2023-10-08 14:39:47,729][102897] Updated weights for policy 0, policy_version 72450 (0.0007) +[2023-10-08 14:39:48,101][102897] Updated weights for policy 0, policy_version 72460 (0.0008) +[2023-10-08 14:39:48,465][102897] Updated weights for policy 0, policy_version 72470 (0.0008) +[2023-10-08 14:39:48,833][102897] Updated weights for policy 0, policy_version 72480 (0.0008) +[2023-10-08 14:39:50,155][102898] Updated weights for policy 1, policy_version 72550 (0.0010) +[2023-10-08 14:39:50,542][102898] Updated weights for policy 1, policy_version 72560 (0.0010) +[2023-10-08 14:39:50,914][102898] Updated weights for policy 1, policy_version 72570 (0.0008) +[2023-10-08 14:39:51,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 148537344. Throughput: 0: 1801.9, 1: 1791.7. Samples: 37137292. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:39:51,875][101941] Avg episode reward: [(0, '7.670'), (1, '10.010')] +[2023-10-08 14:39:52,455][102897] Updated weights for policy 0, policy_version 72490 (0.0010) +[2023-10-08 14:39:52,832][102897] Updated weights for policy 0, policy_version 72500 (0.0007) +[2023-10-08 14:39:53,193][102897] Updated weights for policy 0, policy_version 72510 (0.0009) +[2023-10-08 14:39:54,912][102898] Updated weights for policy 1, policy_version 72580 (0.0009) +[2023-10-08 14:39:55,288][102898] Updated weights for policy 1, policy_version 72590 (0.0011) +[2023-10-08 14:39:55,657][102898] Updated weights for policy 1, policy_version 72600 (0.0010) +[2023-10-08 14:39:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 148602880. Throughput: 0: 1799.5, 1: 1787.2. Samples: 37158462. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:39:56,875][101941] Avg episode reward: [(0, '7.920'), (1, '9.210')] +[2023-10-08 14:39:57,037][102897] Updated weights for policy 0, policy_version 72520 (0.0010) +[2023-10-08 14:39:57,402][102897] Updated weights for policy 0, policy_version 72530 (0.0007) +[2023-10-08 14:39:57,778][102897] Updated weights for policy 0, policy_version 72540 (0.0009) +[2023-10-08 14:39:59,520][102898] Updated weights for policy 1, policy_version 72610 (0.0010) +[2023-10-08 14:39:59,897][102898] Updated weights for policy 1, policy_version 72620 (0.0010) +[2023-10-08 14:40:00,263][102898] Updated weights for policy 1, policy_version 72630 (0.0009) +[2023-10-08 14:40:00,621][102898] Updated weights for policy 1, policy_version 72640 (0.0009) +[2023-10-08 14:40:01,627][102897] Updated weights for policy 0, policy_version 72550 (0.0010) +[2023-10-08 14:40:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 148668416. Throughput: 0: 1810.8, 1: 1763.3. Samples: 37179932. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:40:01,875][101941] Avg episode reward: [(0, '8.510'), (1, '8.840')] +[2023-10-08 14:40:02,002][102897] Updated weights for policy 0, policy_version 72560 (0.0009) +[2023-10-08 14:40:02,364][102897] Updated weights for policy 0, policy_version 72570 (0.0007) +[2023-10-08 14:40:04,303][102898] Updated weights for policy 1, policy_version 72650 (0.0008) +[2023-10-08 14:40:04,677][102898] Updated weights for policy 1, policy_version 72660 (0.0007) +[2023-10-08 14:40:05,036][102898] Updated weights for policy 1, policy_version 72670 (0.0009) +[2023-10-08 14:40:06,188][102897] Updated weights for policy 0, policy_version 72580 (0.0007) +[2023-10-08 14:40:06,558][102897] Updated weights for policy 0, policy_version 72590 (0.0007) +[2023-10-08 14:40:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 148733952. Throughput: 0: 1797.5, 1: 1782.2. Samples: 37190408. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:40:06,876][101941] Avg episode reward: [(0, '7.920'), (1, '9.050')] +[2023-10-08 14:40:06,932][102897] Updated weights for policy 0, policy_version 72600 (0.0007) +[2023-10-08 14:40:08,939][102898] Updated weights for policy 1, policy_version 72680 (0.0009) +[2023-10-08 14:40:09,305][102898] Updated weights for policy 1, policy_version 72690 (0.0008) +[2023-10-08 14:40:09,664][102898] Updated weights for policy 1, policy_version 72700 (0.0007) +[2023-10-08 14:40:10,587][102897] Updated weights for policy 0, policy_version 72610 (0.0009) +[2023-10-08 14:40:10,949][102897] Updated weights for policy 0, policy_version 72620 (0.0010) +[2023-10-08 14:40:11,328][102897] Updated weights for policy 0, policy_version 72630 (0.0010) +[2023-10-08 14:40:11,700][102897] Updated weights for policy 0, policy_version 72640 (0.0009) +[2023-10-08 14:40:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 148832256. Throughput: 0: 1803.5, 1: 1763.1. Samples: 37211954. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:40:11,876][101941] Avg episode reward: [(0, '8.590'), (1, '9.450')] +[2023-10-08 14:40:13,486][102898] Updated weights for policy 1, policy_version 72710 (0.0007) +[2023-10-08 14:40:13,853][102898] Updated weights for policy 1, policy_version 72720 (0.0008) +[2023-10-08 14:40:14,210][102898] Updated weights for policy 1, policy_version 72730 (0.0009) +[2023-10-08 14:40:15,650][102897] Updated weights for policy 0, policy_version 72650 (0.0010) +[2023-10-08 14:40:16,024][102897] Updated weights for policy 0, policy_version 72660 (0.0007) +[2023-10-08 14:40:16,397][102897] Updated weights for policy 0, policy_version 72670 (0.0007) +[2023-10-08 14:40:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 148897792. Throughput: 0: 1795.0, 1: 1767.4. Samples: 37232966. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:40:16,876][101941] Avg episode reward: [(0, '8.820'), (1, '9.650')] +[2023-10-08 14:40:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000072672_74416128.pth... +[2023-10-08 14:40:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000072736_74481664.pth... +[2023-10-08 14:40:16,920][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000071072_72777728.pth +[2023-10-08 14:40:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000070976_72679424.pth +[2023-10-08 14:40:18,234][102898] Updated weights for policy 1, policy_version 72740 (0.0008) +[2023-10-08 14:40:18,596][102898] Updated weights for policy 1, policy_version 72750 (0.0011) +[2023-10-08 14:40:18,956][102898] Updated weights for policy 1, policy_version 72760 (0.0010) +[2023-10-08 14:40:20,184][102897] Updated weights for policy 0, policy_version 72680 (0.0007) +[2023-10-08 14:40:20,543][102897] Updated weights for policy 0, policy_version 72690 (0.0008) +[2023-10-08 14:40:20,911][102897] Updated weights for policy 0, policy_version 72700 (0.0007) +[2023-10-08 14:40:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 148963328. Throughput: 0: 1793.8, 1: 1767.5. Samples: 37243926. Policy #0 lag: (min: 1.0, avg: 13.4, max: 33.0) +[2023-10-08 14:40:21,875][101941] Avg episode reward: [(0, '8.340'), (1, '9.360')] +[2023-10-08 14:40:22,694][102898] Updated weights for policy 1, policy_version 72770 (0.0008) +[2023-10-08 14:40:23,064][102898] Updated weights for policy 1, policy_version 72780 (0.0008) +[2023-10-08 14:40:23,424][102898] Updated weights for policy 1, policy_version 72790 (0.0008) +[2023-10-08 14:40:23,792][102898] Updated weights for policy 1, policy_version 72800 (0.0007) +[2023-10-08 14:40:24,550][102897] Updated weights for policy 0, policy_version 72710 (0.0008) +[2023-10-08 14:40:24,918][102897] Updated weights for policy 0, policy_version 72720 (0.0008) +[2023-10-08 14:40:25,288][102897] Updated weights for policy 0, policy_version 72730 (0.0009) +[2023-10-08 14:40:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 149028864. Throughput: 0: 1791.1, 1: 1769.7. Samples: 37265376. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:26,875][101941] Avg episode reward: [(0, '8.440'), (1, '10.160')] +[2023-10-08 14:40:27,441][102898] Updated weights for policy 1, policy_version 72810 (0.0009) +[2023-10-08 14:40:27,809][102898] Updated weights for policy 1, policy_version 72820 (0.0007) +[2023-10-08 14:40:28,173][102898] Updated weights for policy 1, policy_version 72830 (0.0007) +[2023-10-08 14:40:29,074][102897] Updated weights for policy 0, policy_version 72740 (0.0010) +[2023-10-08 14:40:29,453][102897] Updated weights for policy 0, policy_version 72750 (0.0010) +[2023-10-08 14:40:29,820][102897] Updated weights for policy 0, policy_version 72760 (0.0009) +[2023-10-08 14:40:31,717][102898] Updated weights for policy 1, policy_version 72840 (0.0007) +[2023-10-08 14:40:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 149094400. Throughput: 0: 1777.1, 1: 1803.2. Samples: 37287324. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:31,876][101941] Avg episode reward: [(0, '9.110'), (1, '10.310')] +[2023-10-08 14:40:32,082][102898] Updated weights for policy 1, policy_version 72850 (0.0007) +[2023-10-08 14:40:32,438][102898] Updated weights for policy 1, policy_version 72860 (0.0010) +[2023-10-08 14:40:33,509][102897] Updated weights for policy 0, policy_version 72770 (0.0009) +[2023-10-08 14:40:33,875][102897] Updated weights for policy 0, policy_version 72780 (0.0009) +[2023-10-08 14:40:34,245][102897] Updated weights for policy 0, policy_version 72790 (0.0010) +[2023-10-08 14:40:34,617][102897] Updated weights for policy 0, policy_version 72800 (0.0010) +[2023-10-08 14:40:36,503][102898] Updated weights for policy 1, policy_version 72870 (0.0009) +[2023-10-08 14:40:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 149159936. Throughput: 0: 1784.5, 1: 1773.8. Samples: 37297416. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:36,876][101941] Avg episode reward: [(0, '9.450'), (1, '10.610')] +[2023-10-08 14:40:36,877][102634] Saving new best policy, reward=9.450! +[2023-10-08 14:40:36,890][102898] Updated weights for policy 1, policy_version 72880 (0.0010) +[2023-10-08 14:40:37,250][102898] Updated weights for policy 1, policy_version 72890 (0.0007) +[2023-10-08 14:40:38,306][102897] Updated weights for policy 0, policy_version 72810 (0.0011) +[2023-10-08 14:40:38,670][102897] Updated weights for policy 0, policy_version 72820 (0.0011) +[2023-10-08 14:40:39,036][102897] Updated weights for policy 0, policy_version 72830 (0.0011) +[2023-10-08 14:40:41,071][102898] Updated weights for policy 1, policy_version 72900 (0.0009) +[2023-10-08 14:40:41,443][102898] Updated weights for policy 1, policy_version 72910 (0.0008) +[2023-10-08 14:40:41,807][102898] Updated weights for policy 1, policy_version 72920 (0.0008) +[2023-10-08 14:40:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 14329.0). Total num frames: 149225472. Throughput: 0: 1775.5, 1: 1796.6. Samples: 37319204. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:41,876][101941] Avg episode reward: [(0, '9.050'), (1, '10.090')] +[2023-10-08 14:40:42,906][102897] Updated weights for policy 0, policy_version 72840 (0.0008) +[2023-10-08 14:40:43,277][102897] Updated weights for policy 0, policy_version 72850 (0.0010) +[2023-10-08 14:40:43,643][102897] Updated weights for policy 0, policy_version 72860 (0.0010) +[2023-10-08 14:40:45,487][102898] Updated weights for policy 1, policy_version 72930 (0.0009) +[2023-10-08 14:40:45,850][102898] Updated weights for policy 1, policy_version 72940 (0.0008) +[2023-10-08 14:40:46,224][102898] Updated weights for policy 1, policy_version 72950 (0.0008) +[2023-10-08 14:40:46,586][102898] Updated weights for policy 1, policy_version 72960 (0.0009) +[2023-10-08 14:40:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 149323776. Throughput: 0: 1771.7, 1: 1785.9. Samples: 37340024. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:46,876][101941] Avg episode reward: [(0, '8.470'), (1, '10.690')] +[2023-10-08 14:40:46,885][102760] Saving new best policy, reward=10.690! +[2023-10-08 14:40:47,756][102897] Updated weights for policy 0, policy_version 72870 (0.0008) +[2023-10-08 14:40:48,131][102897] Updated weights for policy 0, policy_version 72880 (0.0009) +[2023-10-08 14:40:48,509][102897] Updated weights for policy 0, policy_version 72890 (0.0009) +[2023-10-08 14:40:50,277][102898] Updated weights for policy 1, policy_version 72970 (0.0008) +[2023-10-08 14:40:50,645][102898] Updated weights for policy 1, policy_version 72980 (0.0009) +[2023-10-08 14:40:51,012][102898] Updated weights for policy 1, policy_version 72990 (0.0009) +[2023-10-08 14:40:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 149389312. Throughput: 0: 1770.5, 1: 1795.2. Samples: 37350862. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:51,876][101941] Avg episode reward: [(0, '8.070'), (1, '10.680')] +[2023-10-08 14:40:52,198][102897] Updated weights for policy 0, policy_version 72900 (0.0007) +[2023-10-08 14:40:52,569][102897] Updated weights for policy 0, policy_version 72910 (0.0008) +[2023-10-08 14:40:52,941][102897] Updated weights for policy 0, policy_version 72920 (0.0009) +[2023-10-08 14:40:54,721][102898] Updated weights for policy 1, policy_version 73000 (0.0007) +[2023-10-08 14:40:55,083][102898] Updated weights for policy 1, policy_version 73010 (0.0007) +[2023-10-08 14:40:55,449][102898] Updated weights for policy 1, policy_version 73020 (0.0009) +[2023-10-08 14:40:56,637][102897] Updated weights for policy 0, policy_version 72930 (0.0010) +[2023-10-08 14:40:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 149454848. Throughput: 0: 1770.4, 1: 1796.0. Samples: 37372438. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:40:56,876][101941] Avg episode reward: [(0, '8.220'), (1, '10.270')] +[2023-10-08 14:40:57,009][102897] Updated weights for policy 0, policy_version 72940 (0.0007) +[2023-10-08 14:40:57,385][102897] Updated weights for policy 0, policy_version 72950 (0.0007) +[2023-10-08 14:40:57,761][102897] Updated weights for policy 0, policy_version 72960 (0.0007) +[2023-10-08 14:40:59,244][102898] Updated weights for policy 1, policy_version 73030 (0.0009) +[2023-10-08 14:40:59,620][102898] Updated weights for policy 1, policy_version 73040 (0.0009) +[2023-10-08 14:40:59,984][102898] Updated weights for policy 1, policy_version 73050 (0.0010) +[2023-10-08 14:41:01,595][102897] Updated weights for policy 0, policy_version 72970 (0.0008) +[2023-10-08 14:41:01,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 149520384. Throughput: 0: 1799.4, 1: 1786.9. Samples: 37394346. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:41:01,875][101941] Avg episode reward: [(0, '8.090'), (1, '8.720')] +[2023-10-08 14:41:01,964][102897] Updated weights for policy 0, policy_version 72980 (0.0007) +[2023-10-08 14:41:02,348][102897] Updated weights for policy 0, policy_version 72990 (0.0009) +[2023-10-08 14:41:03,571][102898] Updated weights for policy 1, policy_version 73060 (0.0010) +[2023-10-08 14:41:03,925][102898] Updated weights for policy 1, policy_version 73070 (0.0009) +[2023-10-08 14:41:04,286][102898] Updated weights for policy 1, policy_version 73080 (0.0007) +[2023-10-08 14:41:06,104][102897] Updated weights for policy 0, policy_version 73000 (0.0008) +[2023-10-08 14:41:06,487][102897] Updated weights for policy 0, policy_version 73010 (0.0010) +[2023-10-08 14:41:06,853][102897] Updated weights for policy 0, policy_version 73020 (0.0007) +[2023-10-08 14:41:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 149585920. Throughput: 0: 1776.6, 1: 1797.5. Samples: 37404758. Policy #0 lag: (min: 19.0, avg: 19.0, max: 19.0) +[2023-10-08 14:41:06,876][101941] Avg episode reward: [(0, '8.060'), (1, '9.000')] +[2023-10-08 14:41:07,985][102898] Updated weights for policy 1, policy_version 73090 (0.0009) +[2023-10-08 14:41:08,352][102898] Updated weights for policy 1, policy_version 73100 (0.0007) +[2023-10-08 14:41:08,722][102898] Updated weights for policy 1, policy_version 73110 (0.0009) +[2023-10-08 14:41:09,081][102898] Updated weights for policy 1, policy_version 73120 (0.0009) +[2023-10-08 14:41:10,590][102897] Updated weights for policy 0, policy_version 73030 (0.0010) +[2023-10-08 14:41:10,968][102897] Updated weights for policy 0, policy_version 73040 (0.0009) +[2023-10-08 14:41:11,333][102897] Updated weights for policy 0, policy_version 73050 (0.0010) +[2023-10-08 14:41:11,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 149684224. Throughput: 0: 1804.1, 1: 1788.3. Samples: 37427034. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:11,876][101941] Avg episode reward: [(0, '8.790'), (1, '9.660')] +[2023-10-08 14:41:12,978][102898] Updated weights for policy 1, policy_version 73130 (0.0007) +[2023-10-08 14:41:13,344][102898] Updated weights for policy 1, policy_version 73140 (0.0008) +[2023-10-08 14:41:13,712][102898] Updated weights for policy 1, policy_version 73150 (0.0008) +[2023-10-08 14:41:15,012][102897] Updated weights for policy 0, policy_version 73060 (0.0008) +[2023-10-08 14:41:15,386][102897] Updated weights for policy 0, policy_version 73070 (0.0008) +[2023-10-08 14:41:15,756][102897] Updated weights for policy 0, policy_version 73080 (0.0009) +[2023-10-08 14:41:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 149749760. Throughput: 0: 1782.3, 1: 1789.5. Samples: 37448054. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:16,876][101941] Avg episode reward: [(0, '8.950'), (1, '10.170')] +[2023-10-08 14:41:17,481][102898] Updated weights for policy 1, policy_version 73160 (0.0009) +[2023-10-08 14:41:17,856][102898] Updated weights for policy 1, policy_version 73170 (0.0007) +[2023-10-08 14:41:18,216][102898] Updated weights for policy 1, policy_version 73180 (0.0009) +[2023-10-08 14:41:19,431][102897] Updated weights for policy 0, policy_version 73090 (0.0007) +[2023-10-08 14:41:19,796][102897] Updated weights for policy 0, policy_version 73100 (0.0009) +[2023-10-08 14:41:20,171][102897] Updated weights for policy 0, policy_version 73110 (0.0008) +[2023-10-08 14:41:20,537][102897] Updated weights for policy 0, policy_version 73120 (0.0008) +[2023-10-08 14:41:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 149815296. Throughput: 0: 1806.5, 1: 1788.6. Samples: 37459196. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:21,876][101941] Avg episode reward: [(0, '8.810'), (1, '10.090')] +[2023-10-08 14:41:21,996][102898] Updated weights for policy 1, policy_version 73190 (0.0008) +[2023-10-08 14:41:22,375][102898] Updated weights for policy 1, policy_version 73200 (0.0009) +[2023-10-08 14:41:22,741][102898] Updated weights for policy 1, policy_version 73210 (0.0008) +[2023-10-08 14:41:24,393][102897] Updated weights for policy 0, policy_version 73130 (0.0009) +[2023-10-08 14:41:24,758][102897] Updated weights for policy 0, policy_version 73140 (0.0009) +[2023-10-08 14:41:25,138][102897] Updated weights for policy 0, policy_version 73150 (0.0010) +[2023-10-08 14:41:26,500][102898] Updated weights for policy 1, policy_version 73220 (0.0007) +[2023-10-08 14:41:26,866][102898] Updated weights for policy 1, policy_version 73230 (0.0010) +[2023-10-08 14:41:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 149880832. Throughput: 0: 1783.8, 1: 1790.1. Samples: 37480032. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:26,876][101941] Avg episode reward: [(0, '8.180'), (1, '10.360')] +[2023-10-08 14:41:27,232][102898] Updated weights for policy 1, policy_version 73240 (0.0007) +[2023-10-08 14:41:28,907][102897] Updated weights for policy 0, policy_version 73160 (0.0008) +[2023-10-08 14:41:29,277][102897] Updated weights for policy 0, policy_version 73170 (0.0009) +[2023-10-08 14:41:29,645][102897] Updated weights for policy 0, policy_version 73180 (0.0007) +[2023-10-08 14:41:30,843][102898] Updated weights for policy 1, policy_version 73250 (0.0007) +[2023-10-08 14:41:31,214][102898] Updated weights for policy 1, policy_version 73260 (0.0007) +[2023-10-08 14:41:31,584][102898] Updated weights for policy 1, policy_version 73270 (0.0007) +[2023-10-08 14:41:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 149946368. Throughput: 0: 1788.8, 1: 1803.7. Samples: 37501684. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:31,876][101941] Avg episode reward: [(0, '7.700'), (1, '10.420')] +[2023-10-08 14:41:31,956][102898] Updated weights for policy 1, policy_version 73280 (0.0008) +[2023-10-08 14:41:33,477][102897] Updated weights for policy 0, policy_version 73190 (0.0008) +[2023-10-08 14:41:33,869][102897] Updated weights for policy 0, policy_version 73200 (0.0008) +[2023-10-08 14:41:34,233][102897] Updated weights for policy 0, policy_version 73210 (0.0010) +[2023-10-08 14:41:35,627][102898] Updated weights for policy 1, policy_version 73290 (0.0007) +[2023-10-08 14:41:35,996][102898] Updated weights for policy 1, policy_version 73300 (0.0009) +[2023-10-08 14:41:36,360][102898] Updated weights for policy 1, policy_version 73310 (0.0008) +[2023-10-08 14:41:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 150044672. Throughput: 0: 1789.7, 1: 1798.5. Samples: 37512332. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:36,876][101941] Avg episode reward: [(0, '7.960'), (1, '10.530')] +[2023-10-08 14:41:37,867][102897] Updated weights for policy 0, policy_version 73220 (0.0009) +[2023-10-08 14:41:38,237][102897] Updated weights for policy 0, policy_version 73230 (0.0007) +[2023-10-08 14:41:38,600][102897] Updated weights for policy 0, policy_version 73240 (0.0010) +[2023-10-08 14:41:40,130][102898] Updated weights for policy 1, policy_version 73320 (0.0010) +[2023-10-08 14:41:40,500][102898] Updated weights for policy 1, policy_version 73330 (0.0010) +[2023-10-08 14:41:40,873][102898] Updated weights for policy 1, policy_version 73340 (0.0008) +[2023-10-08 14:41:41,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 150110208. Throughput: 0: 1785.8, 1: 1812.2. Samples: 37534348. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:41,876][101941] Avg episode reward: [(0, '8.670'), (1, '10.300')] +[2023-10-08 14:41:42,444][102897] Updated weights for policy 0, policy_version 73250 (0.0008) +[2023-10-08 14:41:42,810][102897] Updated weights for policy 0, policy_version 73260 (0.0009) +[2023-10-08 14:41:43,187][102897] Updated weights for policy 0, policy_version 73270 (0.0009) +[2023-10-08 14:41:43,564][102897] Updated weights for policy 0, policy_version 73280 (0.0009) +[2023-10-08 14:41:44,562][102898] Updated weights for policy 1, policy_version 73350 (0.0008) +[2023-10-08 14:41:44,917][102898] Updated weights for policy 1, policy_version 73360 (0.0007) +[2023-10-08 14:41:45,282][102898] Updated weights for policy 1, policy_version 73370 (0.0010) +[2023-10-08 14:41:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150175744. Throughput: 0: 1792.9, 1: 1802.8. Samples: 37556152. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:46,875][101941] Avg episode reward: [(0, '8.750'), (1, '8.970')] +[2023-10-08 14:41:47,364][102897] Updated weights for policy 0, policy_version 73290 (0.0007) +[2023-10-08 14:41:47,726][102897] Updated weights for policy 0, policy_version 73300 (0.0007) +[2023-10-08 14:41:48,102][102897] Updated weights for policy 0, policy_version 73310 (0.0007) +[2023-10-08 14:41:48,976][102898] Updated weights for policy 1, policy_version 73380 (0.0010) +[2023-10-08 14:41:49,341][102898] Updated weights for policy 1, policy_version 73390 (0.0010) +[2023-10-08 14:41:49,705][102898] Updated weights for policy 1, policy_version 73400 (0.0008) +[2023-10-08 14:41:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150241280. Throughput: 0: 1785.7, 1: 1812.0. Samples: 37566654. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:51,876][101941] Avg episode reward: [(0, '8.880'), (1, '9.870')] +[2023-10-08 14:41:51,974][102897] Updated weights for policy 0, policy_version 73320 (0.0008) +[2023-10-08 14:41:52,348][102897] Updated weights for policy 0, policy_version 73330 (0.0008) +[2023-10-08 14:41:52,724][102897] Updated weights for policy 0, policy_version 73340 (0.0007) +[2023-10-08 14:41:53,587][102898] Updated weights for policy 1, policy_version 73410 (0.0008) +[2023-10-08 14:41:53,948][102898] Updated weights for policy 1, policy_version 73420 (0.0009) +[2023-10-08 14:41:54,310][102898] Updated weights for policy 1, policy_version 73430 (0.0009) +[2023-10-08 14:41:54,677][102898] Updated weights for policy 1, policy_version 73440 (0.0010) +[2023-10-08 14:41:56,607][102897] Updated weights for policy 0, policy_version 73350 (0.0008) +[2023-10-08 14:41:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150306816. Throughput: 0: 1777.6, 1: 1797.8. Samples: 37587928. Policy #0 lag: (min: 31.0, avg: 38.0, max: 63.0) +[2023-10-08 14:41:56,876][101941] Avg episode reward: [(0, '8.110'), (1, '10.750')] +[2023-10-08 14:41:56,877][102760] Saving new best policy, reward=10.750! +[2023-10-08 14:41:56,984][102897] Updated weights for policy 0, policy_version 73360 (0.0007) +[2023-10-08 14:41:57,351][102897] Updated weights for policy 0, policy_version 73370 (0.0008) +[2023-10-08 14:41:58,376][102898] Updated weights for policy 1, policy_version 73450 (0.0007) +[2023-10-08 14:41:58,739][102898] Updated weights for policy 1, policy_version 73460 (0.0007) +[2023-10-08 14:41:59,099][102898] Updated weights for policy 1, policy_version 73470 (0.0010) +[2023-10-08 14:42:00,969][102897] Updated weights for policy 0, policy_version 73380 (0.0008) +[2023-10-08 14:42:01,335][102897] Updated weights for policy 0, policy_version 73390 (0.0009) +[2023-10-08 14:42:01,705][102897] Updated weights for policy 0, policy_version 73400 (0.0008) +[2023-10-08 14:42:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150372352. Throughput: 0: 1795.3, 1: 1802.5. Samples: 37609954. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:01,875][101941] Avg episode reward: [(0, '8.270'), (1, '10.370')] +[2023-10-08 14:42:02,766][102898] Updated weights for policy 1, policy_version 73480 (0.0008) +[2023-10-08 14:42:03,132][102898] Updated weights for policy 1, policy_version 73490 (0.0009) +[2023-10-08 14:42:03,494][102898] Updated weights for policy 1, policy_version 73500 (0.0008) +[2023-10-08 14:42:05,531][102897] Updated weights for policy 0, policy_version 73410 (0.0009) +[2023-10-08 14:42:05,899][102897] Updated weights for policy 0, policy_version 73420 (0.0009) +[2023-10-08 14:42:06,263][102897] Updated weights for policy 0, policy_version 73430 (0.0008) +[2023-10-08 14:42:06,634][102897] Updated weights for policy 0, policy_version 73440 (0.0007) +[2023-10-08 14:42:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 150470656. Throughput: 0: 1782.6, 1: 1801.7. Samples: 37620492. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:06,876][101941] Avg episode reward: [(0, '8.270'), (1, '10.020')] +[2023-10-08 14:42:07,424][102898] Updated weights for policy 1, policy_version 73510 (0.0007) +[2023-10-08 14:42:07,803][102898] Updated weights for policy 1, policy_version 73520 (0.0008) +[2023-10-08 14:42:08,175][102898] Updated weights for policy 1, policy_version 73530 (0.0008) +[2023-10-08 14:42:10,293][102897] Updated weights for policy 0, policy_version 73450 (0.0007) +[2023-10-08 14:42:10,667][102897] Updated weights for policy 0, policy_version 73460 (0.0007) +[2023-10-08 14:42:11,028][102897] Updated weights for policy 0, policy_version 73470 (0.0007) +[2023-10-08 14:42:11,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 150536192. Throughput: 0: 1802.3, 1: 1803.2. Samples: 37642276. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:11,876][101941] Avg episode reward: [(0, '8.200'), (1, '9.820')] +[2023-10-08 14:42:12,036][102898] Updated weights for policy 1, policy_version 73540 (0.0009) +[2023-10-08 14:42:12,410][102898] Updated weights for policy 1, policy_version 73550 (0.0008) +[2023-10-08 14:42:12,779][102898] Updated weights for policy 1, policy_version 73560 (0.0007) +[2023-10-08 14:42:14,759][102897] Updated weights for policy 0, policy_version 73480 (0.0008) +[2023-10-08 14:42:15,132][102897] Updated weights for policy 0, policy_version 73490 (0.0011) +[2023-10-08 14:42:15,493][102897] Updated weights for policy 0, policy_version 73500 (0.0010) +[2023-10-08 14:42:16,522][102898] Updated weights for policy 1, policy_version 73570 (0.0009) +[2023-10-08 14:42:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150601728. Throughput: 0: 1782.8, 1: 1817.7. Samples: 37663708. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:16,876][101941] Avg episode reward: [(0, '7.900'), (1, '10.080')] +[2023-10-08 14:42:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000073504_75268096.pth... +[2023-10-08 14:42:16,891][102898] Updated weights for policy 1, policy_version 73580 (0.0010) +[2023-10-08 14:42:16,928][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000071840_73564160.pth +[2023-10-08 14:42:17,258][102898] Updated weights for policy 1, policy_version 73590 (0.0009) +[2023-10-08 14:42:17,620][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000073600_75366400.pth... +[2023-10-08 14:42:17,622][102898] Updated weights for policy 1, policy_version 73600 (0.0007) +[2023-10-08 14:42:17,649][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000071904_73629696.pth +[2023-10-08 14:42:19,147][102897] Updated weights for policy 0, policy_version 73510 (0.0011) +[2023-10-08 14:42:19,541][102897] Updated weights for policy 0, policy_version 73520 (0.0009) +[2023-10-08 14:42:19,913][102897] Updated weights for policy 0, policy_version 73530 (0.0007) +[2023-10-08 14:42:21,522][102898] Updated weights for policy 1, policy_version 73610 (0.0008) +[2023-10-08 14:42:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150667264. Throughput: 0: 1805.9, 1: 1792.4. Samples: 37674254. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:21,875][101941] Avg episode reward: [(0, '8.270'), (1, '9.610')] +[2023-10-08 14:42:21,900][102898] Updated weights for policy 1, policy_version 73620 (0.0010) +[2023-10-08 14:42:22,260][102898] Updated weights for policy 1, policy_version 73630 (0.0007) +[2023-10-08 14:42:23,591][102897] Updated weights for policy 0, policy_version 73540 (0.0009) +[2023-10-08 14:42:23,955][102897] Updated weights for policy 0, policy_version 73550 (0.0009) +[2023-10-08 14:42:24,329][102897] Updated weights for policy 0, policy_version 73560 (0.0008) +[2023-10-08 14:42:25,983][102898] Updated weights for policy 1, policy_version 73640 (0.0007) +[2023-10-08 14:42:26,357][102898] Updated weights for policy 1, policy_version 73650 (0.0008) +[2023-10-08 14:42:26,717][102898] Updated weights for policy 1, policy_version 73660 (0.0007) +[2023-10-08 14:42:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 150765568. Throughput: 0: 1780.9, 1: 1800.5. Samples: 37695510. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:26,876][101941] Avg episode reward: [(0, '8.530'), (1, '10.010')] +[2023-10-08 14:42:28,113][102897] Updated weights for policy 0, policy_version 73570 (0.0010) +[2023-10-08 14:42:28,490][102897] Updated weights for policy 0, policy_version 73580 (0.0007) +[2023-10-08 14:42:28,857][102897] Updated weights for policy 0, policy_version 73590 (0.0008) +[2023-10-08 14:42:29,227][102897] Updated weights for policy 0, policy_version 73600 (0.0009) +[2023-10-08 14:42:30,246][102898] Updated weights for policy 1, policy_version 73670 (0.0009) +[2023-10-08 14:42:30,619][102898] Updated weights for policy 1, policy_version 73680 (0.0009) +[2023-10-08 14:42:30,978][102898] Updated weights for policy 1, policy_version 73690 (0.0009) +[2023-10-08 14:42:31,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 150831104. Throughput: 0: 1780.1, 1: 1787.1. Samples: 37716680. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:31,876][101941] Avg episode reward: [(0, '9.140'), (1, '10.050')] +[2023-10-08 14:42:32,983][102897] Updated weights for policy 0, policy_version 73610 (0.0008) +[2023-10-08 14:42:33,351][102897] Updated weights for policy 0, policy_version 73620 (0.0007) +[2023-10-08 14:42:33,720][102897] Updated weights for policy 0, policy_version 73630 (0.0008) +[2023-10-08 14:42:34,874][102898] Updated weights for policy 1, policy_version 73700 (0.0009) +[2023-10-08 14:42:35,241][102898] Updated weights for policy 1, policy_version 73710 (0.0008) +[2023-10-08 14:42:35,605][102898] Updated weights for policy 1, policy_version 73720 (0.0009) +[2023-10-08 14:42:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150896640. Throughput: 0: 1781.8, 1: 1798.2. Samples: 37727756. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:36,876][101941] Avg episode reward: [(0, '9.080'), (1, '10.440')] +[2023-10-08 14:42:37,412][102897] Updated weights for policy 0, policy_version 73640 (0.0009) +[2023-10-08 14:42:37,789][102897] Updated weights for policy 0, policy_version 73650 (0.0007) +[2023-10-08 14:42:38,161][102897] Updated weights for policy 0, policy_version 73660 (0.0008) +[2023-10-08 14:42:39,332][102898] Updated weights for policy 1, policy_version 73730 (0.0010) +[2023-10-08 14:42:39,696][102898] Updated weights for policy 1, policy_version 73740 (0.0007) +[2023-10-08 14:42:40,065][102898] Updated weights for policy 1, policy_version 73750 (0.0008) +[2023-10-08 14:42:40,434][102898] Updated weights for policy 1, policy_version 73760 (0.0010) +[2023-10-08 14:42:41,798][102897] Updated weights for policy 0, policy_version 73670 (0.0008) +[2023-10-08 14:42:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 150962176. Throughput: 0: 1794.8, 1: 1786.0. Samples: 37749064. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:41,875][101941] Avg episode reward: [(0, '9.100'), (1, '9.870')] +[2023-10-08 14:42:42,174][102897] Updated weights for policy 0, policy_version 73680 (0.0007) +[2023-10-08 14:42:42,542][102897] Updated weights for policy 0, policy_version 73690 (0.0007) +[2023-10-08 14:42:44,207][102898] Updated weights for policy 1, policy_version 73770 (0.0011) +[2023-10-08 14:42:44,580][102898] Updated weights for policy 1, policy_version 73780 (0.0007) +[2023-10-08 14:42:44,941][102898] Updated weights for policy 1, policy_version 73790 (0.0008) +[2023-10-08 14:42:46,307][102897] Updated weights for policy 0, policy_version 73700 (0.0008) +[2023-10-08 14:42:46,679][102897] Updated weights for policy 0, policy_version 73710 (0.0009) +[2023-10-08 14:42:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 151027712. Throughput: 0: 1808.2, 1: 1780.5. Samples: 37771446. Policy #0 lag: (min: 31.0, avg: 36.6, max: 63.0) +[2023-10-08 14:42:46,876][101941] Avg episode reward: [(0, '9.090'), (1, '10.390')] +[2023-10-08 14:42:47,059][102897] Updated weights for policy 0, policy_version 73720 (0.0007) +[2023-10-08 14:42:48,643][102898] Updated weights for policy 1, policy_version 73800 (0.0007) +[2023-10-08 14:42:48,997][102898] Updated weights for policy 1, policy_version 73810 (0.0010) +[2023-10-08 14:42:49,368][102898] Updated weights for policy 1, policy_version 73820 (0.0010) +[2023-10-08 14:42:50,986][102897] Updated weights for policy 0, policy_version 73730 (0.0007) +[2023-10-08 14:42:51,360][102897] Updated weights for policy 0, policy_version 73740 (0.0008) +[2023-10-08 14:42:51,732][102897] Updated weights for policy 0, policy_version 73750 (0.0009) +[2023-10-08 14:42:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151093248. Throughput: 0: 1795.3, 1: 1787.0. Samples: 37781694. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:42:51,875][101941] Avg episode reward: [(0, '9.790'), (1, '9.750')] +[2023-10-08 14:42:52,101][102634] Saving new best policy, reward=9.790! +[2023-10-08 14:42:52,105][102897] Updated weights for policy 0, policy_version 73760 (0.0007) +[2023-10-08 14:42:53,089][102898] Updated weights for policy 1, policy_version 73830 (0.0008) +[2023-10-08 14:42:53,460][102898] Updated weights for policy 1, policy_version 73840 (0.0007) +[2023-10-08 14:42:53,835][102898] Updated weights for policy 1, policy_version 73850 (0.0008) +[2023-10-08 14:42:55,903][102897] Updated weights for policy 0, policy_version 73770 (0.0011) +[2023-10-08 14:42:56,277][102897] Updated weights for policy 0, policy_version 73780 (0.0010) +[2023-10-08 14:42:56,644][102897] Updated weights for policy 0, policy_version 73790 (0.0009) +[2023-10-08 14:42:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 151191552. Throughput: 0: 1807.8, 1: 1784.7. Samples: 37803938. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:42:56,876][101941] Avg episode reward: [(0, '9.130'), (1, '9.800')] +[2023-10-08 14:42:57,581][102898] Updated weights for policy 1, policy_version 73860 (0.0009) +[2023-10-08 14:42:57,968][102898] Updated weights for policy 1, policy_version 73870 (0.0007) +[2023-10-08 14:42:58,323][102898] Updated weights for policy 1, policy_version 73880 (0.0007) +[2023-10-08 14:43:00,350][102897] Updated weights for policy 0, policy_version 73800 (0.0007) +[2023-10-08 14:43:00,719][102897] Updated weights for policy 0, policy_version 73810 (0.0007) +[2023-10-08 14:43:01,097][102897] Updated weights for policy 0, policy_version 73820 (0.0011) +[2023-10-08 14:43:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 151257088. Throughput: 0: 1790.5, 1: 1783.8. Samples: 37824550. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:01,876][101941] Avg episode reward: [(0, '8.840'), (1, '11.430')] +[2023-10-08 14:43:01,885][102760] Saving new best policy, reward=11.430! +[2023-10-08 14:43:02,165][102898] Updated weights for policy 1, policy_version 73890 (0.0007) +[2023-10-08 14:43:02,522][102898] Updated weights for policy 1, policy_version 73900 (0.0008) +[2023-10-08 14:43:02,892][102898] Updated weights for policy 1, policy_version 73910 (0.0011) +[2023-10-08 14:43:03,258][102898] Updated weights for policy 1, policy_version 73920 (0.0010) +[2023-10-08 14:43:05,054][102897] Updated weights for policy 0, policy_version 73830 (0.0010) +[2023-10-08 14:43:05,441][102897] Updated weights for policy 0, policy_version 73840 (0.0007) +[2023-10-08 14:43:05,805][102897] Updated weights for policy 0, policy_version 73850 (0.0008) +[2023-10-08 14:43:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151322624. Throughput: 0: 1799.7, 1: 1787.1. Samples: 37835662. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:06,875][101941] Avg episode reward: [(0, '9.760'), (1, '11.490')] +[2023-10-08 14:43:06,966][102898] Updated weights for policy 1, policy_version 73930 (0.0010) +[2023-10-08 14:43:07,334][102898] Updated weights for policy 1, policy_version 73940 (0.0010) +[2023-10-08 14:43:07,708][102898] Updated weights for policy 1, policy_version 73950 (0.0008) +[2023-10-08 14:43:07,774][102760] Saving new best policy, reward=11.490! +[2023-10-08 14:43:09,448][102897] Updated weights for policy 0, policy_version 73860 (0.0007) +[2023-10-08 14:43:09,807][102897] Updated weights for policy 0, policy_version 73870 (0.0007) +[2023-10-08 14:43:10,183][102897] Updated weights for policy 0, policy_version 73880 (0.0011) +[2023-10-08 14:43:11,463][102898] Updated weights for policy 1, policy_version 73960 (0.0007) +[2023-10-08 14:43:11,832][102898] Updated weights for policy 1, policy_version 73970 (0.0010) +[2023-10-08 14:43:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151388160. Throughput: 0: 1793.8, 1: 1790.3. Samples: 37856794. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:11,876][101941] Avg episode reward: [(0, '9.280'), (1, '11.580')] +[2023-10-08 14:43:12,202][102898] Updated weights for policy 1, policy_version 73980 (0.0009) +[2023-10-08 14:43:12,346][102760] Saving new best policy, reward=11.580! +[2023-10-08 14:43:13,893][102897] Updated weights for policy 0, policy_version 73890 (0.0008) +[2023-10-08 14:43:14,251][102897] Updated weights for policy 0, policy_version 73900 (0.0009) +[2023-10-08 14:43:14,621][102897] Updated weights for policy 0, policy_version 73910 (0.0007) +[2023-10-08 14:43:14,987][102897] Updated weights for policy 0, policy_version 73920 (0.0007) +[2023-10-08 14:43:16,034][102898] Updated weights for policy 1, policy_version 73990 (0.0008) +[2023-10-08 14:43:16,406][102898] Updated weights for policy 1, policy_version 74000 (0.0009) +[2023-10-08 14:43:16,772][102898] Updated weights for policy 1, policy_version 74010 (0.0009) +[2023-10-08 14:43:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151453696. Throughput: 0: 1788.5, 1: 1803.9. Samples: 37878336. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:16,875][101941] Avg episode reward: [(0, '8.650'), (1, '11.690')] +[2023-10-08 14:43:16,985][102760] Saving new best policy, reward=11.690! +[2023-10-08 14:43:18,882][102897] Updated weights for policy 0, policy_version 73930 (0.0008) +[2023-10-08 14:43:19,257][102897] Updated weights for policy 0, policy_version 73940 (0.0009) +[2023-10-08 14:43:19,619][102897] Updated weights for policy 0, policy_version 73950 (0.0007) +[2023-10-08 14:43:20,540][102898] Updated weights for policy 1, policy_version 74020 (0.0008) +[2023-10-08 14:43:20,903][102898] Updated weights for policy 1, policy_version 74030 (0.0008) +[2023-10-08 14:43:21,282][102898] Updated weights for policy 1, policy_version 74040 (0.0010) +[2023-10-08 14:43:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 151552000. Throughput: 0: 1797.9, 1: 1788.4. Samples: 37889138. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:21,876][101941] Avg episode reward: [(0, '8.040'), (1, '11.880')] +[2023-10-08 14:43:21,877][102760] Saving new best policy, reward=11.880! +[2023-10-08 14:43:23,250][102897] Updated weights for policy 0, policy_version 73960 (0.0007) +[2023-10-08 14:43:23,621][102897] Updated weights for policy 0, policy_version 73970 (0.0007) +[2023-10-08 14:43:23,997][102897] Updated weights for policy 0, policy_version 73980 (0.0009) +[2023-10-08 14:43:25,038][102898] Updated weights for policy 1, policy_version 74050 (0.0009) +[2023-10-08 14:43:25,411][102898] Updated weights for policy 1, policy_version 74060 (0.0007) +[2023-10-08 14:43:25,770][102898] Updated weights for policy 1, policy_version 74070 (0.0010) +[2023-10-08 14:43:26,132][102898] Updated weights for policy 1, policy_version 74080 (0.0009) +[2023-10-08 14:43:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151617536. Throughput: 0: 1781.8, 1: 1803.7. Samples: 37910412. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:26,875][101941] Avg episode reward: [(0, '8.050'), (1, '12.100')] +[2023-10-08 14:43:26,876][102760] Saving new best policy, reward=12.100! +[2023-10-08 14:43:27,721][102897] Updated weights for policy 0, policy_version 73990 (0.0007) +[2023-10-08 14:43:28,083][102897] Updated weights for policy 0, policy_version 74000 (0.0010) +[2023-10-08 14:43:28,457][102897] Updated weights for policy 0, policy_version 74010 (0.0011) +[2023-10-08 14:43:29,815][102898] Updated weights for policy 1, policy_version 74090 (0.0008) +[2023-10-08 14:43:30,184][102898] Updated weights for policy 1, policy_version 74100 (0.0008) +[2023-10-08 14:43:30,551][102898] Updated weights for policy 1, policy_version 74110 (0.0009) +[2023-10-08 14:43:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151683072. Throughput: 0: 1781.4, 1: 1786.1. Samples: 37931982. Policy #0 lag: (min: 3.0, avg: 3.2, max: 12.0) +[2023-10-08 14:43:31,876][101941] Avg episode reward: [(0, '8.580'), (1, '11.170')] +[2023-10-08 14:43:32,282][102897] Updated weights for policy 0, policy_version 74020 (0.0009) +[2023-10-08 14:43:32,652][102897] Updated weights for policy 0, policy_version 74030 (0.0008) +[2023-10-08 14:43:33,021][102897] Updated weights for policy 0, policy_version 74040 (0.0008) +[2023-10-08 14:43:34,297][102898] Updated weights for policy 1, policy_version 74120 (0.0008) +[2023-10-08 14:43:34,667][102898] Updated weights for policy 1, policy_version 74130 (0.0009) +[2023-10-08 14:43:35,037][102898] Updated weights for policy 1, policy_version 74140 (0.0008) +[2023-10-08 14:43:36,816][102897] Updated weights for policy 0, policy_version 74050 (0.0010) +[2023-10-08 14:43:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 151748608. Throughput: 0: 1775.5, 1: 1806.8. Samples: 37942896. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:43:36,875][101941] Avg episode reward: [(0, '8.480'), (1, '10.710')] +[2023-10-08 14:43:37,192][102897] Updated weights for policy 0, policy_version 74060 (0.0010) +[2023-10-08 14:43:37,560][102897] Updated weights for policy 0, policy_version 74070 (0.0010) +[2023-10-08 14:43:37,925][102897] Updated weights for policy 0, policy_version 74080 (0.0010) +[2023-10-08 14:43:38,801][102898] Updated weights for policy 1, policy_version 74150 (0.0010) +[2023-10-08 14:43:39,170][102898] Updated weights for policy 1, policy_version 74160 (0.0008) +[2023-10-08 14:43:39,530][102898] Updated weights for policy 1, policy_version 74170 (0.0007) +[2023-10-08 14:43:41,761][102897] Updated weights for policy 0, policy_version 74090 (0.0008) +[2023-10-08 14:43:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 151814144. Throughput: 0: 1775.6, 1: 1790.3. Samples: 37964402. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:43:41,876][101941] Avg episode reward: [(0, '8.710'), (1, '10.170')] +[2023-10-08 14:43:42,137][102897] Updated weights for policy 0, policy_version 74100 (0.0009) +[2023-10-08 14:43:42,500][102897] Updated weights for policy 0, policy_version 74110 (0.0007) +[2023-10-08 14:43:43,464][102898] Updated weights for policy 1, policy_version 74180 (0.0007) +[2023-10-08 14:43:43,852][102898] Updated weights for policy 1, policy_version 74190 (0.0008) +[2023-10-08 14:43:44,224][102898] Updated weights for policy 1, policy_version 74200 (0.0009) +[2023-10-08 14:43:45,985][102897] Updated weights for policy 0, policy_version 74120 (0.0008) +[2023-10-08 14:43:46,353][102897] Updated weights for policy 0, policy_version 74130 (0.0008) +[2023-10-08 14:43:46,730][102897] Updated weights for policy 0, policy_version 74140 (0.0009) +[2023-10-08 14:43:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 151912448. Throughput: 0: 1798.2, 1: 1788.2. Samples: 37985938. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:43:46,875][101941] Avg episode reward: [(0, '8.690'), (1, '10.200')] +[2023-10-08 14:43:47,918][102898] Updated weights for policy 1, policy_version 74210 (0.0010) +[2023-10-08 14:43:48,274][102898] Updated weights for policy 1, policy_version 74220 (0.0009) +[2023-10-08 14:43:48,644][102898] Updated weights for policy 1, policy_version 74230 (0.0008) +[2023-10-08 14:43:49,012][102898] Updated weights for policy 1, policy_version 74240 (0.0009) +[2023-10-08 14:43:50,605][102897] Updated weights for policy 0, policy_version 74150 (0.0009) +[2023-10-08 14:43:50,979][102897] Updated weights for policy 0, policy_version 74160 (0.0010) +[2023-10-08 14:43:51,352][102897] Updated weights for policy 0, policy_version 74170 (0.0008) +[2023-10-08 14:43:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 151977984. Throughput: 0: 1784.1, 1: 1787.3. Samples: 37996376. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:43:51,876][101941] Avg episode reward: [(0, '8.660'), (1, '10.870')] +[2023-10-08 14:43:52,598][102898] Updated weights for policy 1, policy_version 74250 (0.0007) +[2023-10-08 14:43:52,965][102898] Updated weights for policy 1, policy_version 74260 (0.0007) +[2023-10-08 14:43:53,326][102898] Updated weights for policy 1, policy_version 74270 (0.0007) +[2023-10-08 14:43:55,226][102897] Updated weights for policy 0, policy_version 74180 (0.0007) +[2023-10-08 14:43:55,601][102897] Updated weights for policy 0, policy_version 74190 (0.0008) +[2023-10-08 14:43:55,968][102897] Updated weights for policy 0, policy_version 74200 (0.0007) +[2023-10-08 14:43:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152043520. Throughput: 0: 1802.2, 1: 1789.3. Samples: 38018410. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:43:56,875][101941] Avg episode reward: [(0, '8.540'), (1, '10.740')] +[2023-10-08 14:43:56,986][102898] Updated weights for policy 1, policy_version 74280 (0.0007) +[2023-10-08 14:43:57,348][102898] Updated weights for policy 1, policy_version 74290 (0.0007) +[2023-10-08 14:43:57,720][102898] Updated weights for policy 1, policy_version 74300 (0.0009) +[2023-10-08 14:43:59,683][102897] Updated weights for policy 0, policy_version 74210 (0.0008) +[2023-10-08 14:44:00,055][102897] Updated weights for policy 0, policy_version 74220 (0.0010) +[2023-10-08 14:44:00,425][102897] Updated weights for policy 0, policy_version 74230 (0.0011) +[2023-10-08 14:44:00,799][102897] Updated weights for policy 0, policy_version 74240 (0.0010) +[2023-10-08 14:44:01,525][102898] Updated weights for policy 1, policy_version 74310 (0.0008) +[2023-10-08 14:44:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152109056. Throughput: 0: 1776.4, 1: 1799.2. Samples: 38039236. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:44:01,876][101941] Avg episode reward: [(0, '8.460'), (1, '11.060')] +[2023-10-08 14:44:01,887][102898] Updated weights for policy 1, policy_version 74320 (0.0009) +[2023-10-08 14:44:02,251][102898] Updated weights for policy 1, policy_version 74330 (0.0009) +[2023-10-08 14:44:04,572][102897] Updated weights for policy 0, policy_version 74250 (0.0007) +[2023-10-08 14:44:04,952][102897] Updated weights for policy 0, policy_version 74260 (0.0009) +[2023-10-08 14:44:05,320][102897] Updated weights for policy 0, policy_version 74270 (0.0010) +[2023-10-08 14:44:06,115][102898] Updated weights for policy 1, policy_version 74340 (0.0008) +[2023-10-08 14:44:06,486][102898] Updated weights for policy 1, policy_version 74350 (0.0007) +[2023-10-08 14:44:06,848][102898] Updated weights for policy 1, policy_version 74360 (0.0011) +[2023-10-08 14:44:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 152174592. Throughput: 0: 1797.5, 1: 1788.1. Samples: 38050488. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:44:06,876][101941] Avg episode reward: [(0, '8.580'), (1, '10.160')] +[2023-10-08 14:44:08,999][102897] Updated weights for policy 0, policy_version 74280 (0.0010) +[2023-10-08 14:44:09,367][102897] Updated weights for policy 0, policy_version 74290 (0.0008) +[2023-10-08 14:44:09,730][102897] Updated weights for policy 0, policy_version 74300 (0.0008) +[2023-10-08 14:44:10,754][102898] Updated weights for policy 1, policy_version 74370 (0.0007) +[2023-10-08 14:44:11,114][102898] Updated weights for policy 1, policy_version 74380 (0.0008) +[2023-10-08 14:44:11,475][102898] Updated weights for policy 1, policy_version 74390 (0.0008) +[2023-10-08 14:44:11,843][102898] Updated weights for policy 1, policy_version 74400 (0.0010) +[2023-10-08 14:44:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 152272896. Throughput: 0: 1779.4, 1: 1806.1. Samples: 38071760. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:44:11,875][101941] Avg episode reward: [(0, '9.040'), (1, '11.380')] +[2023-10-08 14:44:13,424][102897] Updated weights for policy 0, policy_version 74310 (0.0009) +[2023-10-08 14:44:13,803][102897] Updated weights for policy 0, policy_version 74320 (0.0009) +[2023-10-08 14:44:14,169][102897] Updated weights for policy 0, policy_version 74330 (0.0007) +[2023-10-08 14:44:15,534][102898] Updated weights for policy 1, policy_version 74410 (0.0010) +[2023-10-08 14:44:15,896][102898] Updated weights for policy 1, policy_version 74420 (0.0009) +[2023-10-08 14:44:16,261][102898] Updated weights for policy 1, policy_version 74430 (0.0007) +[2023-10-08 14:44:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 152338432. Throughput: 0: 1788.8, 1: 1793.5. Samples: 38093184. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:44:16,876][101941] Avg episode reward: [(0, '8.610'), (1, '10.870')] +[2023-10-08 14:44:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000074336_76120064.pth... +[2023-10-08 14:44:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000074432_76218368.pth... +[2023-10-08 14:44:16,918][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000072736_74481664.pth +[2023-10-08 14:44:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000072672_74416128.pth +[2023-10-08 14:44:17,933][102897] Updated weights for policy 0, policy_version 74340 (0.0007) +[2023-10-08 14:44:18,303][102897] Updated weights for policy 0, policy_version 74350 (0.0008) +[2023-10-08 14:44:18,672][102897] Updated weights for policy 0, policy_version 74360 (0.0008) +[2023-10-08 14:44:19,966][102898] Updated weights for policy 1, policy_version 74440 (0.0009) +[2023-10-08 14:44:20,326][102898] Updated weights for policy 1, policy_version 74450 (0.0008) +[2023-10-08 14:44:20,685][102898] Updated weights for policy 1, policy_version 74460 (0.0010) +[2023-10-08 14:44:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152403968. Throughput: 0: 1786.6, 1: 1801.5. Samples: 38104360. Policy #0 lag: (min: 31.0, avg: 33.4, max: 63.0) +[2023-10-08 14:44:21,876][101941] Avg episode reward: [(0, '8.260'), (1, '10.870')] +[2023-10-08 14:44:22,385][102897] Updated weights for policy 0, policy_version 74370 (0.0010) +[2023-10-08 14:44:22,754][102897] Updated weights for policy 0, policy_version 74380 (0.0009) +[2023-10-08 14:44:23,126][102897] Updated weights for policy 0, policy_version 74390 (0.0009) +[2023-10-08 14:44:23,496][102897] Updated weights for policy 0, policy_version 74400 (0.0008) +[2023-10-08 14:44:24,522][102898] Updated weights for policy 1, policy_version 74470 (0.0009) +[2023-10-08 14:44:24,887][102898] Updated weights for policy 1, policy_version 74480 (0.0009) +[2023-10-08 14:44:25,252][102898] Updated weights for policy 1, policy_version 74490 (0.0009) +[2023-10-08 14:44:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 152469504. Throughput: 0: 1792.6, 1: 1786.9. Samples: 38125482. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:26,876][101941] Avg episode reward: [(0, '8.990'), (1, '10.760')] +[2023-10-08 14:44:27,189][102897] Updated weights for policy 0, policy_version 74410 (0.0008) +[2023-10-08 14:44:27,556][102897] Updated weights for policy 0, policy_version 74420 (0.0008) +[2023-10-08 14:44:27,933][102897] Updated weights for policy 0, policy_version 74430 (0.0008) +[2023-10-08 14:44:28,917][102898] Updated weights for policy 1, policy_version 74500 (0.0008) +[2023-10-08 14:44:29,318][102898] Updated weights for policy 1, policy_version 74510 (0.0009) +[2023-10-08 14:44:29,676][102898] Updated weights for policy 1, policy_version 74520 (0.0008) +[2023-10-08 14:44:31,785][102897] Updated weights for policy 0, policy_version 74440 (0.0008) +[2023-10-08 14:44:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152535040. Throughput: 0: 1804.5, 1: 1785.1. Samples: 38147470. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:31,876][101941] Avg episode reward: [(0, '7.980'), (1, '11.260')] +[2023-10-08 14:44:32,163][102897] Updated weights for policy 0, policy_version 74450 (0.0008) +[2023-10-08 14:44:32,545][102897] Updated weights for policy 0, policy_version 74460 (0.0008) +[2023-10-08 14:44:33,446][102898] Updated weights for policy 1, policy_version 74530 (0.0008) +[2023-10-08 14:44:33,812][102898] Updated weights for policy 1, policy_version 74540 (0.0008) +[2023-10-08 14:44:34,185][102898] Updated weights for policy 1, policy_version 74550 (0.0007) +[2023-10-08 14:44:34,552][102898] Updated weights for policy 1, policy_version 74560 (0.0008) +[2023-10-08 14:44:36,504][102897] Updated weights for policy 0, policy_version 74470 (0.0008) +[2023-10-08 14:44:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 152600576. Throughput: 0: 1786.3, 1: 1791.1. Samples: 38157360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:36,876][101941] Avg episode reward: [(0, '8.360'), (1, '10.270')] +[2023-10-08 14:44:36,879][102897] Updated weights for policy 0, policy_version 74480 (0.0009) +[2023-10-08 14:44:37,248][102897] Updated weights for policy 0, policy_version 74490 (0.0010) +[2023-10-08 14:44:38,260][102898] Updated weights for policy 1, policy_version 74570 (0.0008) +[2023-10-08 14:44:38,621][102898] Updated weights for policy 1, policy_version 74580 (0.0008) +[2023-10-08 14:44:38,994][102898] Updated weights for policy 1, policy_version 74590 (0.0010) +[2023-10-08 14:44:41,097][102897] Updated weights for policy 0, policy_version 74500 (0.0010) +[2023-10-08 14:44:41,471][102897] Updated weights for policy 0, policy_version 74510 (0.0007) +[2023-10-08 14:44:41,837][102897] Updated weights for policy 0, policy_version 74520 (0.0007) +[2023-10-08 14:44:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 152666112. Throughput: 0: 1792.5, 1: 1779.0. Samples: 38179128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:41,876][101941] Avg episode reward: [(0, '8.630'), (1, '9.880')] +[2023-10-08 14:44:42,768][102898] Updated weights for policy 1, policy_version 74600 (0.0009) +[2023-10-08 14:44:43,137][102898] Updated weights for policy 1, policy_version 74610 (0.0007) +[2023-10-08 14:44:43,498][102898] Updated weights for policy 1, policy_version 74620 (0.0008) +[2023-10-08 14:44:45,633][102897] Updated weights for policy 0, policy_version 74530 (0.0008) +[2023-10-08 14:44:45,998][102897] Updated weights for policy 0, policy_version 74540 (0.0008) +[2023-10-08 14:44:46,369][102897] Updated weights for policy 0, policy_version 74550 (0.0008) +[2023-10-08 14:44:46,735][102897] Updated weights for policy 0, policy_version 74560 (0.0008) +[2023-10-08 14:44:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 152764416. Throughput: 0: 1798.3, 1: 1789.1. Samples: 38200666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:46,876][101941] Avg episode reward: [(0, '8.260'), (1, '10.290')] +[2023-10-08 14:44:47,229][102898] Updated weights for policy 1, policy_version 74630 (0.0009) +[2023-10-08 14:44:47,606][102898] Updated weights for policy 1, policy_version 74640 (0.0008) +[2023-10-08 14:44:47,974][102898] Updated weights for policy 1, policy_version 74650 (0.0008) +[2023-10-08 14:44:50,502][102897] Updated weights for policy 0, policy_version 74570 (0.0010) +[2023-10-08 14:44:50,866][102897] Updated weights for policy 0, policy_version 74580 (0.0007) +[2023-10-08 14:44:51,242][102897] Updated weights for policy 0, policy_version 74590 (0.0008) +[2023-10-08 14:44:51,858][102898] Updated weights for policy 1, policy_version 74660 (0.0010) +[2023-10-08 14:44:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152829952. Throughput: 0: 1787.5, 1: 1784.4. Samples: 38211222. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:51,875][101941] Avg episode reward: [(0, '8.440'), (1, '10.000')] +[2023-10-08 14:44:52,231][102898] Updated weights for policy 1, policy_version 74670 (0.0008) +[2023-10-08 14:44:52,593][102898] Updated weights for policy 1, policy_version 74680 (0.0009) +[2023-10-08 14:44:54,908][102897] Updated weights for policy 0, policy_version 74600 (0.0010) +[2023-10-08 14:44:55,281][102897] Updated weights for policy 0, policy_version 74610 (0.0011) +[2023-10-08 14:44:55,658][102897] Updated weights for policy 0, policy_version 74620 (0.0007) +[2023-10-08 14:44:56,321][102898] Updated weights for policy 1, policy_version 74690 (0.0007) +[2023-10-08 14:44:56,688][102898] Updated weights for policy 1, policy_version 74700 (0.0007) +[2023-10-08 14:44:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152895488. Throughput: 0: 1791.9, 1: 1784.3. Samples: 38232686. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:44:56,875][101941] Avg episode reward: [(0, '8.780'), (1, '10.800')] +[2023-10-08 14:44:57,052][102898] Updated weights for policy 1, policy_version 74710 (0.0007) +[2023-10-08 14:44:57,429][102898] Updated weights for policy 1, policy_version 74720 (0.0008) +[2023-10-08 14:44:59,478][102897] Updated weights for policy 0, policy_version 74630 (0.0007) +[2023-10-08 14:44:59,853][102897] Updated weights for policy 0, policy_version 74640 (0.0007) +[2023-10-08 14:45:00,235][102897] Updated weights for policy 0, policy_version 74650 (0.0009) +[2023-10-08 14:45:01,252][102898] Updated weights for policy 1, policy_version 74730 (0.0009) +[2023-10-08 14:45:01,613][102898] Updated weights for policy 1, policy_version 74740 (0.0011) +[2023-10-08 14:45:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 152961024. Throughput: 0: 1773.1, 1: 1796.6. Samples: 38253820. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:45:01,876][101941] Avg episode reward: [(0, '8.200'), (1, '10.450')] +[2023-10-08 14:45:01,979][102898] Updated weights for policy 1, policy_version 74750 (0.0007) +[2023-10-08 14:45:04,012][102897] Updated weights for policy 0, policy_version 74660 (0.0009) +[2023-10-08 14:45:04,379][102897] Updated weights for policy 0, policy_version 74670 (0.0009) +[2023-10-08 14:45:04,746][102897] Updated weights for policy 0, policy_version 74680 (0.0007) +[2023-10-08 14:45:05,811][102898] Updated weights for policy 1, policy_version 74760 (0.0008) +[2023-10-08 14:45:06,170][102898] Updated weights for policy 1, policy_version 74770 (0.0008) +[2023-10-08 14:45:06,542][102898] Updated weights for policy 1, policy_version 74780 (0.0007) +[2023-10-08 14:45:06,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 153059328. Throughput: 0: 1789.8, 1: 1778.6. Samples: 38264938. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:45:06,876][101941] Avg episode reward: [(0, '8.000'), (1, '10.310')] +[2023-10-08 14:45:08,594][102897] Updated weights for policy 0, policy_version 74690 (0.0009) +[2023-10-08 14:45:08,968][102897] Updated weights for policy 0, policy_version 74700 (0.0007) +[2023-10-08 14:45:09,331][102897] Updated weights for policy 0, policy_version 74710 (0.0008) +[2023-10-08 14:45:09,697][102897] Updated weights for policy 0, policy_version 74720 (0.0008) +[2023-10-08 14:45:10,248][102898] Updated weights for policy 1, policy_version 74790 (0.0009) +[2023-10-08 14:45:10,610][102898] Updated weights for policy 1, policy_version 74800 (0.0009) +[2023-10-08 14:45:10,974][102898] Updated weights for policy 1, policy_version 74810 (0.0009) +[2023-10-08 14:45:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153124864. Throughput: 0: 1762.8, 1: 1803.9. Samples: 38285980. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:45:11,876][101941] Avg episode reward: [(0, '8.550'), (1, '10.270')] +[2023-10-08 14:45:13,478][102897] Updated weights for policy 0, policy_version 74730 (0.0007) +[2023-10-08 14:45:13,852][102897] Updated weights for policy 0, policy_version 74740 (0.0008) +[2023-10-08 14:45:14,220][102897] Updated weights for policy 0, policy_version 74750 (0.0009) +[2023-10-08 14:45:14,892][102898] Updated weights for policy 1, policy_version 74820 (0.0008) +[2023-10-08 14:45:15,266][102898] Updated weights for policy 1, policy_version 74830 (0.0009) +[2023-10-08 14:45:15,627][102898] Updated weights for policy 1, policy_version 74840 (0.0009) +[2023-10-08 14:45:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153190400. Throughput: 0: 1767.0, 1: 1782.5. Samples: 38307200. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:16,876][101941] Avg episode reward: [(0, '8.730'), (1, '11.160')] +[2023-10-08 14:45:18,046][102897] Updated weights for policy 0, policy_version 74760 (0.0009) +[2023-10-08 14:45:18,409][102897] Updated weights for policy 0, policy_version 74770 (0.0008) +[2023-10-08 14:45:18,780][102897] Updated weights for policy 0, policy_version 74780 (0.0007) +[2023-10-08 14:45:19,384][102898] Updated weights for policy 1, policy_version 74850 (0.0010) +[2023-10-08 14:45:19,757][102898] Updated weights for policy 1, policy_version 74860 (0.0008) +[2023-10-08 14:45:20,120][102898] Updated weights for policy 1, policy_version 74870 (0.0009) +[2023-10-08 14:45:20,490][102898] Updated weights for policy 1, policy_version 74880 (0.0010) +[2023-10-08 14:45:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153255936. Throughput: 0: 1766.7, 1: 1810.5. Samples: 38318334. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:21,876][101941] Avg episode reward: [(0, '8.560'), (1, '12.140')] +[2023-10-08 14:45:21,877][102760] Saving new best policy, reward=12.140! +[2023-10-08 14:45:22,603][102897] Updated weights for policy 0, policy_version 74790 (0.0007) +[2023-10-08 14:45:22,972][102897] Updated weights for policy 0, policy_version 74800 (0.0008) +[2023-10-08 14:45:23,349][102897] Updated weights for policy 0, policy_version 74810 (0.0010) +[2023-10-08 14:45:24,234][102898] Updated weights for policy 1, policy_version 74890 (0.0007) +[2023-10-08 14:45:24,600][102898] Updated weights for policy 1, policy_version 74900 (0.0008) +[2023-10-08 14:45:24,981][102898] Updated weights for policy 1, policy_version 74910 (0.0007) +[2023-10-08 14:45:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153321472. Throughput: 0: 1770.3, 1: 1785.5. Samples: 38339138. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:26,876][101941] Avg episode reward: [(0, '8.860'), (1, '11.380')] +[2023-10-08 14:45:27,090][102897] Updated weights for policy 0, policy_version 74820 (0.0011) +[2023-10-08 14:45:27,479][102897] Updated weights for policy 0, policy_version 74830 (0.0008) +[2023-10-08 14:45:27,845][102897] Updated weights for policy 0, policy_version 74840 (0.0007) +[2023-10-08 14:45:28,731][102898] Updated weights for policy 1, policy_version 74920 (0.0007) +[2023-10-08 14:45:29,088][102898] Updated weights for policy 1, policy_version 74930 (0.0008) +[2023-10-08 14:45:29,468][102898] Updated weights for policy 1, policy_version 74940 (0.0009) +[2023-10-08 14:45:31,647][102897] Updated weights for policy 0, policy_version 74850 (0.0007) +[2023-10-08 14:45:31,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 153387008. Throughput: 0: 1788.8, 1: 1779.5. Samples: 38361238. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:31,876][101941] Avg episode reward: [(0, '9.160'), (1, '10.980')] +[2023-10-08 14:45:32,013][102897] Updated weights for policy 0, policy_version 74860 (0.0007) +[2023-10-08 14:45:32,377][102897] Updated weights for policy 0, policy_version 74870 (0.0007) +[2023-10-08 14:45:32,748][102897] Updated weights for policy 0, policy_version 74880 (0.0010) +[2023-10-08 14:45:33,316][102898] Updated weights for policy 1, policy_version 74950 (0.0009) +[2023-10-08 14:45:33,690][102898] Updated weights for policy 1, policy_version 74960 (0.0009) +[2023-10-08 14:45:34,047][102898] Updated weights for policy 1, policy_version 74970 (0.0007) +[2023-10-08 14:45:36,514][102897] Updated weights for policy 0, policy_version 74890 (0.0007) +[2023-10-08 14:45:36,873][102897] Updated weights for policy 0, policy_version 74900 (0.0009) +[2023-10-08 14:45:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153452544. Throughput: 0: 1771.7, 1: 1780.3. Samples: 38371060. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:36,876][101941] Avg episode reward: [(0, '8.990'), (1, '10.440')] +[2023-10-08 14:45:37,254][102897] Updated weights for policy 0, policy_version 74910 (0.0009) +[2023-10-08 14:45:37,956][102898] Updated weights for policy 1, policy_version 74980 (0.0009) +[2023-10-08 14:45:38,323][102898] Updated weights for policy 1, policy_version 74990 (0.0008) +[2023-10-08 14:45:38,694][102898] Updated weights for policy 1, policy_version 75000 (0.0007) +[2023-10-08 14:45:41,066][102897] Updated weights for policy 0, policy_version 74920 (0.0011) +[2023-10-08 14:45:41,443][102897] Updated weights for policy 0, policy_version 74930 (0.0007) +[2023-10-08 14:45:41,814][102897] Updated weights for policy 0, policy_version 74940 (0.0007) +[2023-10-08 14:45:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 153518080. Throughput: 0: 1791.9, 1: 1780.5. Samples: 38393442. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:41,876][101941] Avg episode reward: [(0, '8.100'), (1, '11.670')] +[2023-10-08 14:45:42,250][102898] Updated weights for policy 1, policy_version 75010 (0.0010) +[2023-10-08 14:45:42,617][102898] Updated weights for policy 1, policy_version 75020 (0.0008) +[2023-10-08 14:45:42,989][102898] Updated weights for policy 1, policy_version 75030 (0.0008) +[2023-10-08 14:45:43,357][102898] Updated weights for policy 1, policy_version 75040 (0.0007) +[2023-10-08 14:45:45,487][102897] Updated weights for policy 0, policy_version 74950 (0.0009) +[2023-10-08 14:45:45,859][102897] Updated weights for policy 0, policy_version 74960 (0.0008) +[2023-10-08 14:45:46,227][102897] Updated weights for policy 0, policy_version 74970 (0.0008) +[2023-10-08 14:45:46,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153616384. Throughput: 0: 1769.7, 1: 1801.4. Samples: 38414522. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:46,876][101941] Avg episode reward: [(0, '7.340'), (1, '10.770')] +[2023-10-08 14:45:47,043][102898] Updated weights for policy 1, policy_version 75050 (0.0007) +[2023-10-08 14:45:47,418][102898] Updated weights for policy 1, policy_version 75060 (0.0008) +[2023-10-08 14:45:47,785][102898] Updated weights for policy 1, policy_version 75070 (0.0010) +[2023-10-08 14:45:50,048][102897] Updated weights for policy 0, policy_version 74980 (0.0008) +[2023-10-08 14:45:50,425][102897] Updated weights for policy 0, policy_version 74990 (0.0008) +[2023-10-08 14:45:50,792][102897] Updated weights for policy 0, policy_version 75000 (0.0008) +[2023-10-08 14:45:51,614][102898] Updated weights for policy 1, policy_version 75080 (0.0008) +[2023-10-08 14:45:51,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153681920. Throughput: 0: 1785.1, 1: 1783.6. Samples: 38425530. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:51,875][101941] Avg episode reward: [(0, '7.980'), (1, '10.600')] +[2023-10-08 14:45:51,989][102898] Updated weights for policy 1, policy_version 75090 (0.0008) +[2023-10-08 14:45:52,356][102898] Updated weights for policy 1, policy_version 75100 (0.0008) +[2023-10-08 14:45:54,635][102897] Updated weights for policy 0, policy_version 75010 (0.0008) +[2023-10-08 14:45:55,012][102897] Updated weights for policy 0, policy_version 75020 (0.0009) +[2023-10-08 14:45:55,375][102897] Updated weights for policy 0, policy_version 75030 (0.0009) +[2023-10-08 14:45:55,747][102897] Updated weights for policy 0, policy_version 75040 (0.0010) +[2023-10-08 14:45:56,024][102898] Updated weights for policy 1, policy_version 75110 (0.0008) +[2023-10-08 14:45:56,401][102898] Updated weights for policy 1, policy_version 75120 (0.0007) +[2023-10-08 14:45:56,766][102898] Updated weights for policy 1, policy_version 75130 (0.0008) +[2023-10-08 14:45:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 153747456. Throughput: 0: 1782.7, 1: 1794.7. Samples: 38446964. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:45:56,876][101941] Avg episode reward: [(0, '8.010'), (1, '10.720')] +[2023-10-08 14:45:59,600][102897] Updated weights for policy 0, policy_version 75050 (0.0009) +[2023-10-08 14:45:59,959][102897] Updated weights for policy 0, policy_version 75060 (0.0011) +[2023-10-08 14:46:00,330][102897] Updated weights for policy 0, policy_version 75070 (0.0010) +[2023-10-08 14:46:00,734][102898] Updated weights for policy 1, policy_version 75140 (0.0010) +[2023-10-08 14:46:01,122][102898] Updated weights for policy 1, policy_version 75150 (0.0007) +[2023-10-08 14:46:01,484][102898] Updated weights for policy 1, policy_version 75160 (0.0009) +[2023-10-08 14:46:01,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 153845760. Throughput: 0: 1768.3, 1: 1794.6. Samples: 38467528. Policy #0 lag: (min: 24.0, avg: 53.3, max: 56.0) +[2023-10-08 14:46:01,876][101941] Avg episode reward: [(0, '8.700'), (1, '10.580')] +[2023-10-08 14:46:04,166][102897] Updated weights for policy 0, policy_version 75080 (0.0007) +[2023-10-08 14:46:04,537][102897] Updated weights for policy 0, policy_version 75090 (0.0007) +[2023-10-08 14:46:04,913][102897] Updated weights for policy 0, policy_version 75100 (0.0009) +[2023-10-08 14:46:05,238][102898] Updated weights for policy 1, policy_version 75170 (0.0011) +[2023-10-08 14:46:05,607][102898] Updated weights for policy 1, policy_version 75180 (0.0009) +[2023-10-08 14:46:05,972][102898] Updated weights for policy 1, policy_version 75190 (0.0007) +[2023-10-08 14:46:06,332][102898] Updated weights for policy 1, policy_version 75200 (0.0009) +[2023-10-08 14:46:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153911296. Throughput: 0: 1788.5, 1: 1779.8. Samples: 38478908. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:06,876][101941] Avg episode reward: [(0, '8.770'), (1, '10.020')] +[2023-10-08 14:46:08,601][102897] Updated weights for policy 0, policy_version 75110 (0.0008) +[2023-10-08 14:46:08,976][102897] Updated weights for policy 0, policy_version 75120 (0.0008) +[2023-10-08 14:46:09,341][102897] Updated weights for policy 0, policy_version 75130 (0.0009) +[2023-10-08 14:46:10,089][102898] Updated weights for policy 1, policy_version 75210 (0.0009) +[2023-10-08 14:46:10,444][102898] Updated weights for policy 1, policy_version 75220 (0.0007) +[2023-10-08 14:46:10,813][102898] Updated weights for policy 1, policy_version 75230 (0.0007) +[2023-10-08 14:46:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 153976832. Throughput: 0: 1773.6, 1: 1795.1. Samples: 38499726. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:11,875][101941] Avg episode reward: [(0, '9.070'), (1, '10.170')] +[2023-10-08 14:46:13,239][102897] Updated weights for policy 0, policy_version 75140 (0.0009) +[2023-10-08 14:46:13,623][102897] Updated weights for policy 0, policy_version 75150 (0.0009) +[2023-10-08 14:46:14,004][102897] Updated weights for policy 0, policy_version 75160 (0.0011) +[2023-10-08 14:46:14,669][102898] Updated weights for policy 1, policy_version 75240 (0.0009) +[2023-10-08 14:46:15,044][102898] Updated weights for policy 1, policy_version 75250 (0.0008) +[2023-10-08 14:46:15,415][102898] Updated weights for policy 1, policy_version 75260 (0.0010) +[2023-10-08 14:46:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 154042368. Throughput: 0: 1772.9, 1: 1782.5. Samples: 38521234. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:16,876][101941] Avg episode reward: [(0, '8.740'), (1, '9.880')] +[2023-10-08 14:46:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000075264_77070336.pth... +[2023-10-08 14:46:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000075168_76972032.pth... +[2023-10-08 14:46:16,939][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000073600_75366400.pth +[2023-10-08 14:46:16,939][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000073504_75268096.pth +[2023-10-08 14:46:16,945][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000075264_77070336.pth +[2023-10-08 14:46:16,945][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000075168_76972032.pth +[2023-10-08 14:46:17,602][102897] Updated weights for policy 0, policy_version 75170 (0.0010) +[2023-10-08 14:46:17,976][102897] Updated weights for policy 0, policy_version 75180 (0.0008) +[2023-10-08 14:46:18,346][102897] Updated weights for policy 0, policy_version 75190 (0.0010) +[2023-10-08 14:46:18,715][102897] Updated weights for policy 0, policy_version 75200 (0.0010) +[2023-10-08 14:46:19,246][102898] Updated weights for policy 1, policy_version 75270 (0.0009) +[2023-10-08 14:46:19,609][102898] Updated weights for policy 1, policy_version 75280 (0.0009) +[2023-10-08 14:46:19,978][102898] Updated weights for policy 1, policy_version 75290 (0.0008) +[2023-10-08 14:46:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 154107904. Throughput: 0: 1772.8, 1: 1803.1. Samples: 38531974. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:21,876][101941] Avg episode reward: [(0, '8.650'), (1, '10.830')] +[2023-10-08 14:46:22,540][102897] Updated weights for policy 0, policy_version 75210 (0.0008) +[2023-10-08 14:46:22,912][102897] Updated weights for policy 0, policy_version 75220 (0.0008) +[2023-10-08 14:46:23,280][102897] Updated weights for policy 0, policy_version 75230 (0.0008) +[2023-10-08 14:46:23,666][102898] Updated weights for policy 1, policy_version 75300 (0.0008) +[2023-10-08 14:46:24,041][102898] Updated weights for policy 1, policy_version 75310 (0.0010) +[2023-10-08 14:46:24,402][102898] Updated weights for policy 1, policy_version 75320 (0.0007) +[2023-10-08 14:46:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 154173440. Throughput: 0: 1774.2, 1: 1782.8. Samples: 38553510. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:26,875][101941] Avg episode reward: [(0, '8.350'), (1, '11.390')] +[2023-10-08 14:46:26,972][102897] Updated weights for policy 0, policy_version 75240 (0.0007) +[2023-10-08 14:46:27,355][102897] Updated weights for policy 0, policy_version 75250 (0.0008) +[2023-10-08 14:46:27,724][102897] Updated weights for policy 0, policy_version 75260 (0.0007) +[2023-10-08 14:46:28,141][102898] Updated weights for policy 1, policy_version 75330 (0.0009) +[2023-10-08 14:46:28,504][102898] Updated weights for policy 1, policy_version 75340 (0.0008) +[2023-10-08 14:46:28,859][102898] Updated weights for policy 1, policy_version 75350 (0.0008) +[2023-10-08 14:46:29,229][102898] Updated weights for policy 1, policy_version 75360 (0.0008) +[2023-10-08 14:46:31,533][102897] Updated weights for policy 0, policy_version 75270 (0.0009) +[2023-10-08 14:46:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 154238976. Throughput: 0: 1804.9, 1: 1780.0. Samples: 38575844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:31,876][101941] Avg episode reward: [(0, '8.090'), (1, '10.820')] +[2023-10-08 14:46:31,908][102897] Updated weights for policy 0, policy_version 75280 (0.0010) +[2023-10-08 14:46:32,265][102897] Updated weights for policy 0, policy_version 75290 (0.0011) +[2023-10-08 14:46:32,956][102898] Updated weights for policy 1, policy_version 75370 (0.0008) +[2023-10-08 14:46:33,321][102898] Updated weights for policy 1, policy_version 75380 (0.0007) +[2023-10-08 14:46:33,692][102898] Updated weights for policy 1, policy_version 75390 (0.0008) +[2023-10-08 14:46:35,992][102897] Updated weights for policy 0, policy_version 75300 (0.0009) +[2023-10-08 14:46:36,360][102897] Updated weights for policy 0, policy_version 75310 (0.0008) +[2023-10-08 14:46:36,725][102897] Updated weights for policy 0, policy_version 75320 (0.0008) +[2023-10-08 14:46:36,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 154304512. Throughput: 0: 1780.0, 1: 1786.3. Samples: 38586012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:36,876][101941] Avg episode reward: [(0, '8.510'), (1, '10.460')] +[2023-10-08 14:46:37,517][102898] Updated weights for policy 1, policy_version 75400 (0.0008) +[2023-10-08 14:46:37,885][102898] Updated weights for policy 1, policy_version 75410 (0.0008) +[2023-10-08 14:46:38,245][102898] Updated weights for policy 1, policy_version 75420 (0.0009) +[2023-10-08 14:46:40,520][102897] Updated weights for policy 0, policy_version 75330 (0.0008) +[2023-10-08 14:46:40,896][102897] Updated weights for policy 0, policy_version 75340 (0.0009) +[2023-10-08 14:46:41,272][102897] Updated weights for policy 0, policy_version 75350 (0.0008) +[2023-10-08 14:46:41,632][102897] Updated weights for policy 0, policy_version 75360 (0.0010) +[2023-10-08 14:46:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 154402816. Throughput: 0: 1801.5, 1: 1781.9. Samples: 38608216. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:41,875][101941] Avg episode reward: [(0, '9.600'), (1, '10.370')] +[2023-10-08 14:46:41,888][102898] Updated weights for policy 1, policy_version 75430 (0.0007) +[2023-10-08 14:46:42,257][102898] Updated weights for policy 1, policy_version 75440 (0.0008) +[2023-10-08 14:46:42,619][102898] Updated weights for policy 1, policy_version 75450 (0.0009) +[2023-10-08 14:46:45,368][102897] Updated weights for policy 0, policy_version 75370 (0.0007) +[2023-10-08 14:46:45,739][102897] Updated weights for policy 0, policy_version 75380 (0.0008) +[2023-10-08 14:46:46,103][102897] Updated weights for policy 0, policy_version 75390 (0.0010) +[2023-10-08 14:46:46,570][102898] Updated weights for policy 1, policy_version 75460 (0.0009) +[2023-10-08 14:46:46,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 154468352. Throughput: 0: 1784.6, 1: 1805.5. Samples: 38629084. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:46,875][101941] Avg episode reward: [(0, '9.150'), (1, '9.750')] +[2023-10-08 14:46:46,961][102898] Updated weights for policy 1, policy_version 75470 (0.0009) +[2023-10-08 14:46:47,329][102898] Updated weights for policy 1, policy_version 75480 (0.0011) +[2023-10-08 14:46:49,939][102897] Updated weights for policy 0, policy_version 75400 (0.0008) +[2023-10-08 14:46:50,301][102897] Updated weights for policy 0, policy_version 75410 (0.0010) +[2023-10-08 14:46:50,673][102897] Updated weights for policy 0, policy_version 75420 (0.0009) +[2023-10-08 14:46:50,990][102898] Updated weights for policy 1, policy_version 75490 (0.0009) +[2023-10-08 14:46:51,360][102898] Updated weights for policy 1, policy_version 75500 (0.0008) +[2023-10-08 14:46:51,720][102898] Updated weights for policy 1, policy_version 75510 (0.0007) +[2023-10-08 14:46:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 154533888. Throughput: 0: 1798.2, 1: 1786.0. Samples: 38640198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:46:51,876][101941] Avg episode reward: [(0, '8.710'), (1, '9.690')] +[2023-10-08 14:46:52,087][102898] Updated weights for policy 1, policy_version 75520 (0.0007) +[2023-10-08 14:46:54,521][102897] Updated weights for policy 0, policy_version 75430 (0.0009) +[2023-10-08 14:46:54,885][102897] Updated weights for policy 0, policy_version 75440 (0.0008) +[2023-10-08 14:46:55,256][102897] Updated weights for policy 0, policy_version 75450 (0.0007) +[2023-10-08 14:46:55,790][102898] Updated weights for policy 1, policy_version 75530 (0.0010) +[2023-10-08 14:46:56,163][102898] Updated weights for policy 1, policy_version 75540 (0.0008) +[2023-10-08 14:46:56,528][102898] Updated weights for policy 1, policy_version 75550 (0.0007) +[2023-10-08 14:46:56,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 154632192. Throughput: 0: 1786.6, 1: 1805.9. Samples: 38661388. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:46:56,876][101941] Avg episode reward: [(0, '8.840'), (1, '10.470')] +[2023-10-08 14:46:58,981][102897] Updated weights for policy 0, policy_version 75460 (0.0008) +[2023-10-08 14:46:59,386][102897] Updated weights for policy 0, policy_version 75470 (0.0008) +[2023-10-08 14:46:59,754][102897] Updated weights for policy 0, policy_version 75480 (0.0008) +[2023-10-08 14:47:00,619][102898] Updated weights for policy 1, policy_version 75560 (0.0008) +[2023-10-08 14:47:00,985][102898] Updated weights for policy 1, policy_version 75570 (0.0009) +[2023-10-08 14:47:01,356][102898] Updated weights for policy 1, policy_version 75580 (0.0009) +[2023-10-08 14:47:01,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 154697728. Throughput: 0: 1788.3, 1: 1790.0. Samples: 38682256. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:01,875][101941] Avg episode reward: [(0, '9.170'), (1, '10.990')] +[2023-10-08 14:47:03,404][102897] Updated weights for policy 0, policy_version 75490 (0.0009) +[2023-10-08 14:47:03,766][102897] Updated weights for policy 0, policy_version 75500 (0.0009) +[2023-10-08 14:47:04,145][102897] Updated weights for policy 0, policy_version 75510 (0.0009) +[2023-10-08 14:47:04,511][102897] Updated weights for policy 0, policy_version 75520 (0.0011) +[2023-10-08 14:47:04,984][102898] Updated weights for policy 1, policy_version 75590 (0.0008) +[2023-10-08 14:47:05,344][102898] Updated weights for policy 1, policy_version 75600 (0.0009) +[2023-10-08 14:47:05,704][102898] Updated weights for policy 1, policy_version 75610 (0.0009) +[2023-10-08 14:47:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 154763264. Throughput: 0: 1791.3, 1: 1799.2. Samples: 38693546. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:06,876][101941] Avg episode reward: [(0, '8.480'), (1, '11.290')] +[2023-10-08 14:47:08,194][102897] Updated weights for policy 0, policy_version 75530 (0.0008) +[2023-10-08 14:47:08,567][102897] Updated weights for policy 0, policy_version 75540 (0.0007) +[2023-10-08 14:47:08,935][102897] Updated weights for policy 0, policy_version 75550 (0.0008) +[2023-10-08 14:47:09,432][102898] Updated weights for policy 1, policy_version 75620 (0.0008) +[2023-10-08 14:47:09,803][102898] Updated weights for policy 1, policy_version 75630 (0.0007) +[2023-10-08 14:47:10,171][102898] Updated weights for policy 1, policy_version 75640 (0.0009) +[2023-10-08 14:47:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 154828800. Throughput: 0: 1791.1, 1: 1788.6. Samples: 38714600. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:11,876][101941] Avg episode reward: [(0, '7.380'), (1, '11.580')] +[2023-10-08 14:47:12,597][102897] Updated weights for policy 0, policy_version 75560 (0.0008) +[2023-10-08 14:47:12,965][102897] Updated weights for policy 0, policy_version 75570 (0.0007) +[2023-10-08 14:47:13,329][102897] Updated weights for policy 0, policy_version 75580 (0.0007) +[2023-10-08 14:47:13,949][102898] Updated weights for policy 1, policy_version 75650 (0.0009) +[2023-10-08 14:47:14,324][102898] Updated weights for policy 1, policy_version 75660 (0.0007) +[2023-10-08 14:47:14,694][102898] Updated weights for policy 1, policy_version 75670 (0.0007) +[2023-10-08 14:47:15,060][102898] Updated weights for policy 1, policy_version 75680 (0.0008) +[2023-10-08 14:47:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 154894336. Throughput: 0: 1794.3, 1: 1787.2. Samples: 38737012. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:16,876][101941] Avg episode reward: [(0, '7.430'), (1, '11.310')] +[2023-10-08 14:47:17,057][102897] Updated weights for policy 0, policy_version 75590 (0.0011) +[2023-10-08 14:47:17,426][102897] Updated weights for policy 0, policy_version 75600 (0.0008) +[2023-10-08 14:47:17,799][102897] Updated weights for policy 0, policy_version 75610 (0.0008) +[2023-10-08 14:47:18,736][102898] Updated weights for policy 1, policy_version 75690 (0.0009) +[2023-10-08 14:47:19,106][102898] Updated weights for policy 1, policy_version 75700 (0.0010) +[2023-10-08 14:47:19,477][102898] Updated weights for policy 1, policy_version 75710 (0.0007) +[2023-10-08 14:47:21,661][102897] Updated weights for policy 0, policy_version 75620 (0.0008) +[2023-10-08 14:47:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 154959872. Throughput: 0: 1792.4, 1: 1787.5. Samples: 38747106. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:21,876][101941] Avg episode reward: [(0, '8.070'), (1, '10.330')] +[2023-10-08 14:47:22,037][102897] Updated weights for policy 0, policy_version 75630 (0.0011) +[2023-10-08 14:47:22,407][102897] Updated weights for policy 0, policy_version 75640 (0.0012) +[2023-10-08 14:47:23,375][102898] Updated weights for policy 1, policy_version 75720 (0.0008) +[2023-10-08 14:47:23,746][102898] Updated weights for policy 1, policy_version 75730 (0.0008) +[2023-10-08 14:47:24,111][102898] Updated weights for policy 1, policy_version 75740 (0.0007) +[2023-10-08 14:47:26,215][102897] Updated weights for policy 0, policy_version 75650 (0.0011) +[2023-10-08 14:47:26,584][102897] Updated weights for policy 0, policy_version 75660 (0.0007) +[2023-10-08 14:47:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 155025408. Throughput: 0: 1790.0, 1: 1780.3. Samples: 38768880. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:26,876][101941] Avg episode reward: [(0, '8.240'), (1, '11.150')] +[2023-10-08 14:47:26,956][102897] Updated weights for policy 0, policy_version 75670 (0.0008) +[2023-10-08 14:47:27,322][102897] Updated weights for policy 0, policy_version 75680 (0.0008) +[2023-10-08 14:47:27,723][102898] Updated weights for policy 1, policy_version 75750 (0.0007) +[2023-10-08 14:47:28,086][102898] Updated weights for policy 1, policy_version 75760 (0.0008) +[2023-10-08 14:47:28,449][102898] Updated weights for policy 1, policy_version 75770 (0.0010) +[2023-10-08 14:47:31,024][102897] Updated weights for policy 0, policy_version 75690 (0.0010) +[2023-10-08 14:47:31,395][102897] Updated weights for policy 0, policy_version 75700 (0.0010) +[2023-10-08 14:47:31,754][102897] Updated weights for policy 0, policy_version 75710 (0.0007) +[2023-10-08 14:47:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 155123712. Throughput: 0: 1798.7, 1: 1786.7. Samples: 38790424. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:31,876][101941] Avg episode reward: [(0, '8.370'), (1, '10.400')] +[2023-10-08 14:47:32,280][102898] Updated weights for policy 1, policy_version 75780 (0.0007) +[2023-10-08 14:47:32,680][102898] Updated weights for policy 1, policy_version 75790 (0.0010) +[2023-10-08 14:47:33,040][102898] Updated weights for policy 1, policy_version 75800 (0.0010) +[2023-10-08 14:47:35,498][102897] Updated weights for policy 0, policy_version 75720 (0.0009) +[2023-10-08 14:47:35,874][102897] Updated weights for policy 0, policy_version 75730 (0.0010) +[2023-10-08 14:47:36,241][102897] Updated weights for policy 0, policy_version 75740 (0.0008) +[2023-10-08 14:47:36,763][102898] Updated weights for policy 1, policy_version 75810 (0.0008) +[2023-10-08 14:47:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 155189248. Throughput: 0: 1786.4, 1: 1784.8. Samples: 38800902. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:36,876][101941] Avg episode reward: [(0, '8.330'), (1, '10.190')] +[2023-10-08 14:47:37,129][102898] Updated weights for policy 1, policy_version 75820 (0.0008) +[2023-10-08 14:47:37,494][102898] Updated weights for policy 1, policy_version 75830 (0.0007) +[2023-10-08 14:47:37,857][102898] Updated weights for policy 1, policy_version 75840 (0.0008) +[2023-10-08 14:47:40,047][102897] Updated weights for policy 0, policy_version 75750 (0.0007) +[2023-10-08 14:47:40,420][102897] Updated weights for policy 0, policy_version 75760 (0.0008) +[2023-10-08 14:47:40,803][102897] Updated weights for policy 0, policy_version 75770 (0.0007) +[2023-10-08 14:47:41,656][102898] Updated weights for policy 1, policy_version 75850 (0.0007) +[2023-10-08 14:47:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 155254784. Throughput: 0: 1803.5, 1: 1783.0. Samples: 38822778. Policy #0 lag: (min: 6.0, avg: 13.6, max: 38.0) +[2023-10-08 14:47:41,876][101941] Avg episode reward: [(0, '8.620'), (1, '10.000')] +[2023-10-08 14:47:42,030][102898] Updated weights for policy 1, policy_version 75860 (0.0007) +[2023-10-08 14:47:42,394][102898] Updated weights for policy 1, policy_version 75870 (0.0007) +[2023-10-08 14:47:44,725][102897] Updated weights for policy 0, policy_version 75780 (0.0010) +[2023-10-08 14:47:45,110][102897] Updated weights for policy 0, policy_version 75790 (0.0009) +[2023-10-08 14:47:45,477][102897] Updated weights for policy 0, policy_version 75800 (0.0009) +[2023-10-08 14:47:46,030][102898] Updated weights for policy 1, policy_version 75880 (0.0008) +[2023-10-08 14:47:46,397][102898] Updated weights for policy 1, policy_version 75890 (0.0008) +[2023-10-08 14:47:46,767][102898] Updated weights for policy 1, policy_version 75900 (0.0009) +[2023-10-08 14:47:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 155320320. Throughput: 0: 1781.9, 1: 1800.9. Samples: 38843484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:47:46,875][101941] Avg episode reward: [(0, '8.530'), (1, '10.570')] +[2023-10-08 14:47:49,244][102897] Updated weights for policy 0, policy_version 75810 (0.0008) +[2023-10-08 14:47:49,614][102897] Updated weights for policy 0, policy_version 75820 (0.0007) +[2023-10-08 14:47:49,981][102897] Updated weights for policy 0, policy_version 75830 (0.0007) +[2023-10-08 14:47:50,354][102897] Updated weights for policy 0, policy_version 75840 (0.0013) +[2023-10-08 14:47:50,555][102898] Updated weights for policy 1, policy_version 75910 (0.0008) +[2023-10-08 14:47:50,919][102898] Updated weights for policy 1, policy_version 75920 (0.0010) +[2023-10-08 14:47:51,297][102898] Updated weights for policy 1, policy_version 75930 (0.0010) +[2023-10-08 14:47:51,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 155418624. Throughput: 0: 1800.8, 1: 1790.2. Samples: 38855140. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:47:51,876][101941] Avg episode reward: [(0, '8.760'), (1, '10.520')] +[2023-10-08 14:47:54,147][102897] Updated weights for policy 0, policy_version 75850 (0.0008) +[2023-10-08 14:47:54,510][102897] Updated weights for policy 0, policy_version 75860 (0.0007) +[2023-10-08 14:47:54,878][102897] Updated weights for policy 0, policy_version 75870 (0.0011) +[2023-10-08 14:47:55,068][102898] Updated weights for policy 1, policy_version 75940 (0.0009) +[2023-10-08 14:47:55,428][102898] Updated weights for policy 1, policy_version 75950 (0.0008) +[2023-10-08 14:47:55,794][102898] Updated weights for policy 1, policy_version 75960 (0.0010) +[2023-10-08 14:47:56,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 155484160. Throughput: 0: 1774.2, 1: 1802.5. Samples: 38875552. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:47:56,876][101941] Avg episode reward: [(0, '8.790'), (1, '10.380')] +[2023-10-08 14:47:58,594][102897] Updated weights for policy 0, policy_version 75880 (0.0009) +[2023-10-08 14:47:58,966][102897] Updated weights for policy 0, policy_version 75890 (0.0010) +[2023-10-08 14:47:59,324][102897] Updated weights for policy 0, policy_version 75900 (0.0010) +[2023-10-08 14:47:59,447][102898] Updated weights for policy 1, policy_version 75970 (0.0009) +[2023-10-08 14:47:59,820][102898] Updated weights for policy 1, policy_version 75980 (0.0009) +[2023-10-08 14:48:00,192][102898] Updated weights for policy 1, policy_version 75990 (0.0008) +[2023-10-08 14:48:00,559][102898] Updated weights for policy 1, policy_version 76000 (0.0009) +[2023-10-08 14:48:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 155549696. Throughput: 0: 1774.7, 1: 1788.0. Samples: 38897334. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:01,875][101941] Avg episode reward: [(0, '8.360'), (1, '9.300')] +[2023-10-08 14:48:03,071][102897] Updated weights for policy 0, policy_version 75910 (0.0007) +[2023-10-08 14:48:03,440][102897] Updated weights for policy 0, policy_version 75920 (0.0009) +[2023-10-08 14:48:03,816][102897] Updated weights for policy 0, policy_version 75930 (0.0007) +[2023-10-08 14:48:04,338][102898] Updated weights for policy 1, policy_version 76010 (0.0010) +[2023-10-08 14:48:04,701][102898] Updated weights for policy 1, policy_version 76020 (0.0008) +[2023-10-08 14:48:05,069][102898] Updated weights for policy 1, policy_version 76030 (0.0010) +[2023-10-08 14:48:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 155615232. Throughput: 0: 1773.8, 1: 1802.8. Samples: 38908050. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:06,875][101941] Avg episode reward: [(0, '7.900'), (1, '9.630')] +[2023-10-08 14:48:07,604][102897] Updated weights for policy 0, policy_version 75940 (0.0008) +[2023-10-08 14:48:07,960][102897] Updated weights for policy 0, policy_version 75950 (0.0010) +[2023-10-08 14:48:08,333][102897] Updated weights for policy 0, policy_version 75960 (0.0011) +[2023-10-08 14:48:08,947][102898] Updated weights for policy 1, policy_version 76040 (0.0008) +[2023-10-08 14:48:09,310][102898] Updated weights for policy 1, policy_version 76050 (0.0010) +[2023-10-08 14:48:09,682][102898] Updated weights for policy 1, policy_version 76060 (0.0010) +[2023-10-08 14:48:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 155680768. Throughput: 0: 1779.1, 1: 1790.2. Samples: 38929498. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:11,876][101941] Avg episode reward: [(0, '8.460'), (1, '10.370')] +[2023-10-08 14:48:12,055][102897] Updated weights for policy 0, policy_version 75970 (0.0011) +[2023-10-08 14:48:12,433][102897] Updated weights for policy 0, policy_version 75980 (0.0007) +[2023-10-08 14:48:12,813][102897] Updated weights for policy 0, policy_version 75990 (0.0009) +[2023-10-08 14:48:13,191][102897] Updated weights for policy 0, policy_version 76000 (0.0009) +[2023-10-08 14:48:13,415][102898] Updated weights for policy 1, policy_version 76070 (0.0007) +[2023-10-08 14:48:13,783][102898] Updated weights for policy 1, policy_version 76080 (0.0008) +[2023-10-08 14:48:14,151][102898] Updated weights for policy 1, policy_version 76090 (0.0007) +[2023-10-08 14:48:16,875][101941] Fps is (10 sec: 13106.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 155746304. Throughput: 0: 1795.7, 1: 1791.9. Samples: 38951868. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:16,877][101941] Avg episode reward: [(0, '8.480'), (1, '10.940')] +[2023-10-08 14:48:16,888][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000076096_77922304.pth... +[2023-10-08 14:48:16,922][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000074432_76218368.pth +[2023-10-08 14:48:17,066][102897] Updated weights for policy 0, policy_version 76010 (0.0007) +[2023-10-08 14:48:17,438][102897] Updated weights for policy 0, policy_version 76020 (0.0008) +[2023-10-08 14:48:17,800][102897] Updated weights for policy 0, policy_version 76030 (0.0008) +[2023-10-08 14:48:17,872][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000076032_77856768.pth... +[2023-10-08 14:48:17,905][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000074336_76120064.pth +[2023-10-08 14:48:17,971][102898] Updated weights for policy 1, policy_version 76100 (0.0008) +[2023-10-08 14:48:18,369][102898] Updated weights for policy 1, policy_version 76110 (0.0009) +[2023-10-08 14:48:18,729][102898] Updated weights for policy 1, policy_version 76120 (0.0009) +[2023-10-08 14:48:21,717][102897] Updated weights for policy 0, policy_version 76040 (0.0009) +[2023-10-08 14:48:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 155811840. Throughput: 0: 1781.1, 1: 1789.1. Samples: 38961560. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:21,876][101941] Avg episode reward: [(0, '8.630'), (1, '10.280')] +[2023-10-08 14:48:22,077][102897] Updated weights for policy 0, policy_version 76050 (0.0011) +[2023-10-08 14:48:22,452][102897] Updated weights for policy 0, policy_version 76060 (0.0010) +[2023-10-08 14:48:22,487][102898] Updated weights for policy 1, policy_version 76130 (0.0008) +[2023-10-08 14:48:22,858][102898] Updated weights for policy 1, policy_version 76140 (0.0009) +[2023-10-08 14:48:23,214][102898] Updated weights for policy 1, policy_version 76150 (0.0008) +[2023-10-08 14:48:23,582][102898] Updated weights for policy 1, policy_version 76160 (0.0010) +[2023-10-08 14:48:26,263][102897] Updated weights for policy 0, policy_version 76070 (0.0007) +[2023-10-08 14:48:26,622][102897] Updated weights for policy 0, policy_version 76080 (0.0007) +[2023-10-08 14:48:26,875][101941] Fps is (10 sec: 13107.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 155877376. Throughput: 0: 1790.0, 1: 1784.8. Samples: 38983646. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:26,875][101941] Avg episode reward: [(0, '8.230'), (1, '10.750')] +[2023-10-08 14:48:26,994][102897] Updated weights for policy 0, policy_version 76090 (0.0007) +[2023-10-08 14:48:27,321][102898] Updated weights for policy 1, policy_version 76170 (0.0009) +[2023-10-08 14:48:27,692][102898] Updated weights for policy 1, policy_version 76180 (0.0010) +[2023-10-08 14:48:28,048][102898] Updated weights for policy 1, policy_version 76190 (0.0007) +[2023-10-08 14:48:30,718][102897] Updated weights for policy 0, policy_version 76100 (0.0007) +[2023-10-08 14:48:31,120][102897] Updated weights for policy 0, policy_version 76110 (0.0008) +[2023-10-08 14:48:31,488][102897] Updated weights for policy 0, policy_version 76120 (0.0008) +[2023-10-08 14:48:31,698][102898] Updated weights for policy 1, policy_version 76200 (0.0009) +[2023-10-08 14:48:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 155975680. Throughput: 0: 1790.5, 1: 1799.2. Samples: 39005018. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:48:31,875][101941] Avg episode reward: [(0, '8.590'), (1, '10.770')] +[2023-10-08 14:48:32,059][102898] Updated weights for policy 1, policy_version 76210 (0.0008) +[2023-10-08 14:48:32,424][102898] Updated weights for policy 1, policy_version 76220 (0.0008) +[2023-10-08 14:48:35,273][102897] Updated weights for policy 0, policy_version 76130 (0.0009) +[2023-10-08 14:48:35,636][102897] Updated weights for policy 0, policy_version 76140 (0.0008) +[2023-10-08 14:48:36,004][102897] Updated weights for policy 0, policy_version 76150 (0.0010) +[2023-10-08 14:48:36,375][102897] Updated weights for policy 0, policy_version 76160 (0.0009) +[2023-10-08 14:48:36,391][102898] Updated weights for policy 1, policy_version 76230 (0.0008) +[2023-10-08 14:48:36,757][102898] Updated weights for policy 1, policy_version 76240 (0.0008) +[2023-10-08 14:48:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 156041216. Throughput: 0: 1787.5, 1: 1778.8. Samples: 39015622. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:48:36,875][101941] Avg episode reward: [(0, '7.660'), (1, '10.790')] +[2023-10-08 14:48:37,119][102898] Updated weights for policy 1, policy_version 76250 (0.0009) +[2023-10-08 14:48:40,053][102897] Updated weights for policy 0, policy_version 76170 (0.0007) +[2023-10-08 14:48:40,414][102897] Updated weights for policy 0, policy_version 76180 (0.0010) +[2023-10-08 14:48:40,793][102897] Updated weights for policy 0, policy_version 76190 (0.0008) +[2023-10-08 14:48:40,824][102898] Updated weights for policy 1, policy_version 76260 (0.0010) +[2023-10-08 14:48:41,189][102898] Updated weights for policy 1, policy_version 76270 (0.0008) +[2023-10-08 14:48:41,549][102898] Updated weights for policy 1, policy_version 76280 (0.0008) +[2023-10-08 14:48:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 156139520. Throughput: 0: 1796.4, 1: 1790.7. Samples: 39036972. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:48:41,876][101941] Avg episode reward: [(0, '8.430'), (1, '10.050')] +[2023-10-08 14:48:44,461][102897] Updated weights for policy 0, policy_version 76200 (0.0007) +[2023-10-08 14:48:44,845][102897] Updated weights for policy 0, policy_version 76210 (0.0007) +[2023-10-08 14:48:45,221][102897] Updated weights for policy 0, policy_version 76220 (0.0007) +[2023-10-08 14:48:45,504][102898] Updated weights for policy 1, policy_version 76290 (0.0008) +[2023-10-08 14:48:45,872][102898] Updated weights for policy 1, policy_version 76300 (0.0009) +[2023-10-08 14:48:46,240][102898] Updated weights for policy 1, policy_version 76310 (0.0007) +[2023-10-08 14:48:46,600][102898] Updated weights for policy 1, policy_version 76320 (0.0008) +[2023-10-08 14:48:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 156205056. Throughput: 0: 1784.1, 1: 1779.7. Samples: 39057706. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:48:46,876][101941] Avg episode reward: [(0, '8.770'), (1, '10.420')] +[2023-10-08 14:48:48,961][102897] Updated weights for policy 0, policy_version 76230 (0.0010) +[2023-10-08 14:48:49,330][102897] Updated weights for policy 0, policy_version 76240 (0.0009) +[2023-10-08 14:48:49,691][102897] Updated weights for policy 0, policy_version 76250 (0.0010) +[2023-10-08 14:48:50,397][102898] Updated weights for policy 1, policy_version 76330 (0.0007) +[2023-10-08 14:48:50,767][102898] Updated weights for policy 1, policy_version 76340 (0.0007) +[2023-10-08 14:48:51,131][102898] Updated weights for policy 1, policy_version 76350 (0.0008) +[2023-10-08 14:48:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 156270592. Throughput: 0: 1794.6, 1: 1788.0. Samples: 39069268. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:48:51,875][101941] Avg episode reward: [(0, '8.710'), (1, '9.650')] +[2023-10-08 14:48:53,359][102897] Updated weights for policy 0, policy_version 76260 (0.0009) +[2023-10-08 14:48:53,733][102897] Updated weights for policy 0, policy_version 76270 (0.0007) +[2023-10-08 14:48:54,107][102897] Updated weights for policy 0, policy_version 76280 (0.0011) +[2023-10-08 14:48:54,898][102898] Updated weights for policy 1, policy_version 76360 (0.0007) +[2023-10-08 14:48:55,272][102898] Updated weights for policy 1, policy_version 76370 (0.0008) +[2023-10-08 14:48:55,635][102898] Updated weights for policy 1, policy_version 76380 (0.0010) +[2023-10-08 14:48:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 156336128. Throughput: 0: 1778.3, 1: 1790.2. Samples: 39090082. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:48:56,876][101941] Avg episode reward: [(0, '8.870'), (1, '9.940')] +[2023-10-08 14:48:58,070][102897] Updated weights for policy 0, policy_version 76290 (0.0011) +[2023-10-08 14:48:58,450][102897] Updated weights for policy 0, policy_version 76300 (0.0009) +[2023-10-08 14:48:58,821][102897] Updated weights for policy 0, policy_version 76310 (0.0009) +[2023-10-08 14:48:59,182][102897] Updated weights for policy 0, policy_version 76320 (0.0009) +[2023-10-08 14:48:59,277][102898] Updated weights for policy 1, policy_version 76390 (0.0008) +[2023-10-08 14:48:59,637][102898] Updated weights for policy 1, policy_version 76400 (0.0009) +[2023-10-08 14:49:00,009][102898] Updated weights for policy 1, policy_version 76410 (0.0011) +[2023-10-08 14:49:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 156401664. Throughput: 0: 1782.1, 1: 1777.3. Samples: 39112038. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:49:01,876][101941] Avg episode reward: [(0, '7.960'), (1, '10.420')] +[2023-10-08 14:49:02,829][102897] Updated weights for policy 0, policy_version 76330 (0.0009) +[2023-10-08 14:49:03,205][102897] Updated weights for policy 0, policy_version 76340 (0.0008) +[2023-10-08 14:49:03,579][102897] Updated weights for policy 0, policy_version 76350 (0.0007) +[2023-10-08 14:49:03,901][102898] Updated weights for policy 1, policy_version 76420 (0.0009) +[2023-10-08 14:49:04,283][102898] Updated weights for policy 1, policy_version 76430 (0.0009) +[2023-10-08 14:49:04,648][102898] Updated weights for policy 1, policy_version 76440 (0.0008) +[2023-10-08 14:49:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 156467200. Throughput: 0: 1775.5, 1: 1795.4. Samples: 39122252. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:49:06,876][101941] Avg episode reward: [(0, '7.470'), (1, '10.840')] +[2023-10-08 14:49:07,228][102897] Updated weights for policy 0, policy_version 76360 (0.0007) +[2023-10-08 14:49:07,608][102897] Updated weights for policy 0, policy_version 76370 (0.0008) +[2023-10-08 14:49:07,972][102897] Updated weights for policy 0, policy_version 76380 (0.0008) +[2023-10-08 14:49:08,426][102898] Updated weights for policy 1, policy_version 76450 (0.0008) +[2023-10-08 14:49:08,794][102898] Updated weights for policy 1, policy_version 76460 (0.0008) +[2023-10-08 14:49:09,155][102898] Updated weights for policy 1, policy_version 76470 (0.0010) +[2023-10-08 14:49:09,527][102898] Updated weights for policy 1, policy_version 76480 (0.0011) +[2023-10-08 14:49:11,564][102897] Updated weights for policy 0, policy_version 76390 (0.0008) +[2023-10-08 14:49:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 156532736. Throughput: 0: 1783.2, 1: 1781.9. Samples: 39144074. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:49:11,876][101941] Avg episode reward: [(0, '7.750'), (1, '10.260')] +[2023-10-08 14:49:11,942][102897] Updated weights for policy 0, policy_version 76400 (0.0011) +[2023-10-08 14:49:12,310][102897] Updated weights for policy 0, policy_version 76410 (0.0009) +[2023-10-08 14:49:13,238][102898] Updated weights for policy 1, policy_version 76490 (0.0009) +[2023-10-08 14:49:13,602][102898] Updated weights for policy 1, policy_version 76500 (0.0009) +[2023-10-08 14:49:13,959][102898] Updated weights for policy 1, policy_version 76510 (0.0010) +[2023-10-08 14:49:16,166][102897] Updated weights for policy 0, policy_version 76420 (0.0008) +[2023-10-08 14:49:16,549][102897] Updated weights for policy 0, policy_version 76430 (0.0009) +[2023-10-08 14:49:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 156598272. Throughput: 0: 1794.2, 1: 1780.4. Samples: 39165876. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:49:16,876][101941] Avg episode reward: [(0, '8.070'), (1, '9.500')] +[2023-10-08 14:49:16,927][102897] Updated weights for policy 0, policy_version 76440 (0.0008) +[2023-10-08 14:49:17,734][102898] Updated weights for policy 1, policy_version 76520 (0.0009) +[2023-10-08 14:49:18,101][102898] Updated weights for policy 1, policy_version 76530 (0.0009) +[2023-10-08 14:49:18,471][102898] Updated weights for policy 1, policy_version 76540 (0.0008) +[2023-10-08 14:49:20,624][102897] Updated weights for policy 0, policy_version 76450 (0.0008) +[2023-10-08 14:49:20,999][102897] Updated weights for policy 0, policy_version 76460 (0.0008) +[2023-10-08 14:49:21,358][102897] Updated weights for policy 0, policy_version 76470 (0.0007) +[2023-10-08 14:49:21,729][102897] Updated weights for policy 0, policy_version 76480 (0.0008) +[2023-10-08 14:49:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 156696576. Throughput: 0: 1784.7, 1: 1781.6. Samples: 39176104. Policy #0 lag: (min: 1.0, avg: 20.1, max: 33.0) +[2023-10-08 14:49:21,876][101941] Avg episode reward: [(0, '9.040'), (1, '10.720')] +[2023-10-08 14:49:22,151][102898] Updated weights for policy 1, policy_version 76550 (0.0008) +[2023-10-08 14:49:22,518][102898] Updated weights for policy 1, policy_version 76560 (0.0007) +[2023-10-08 14:49:22,888][102898] Updated weights for policy 1, policy_version 76570 (0.0007) +[2023-10-08 14:49:25,682][102897] Updated weights for policy 0, policy_version 76490 (0.0008) +[2023-10-08 14:49:26,057][102897] Updated weights for policy 0, policy_version 76500 (0.0010) +[2023-10-08 14:49:26,420][102897] Updated weights for policy 0, policy_version 76510 (0.0008) +[2023-10-08 14:49:26,558][102898] Updated weights for policy 1, policy_version 76580 (0.0009) +[2023-10-08 14:49:26,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 156762112. Throughput: 0: 1800.8, 1: 1784.1. Samples: 39198294. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:26,876][101941] Avg episode reward: [(0, '8.800'), (1, '10.960')] +[2023-10-08 14:49:26,932][102898] Updated weights for policy 1, policy_version 76590 (0.0008) +[2023-10-08 14:49:27,291][102898] Updated weights for policy 1, policy_version 76600 (0.0008) +[2023-10-08 14:49:30,223][102897] Updated weights for policy 0, policy_version 76520 (0.0008) +[2023-10-08 14:49:30,591][102897] Updated weights for policy 0, policy_version 76530 (0.0009) +[2023-10-08 14:49:30,961][102897] Updated weights for policy 0, policy_version 76540 (0.0008) +[2023-10-08 14:49:31,122][102898] Updated weights for policy 1, policy_version 76610 (0.0009) +[2023-10-08 14:49:31,487][102898] Updated weights for policy 1, policy_version 76620 (0.0009) +[2023-10-08 14:49:31,849][102898] Updated weights for policy 1, policy_version 76630 (0.0011) +[2023-10-08 14:49:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 156827648. Throughput: 0: 1777.4, 1: 1801.6. Samples: 39218758. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:31,876][101941] Avg episode reward: [(0, '8.610'), (1, '9.710')] +[2023-10-08 14:49:32,219][102898] Updated weights for policy 1, policy_version 76640 (0.0010) +[2023-10-08 14:49:34,806][102897] Updated weights for policy 0, policy_version 76550 (0.0008) +[2023-10-08 14:49:35,170][102897] Updated weights for policy 0, policy_version 76560 (0.0007) +[2023-10-08 14:49:35,534][102897] Updated weights for policy 0, policy_version 76570 (0.0009) +[2023-10-08 14:49:36,077][102898] Updated weights for policy 1, policy_version 76650 (0.0009) +[2023-10-08 14:49:36,438][102898] Updated weights for policy 1, policy_version 76660 (0.0007) +[2023-10-08 14:49:36,804][102898] Updated weights for policy 1, policy_version 76670 (0.0010) +[2023-10-08 14:49:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 156893184. Throughput: 0: 1800.7, 1: 1781.8. Samples: 39230480. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:36,876][101941] Avg episode reward: [(0, '8.760'), (1, '10.040')] +[2023-10-08 14:49:39,224][102897] Updated weights for policy 0, policy_version 76580 (0.0009) +[2023-10-08 14:49:39,593][102897] Updated weights for policy 0, policy_version 76590 (0.0010) +[2023-10-08 14:49:39,950][102897] Updated weights for policy 0, policy_version 76600 (0.0008) +[2023-10-08 14:49:40,394][102898] Updated weights for policy 1, policy_version 76680 (0.0010) +[2023-10-08 14:49:40,766][102898] Updated weights for policy 1, policy_version 76690 (0.0010) +[2023-10-08 14:49:41,122][102898] Updated weights for policy 1, policy_version 76700 (0.0008) +[2023-10-08 14:49:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 156991488. Throughput: 0: 1787.2, 1: 1796.3. Samples: 39251338. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:41,876][101941] Avg episode reward: [(0, '8.750'), (1, '9.660')] +[2023-10-08 14:49:43,540][102897] Updated weights for policy 0, policy_version 76610 (0.0007) +[2023-10-08 14:49:43,912][102897] Updated weights for policy 0, policy_version 76620 (0.0008) +[2023-10-08 14:49:44,276][102897] Updated weights for policy 0, policy_version 76630 (0.0008) +[2023-10-08 14:49:44,645][102897] Updated weights for policy 0, policy_version 76640 (0.0011) +[2023-10-08 14:49:44,932][102898] Updated weights for policy 1, policy_version 76710 (0.0009) +[2023-10-08 14:49:45,297][102898] Updated weights for policy 1, policy_version 76720 (0.0009) +[2023-10-08 14:49:45,665][102898] Updated weights for policy 1, policy_version 76730 (0.0010) +[2023-10-08 14:49:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 157057024. Throughput: 0: 1791.3, 1: 1781.3. Samples: 39272806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:46,876][101941] Avg episode reward: [(0, '8.130'), (1, '10.840')] +[2023-10-08 14:49:48,559][102897] Updated weights for policy 0, policy_version 76650 (0.0007) +[2023-10-08 14:49:48,931][102897] Updated weights for policy 0, policy_version 76660 (0.0007) +[2023-10-08 14:49:49,294][102897] Updated weights for policy 0, policy_version 76670 (0.0007) +[2023-10-08 14:49:49,575][102898] Updated weights for policy 1, policy_version 76740 (0.0008) +[2023-10-08 14:49:49,963][102898] Updated weights for policy 1, policy_version 76750 (0.0008) +[2023-10-08 14:49:50,337][102898] Updated weights for policy 1, policy_version 76760 (0.0008) +[2023-10-08 14:49:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 157122560. Throughput: 0: 1794.7, 1: 1801.6. Samples: 39284088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:51,876][101941] Avg episode reward: [(0, '8.620'), (1, '10.400')] +[2023-10-08 14:49:52,989][102897] Updated weights for policy 0, policy_version 76680 (0.0009) +[2023-10-08 14:49:53,362][102897] Updated weights for policy 0, policy_version 76690 (0.0007) +[2023-10-08 14:49:53,728][102897] Updated weights for policy 0, policy_version 76700 (0.0009) +[2023-10-08 14:49:54,024][102898] Updated weights for policy 1, policy_version 76770 (0.0009) +[2023-10-08 14:49:54,388][102898] Updated weights for policy 1, policy_version 76780 (0.0010) +[2023-10-08 14:49:54,754][102898] Updated weights for policy 1, policy_version 76790 (0.0007) +[2023-10-08 14:49:55,126][102898] Updated weights for policy 1, policy_version 76800 (0.0007) +[2023-10-08 14:49:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 157188096. Throughput: 0: 1791.4, 1: 1786.2. Samples: 39305066. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:49:56,876][101941] Avg episode reward: [(0, '8.930'), (1, '11.780')] +[2023-10-08 14:49:57,484][102897] Updated weights for policy 0, policy_version 76710 (0.0009) +[2023-10-08 14:49:57,855][102897] Updated weights for policy 0, policy_version 76720 (0.0008) +[2023-10-08 14:49:58,227][102897] Updated weights for policy 0, policy_version 76730 (0.0008) +[2023-10-08 14:49:58,981][102898] Updated weights for policy 1, policy_version 76810 (0.0010) +[2023-10-08 14:49:59,342][102898] Updated weights for policy 1, policy_version 76820 (0.0009) +[2023-10-08 14:49:59,717][102898] Updated weights for policy 1, policy_version 76830 (0.0008) +[2023-10-08 14:50:01,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 157253632. Throughput: 0: 1805.6, 1: 1785.1. Samples: 39327458. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:01,876][101941] Avg episode reward: [(0, '8.560'), (1, '10.310')] +[2023-10-08 14:50:02,169][102897] Updated weights for policy 0, policy_version 76740 (0.0008) +[2023-10-08 14:50:02,561][102897] Updated weights for policy 0, policy_version 76750 (0.0009) +[2023-10-08 14:50:02,942][102897] Updated weights for policy 0, policy_version 76760 (0.0007) +[2023-10-08 14:50:03,419][102898] Updated weights for policy 1, policy_version 76840 (0.0009) +[2023-10-08 14:50:03,791][102898] Updated weights for policy 1, policy_version 76850 (0.0008) +[2023-10-08 14:50:04,157][102898] Updated weights for policy 1, policy_version 76860 (0.0010) +[2023-10-08 14:50:06,603][102897] Updated weights for policy 0, policy_version 76770 (0.0008) +[2023-10-08 14:50:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 157319168. Throughput: 0: 1793.7, 1: 1786.6. Samples: 39337218. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:06,876][101941] Avg episode reward: [(0, '8.830'), (1, '9.310')] +[2023-10-08 14:50:06,966][102897] Updated weights for policy 0, policy_version 76780 (0.0009) +[2023-10-08 14:50:07,329][102897] Updated weights for policy 0, policy_version 76790 (0.0008) +[2023-10-08 14:50:07,690][102897] Updated weights for policy 0, policy_version 76800 (0.0008) +[2023-10-08 14:50:07,922][102898] Updated weights for policy 1, policy_version 76870 (0.0009) +[2023-10-08 14:50:08,291][102898] Updated weights for policy 1, policy_version 76880 (0.0008) +[2023-10-08 14:50:08,657][102898] Updated weights for policy 1, policy_version 76890 (0.0008) +[2023-10-08 14:50:11,373][102897] Updated weights for policy 0, policy_version 76810 (0.0009) +[2023-10-08 14:50:11,744][102897] Updated weights for policy 0, policy_version 76820 (0.0008) +[2023-10-08 14:50:11,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 157384704. Throughput: 0: 1797.0, 1: 1790.0. Samples: 39359710. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:11,875][101941] Avg episode reward: [(0, '8.400'), (1, '10.230')] +[2023-10-08 14:50:12,117][102897] Updated weights for policy 0, policy_version 76830 (0.0008) +[2023-10-08 14:50:12,431][102898] Updated weights for policy 1, policy_version 76900 (0.0007) +[2023-10-08 14:50:12,796][102898] Updated weights for policy 1, policy_version 76910 (0.0009) +[2023-10-08 14:50:13,164][102898] Updated weights for policy 1, policy_version 76920 (0.0011) +[2023-10-08 14:50:15,802][102897] Updated weights for policy 0, policy_version 76840 (0.0008) +[2023-10-08 14:50:16,183][102897] Updated weights for policy 0, policy_version 76850 (0.0009) +[2023-10-08 14:50:16,557][102897] Updated weights for policy 0, policy_version 76860 (0.0007) +[2023-10-08 14:50:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 157483008. Throughput: 0: 1807.9, 1: 1802.0. Samples: 39381202. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:16,876][101941] Avg episode reward: [(0, '8.900'), (1, '11.090')] +[2023-10-08 14:50:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000076864_78708736.pth... +[2023-10-08 14:50:16,914][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000075168_76972032.pth +[2023-10-08 14:50:17,005][102898] Updated weights for policy 1, policy_version 76930 (0.0007) +[2023-10-08 14:50:17,374][102898] Updated weights for policy 1, policy_version 76940 (0.0008) +[2023-10-08 14:50:17,738][102898] Updated weights for policy 1, policy_version 76950 (0.0010) +[2023-10-08 14:50:18,093][102898] Updated weights for policy 1, policy_version 76960 (0.0008) +[2023-10-08 14:50:18,094][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000076960_78807040.pth... +[2023-10-08 14:50:18,133][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000075264_77070336.pth +[2023-10-08 14:50:20,295][102897] Updated weights for policy 0, policy_version 76870 (0.0008) +[2023-10-08 14:50:20,665][102897] Updated weights for policy 0, policy_version 76880 (0.0007) +[2023-10-08 14:50:21,035][102897] Updated weights for policy 0, policy_version 76890 (0.0009) +[2023-10-08 14:50:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 157548544. Throughput: 0: 1796.4, 1: 1790.0. Samples: 39391864. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:21,876][101941] Avg episode reward: [(0, '8.380'), (1, '10.840')] +[2023-10-08 14:50:21,919][102898] Updated weights for policy 1, policy_version 76970 (0.0008) +[2023-10-08 14:50:22,290][102898] Updated weights for policy 1, policy_version 76980 (0.0010) +[2023-10-08 14:50:22,657][102898] Updated weights for policy 1, policy_version 76990 (0.0010) +[2023-10-08 14:50:24,785][102897] Updated weights for policy 0, policy_version 76900 (0.0008) +[2023-10-08 14:50:25,155][102897] Updated weights for policy 0, policy_version 76910 (0.0007) +[2023-10-08 14:50:25,521][102897] Updated weights for policy 0, policy_version 76920 (0.0007) +[2023-10-08 14:50:26,255][102898] Updated weights for policy 1, policy_version 77000 (0.0008) +[2023-10-08 14:50:26,620][102898] Updated weights for policy 1, policy_version 77010 (0.0011) +[2023-10-08 14:50:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 157614080. Throughput: 0: 1806.5, 1: 1800.5. Samples: 39413654. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:26,876][101941] Avg episode reward: [(0, '9.030'), (1, '11.390')] +[2023-10-08 14:50:26,984][102898] Updated weights for policy 1, policy_version 77020 (0.0008) +[2023-10-08 14:50:29,270][102897] Updated weights for policy 0, policy_version 76930 (0.0007) +[2023-10-08 14:50:29,640][102897] Updated weights for policy 0, policy_version 76940 (0.0008) +[2023-10-08 14:50:30,015][102897] Updated weights for policy 0, policy_version 76950 (0.0009) +[2023-10-08 14:50:30,385][102897] Updated weights for policy 0, policy_version 76960 (0.0008) +[2023-10-08 14:50:30,713][102898] Updated weights for policy 1, policy_version 77030 (0.0009) +[2023-10-08 14:50:31,078][102898] Updated weights for policy 1, policy_version 77040 (0.0007) +[2023-10-08 14:50:31,449][102898] Updated weights for policy 1, policy_version 77050 (0.0008) +[2023-10-08 14:50:31,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 157712384. Throughput: 0: 1792.0, 1: 1798.9. Samples: 39434398. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:31,876][101941] Avg episode reward: [(0, '8.760'), (1, '10.390')] +[2023-10-08 14:50:34,032][102897] Updated weights for policy 0, policy_version 76970 (0.0007) +[2023-10-08 14:50:34,399][102897] Updated weights for policy 0, policy_version 76980 (0.0007) +[2023-10-08 14:50:34,767][102897] Updated weights for policy 0, policy_version 76990 (0.0007) +[2023-10-08 14:50:35,306][102898] Updated weights for policy 1, policy_version 77060 (0.0008) +[2023-10-08 14:50:35,701][102898] Updated weights for policy 1, policy_version 77070 (0.0009) +[2023-10-08 14:50:36,065][102898] Updated weights for policy 1, policy_version 77080 (0.0010) +[2023-10-08 14:50:36,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 157777920. Throughput: 0: 1807.2, 1: 1791.2. Samples: 39446012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:36,876][101941] Avg episode reward: [(0, '8.450'), (1, '10.980')] +[2023-10-08 14:50:38,470][102897] Updated weights for policy 0, policy_version 77000 (0.0007) +[2023-10-08 14:50:38,844][102897] Updated weights for policy 0, policy_version 77010 (0.0007) +[2023-10-08 14:50:39,213][102897] Updated weights for policy 0, policy_version 77020 (0.0007) +[2023-10-08 14:50:39,860][102898] Updated weights for policy 1, policy_version 77090 (0.0011) +[2023-10-08 14:50:40,234][102898] Updated weights for policy 1, policy_version 77100 (0.0007) +[2023-10-08 14:50:40,596][102898] Updated weights for policy 1, policy_version 77110 (0.0007) +[2023-10-08 14:50:40,967][102898] Updated weights for policy 1, policy_version 77120 (0.0010) +[2023-10-08 14:50:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 157843456. Throughput: 0: 1794.1, 1: 1803.2. Samples: 39466944. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:41,876][101941] Avg episode reward: [(0, '8.260'), (1, '10.180')] +[2023-10-08 14:50:42,952][102897] Updated weights for policy 0, policy_version 77030 (0.0007) +[2023-10-08 14:50:43,326][102897] Updated weights for policy 0, policy_version 77040 (0.0007) +[2023-10-08 14:50:43,704][102897] Updated weights for policy 0, policy_version 77050 (0.0008) +[2023-10-08 14:50:44,646][102898] Updated weights for policy 1, policy_version 77130 (0.0009) +[2023-10-08 14:50:45,013][102898] Updated weights for policy 1, policy_version 77140 (0.0008) +[2023-10-08 14:50:45,380][102898] Updated weights for policy 1, policy_version 77150 (0.0009) +[2023-10-08 14:50:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 157908992. Throughput: 0: 1789.8, 1: 1791.0. Samples: 39488596. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:46,876][101941] Avg episode reward: [(0, '8.290'), (1, '11.050')] +[2023-10-08 14:50:47,458][102897] Updated weights for policy 0, policy_version 77060 (0.0009) +[2023-10-08 14:50:47,825][102897] Updated weights for policy 0, policy_version 77070 (0.0009) +[2023-10-08 14:50:48,199][102897] Updated weights for policy 0, policy_version 77080 (0.0008) +[2023-10-08 14:50:49,168][102898] Updated weights for policy 1, policy_version 77160 (0.0010) +[2023-10-08 14:50:49,536][102898] Updated weights for policy 1, policy_version 77170 (0.0009) +[2023-10-08 14:50:49,907][102898] Updated weights for policy 1, policy_version 77180 (0.0010) +[2023-10-08 14:50:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 157974528. Throughput: 0: 1791.5, 1: 1804.3. Samples: 39499026. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:51,875][101941] Avg episode reward: [(0, '8.420'), (1, '11.550')] +[2023-10-08 14:50:52,033][102897] Updated weights for policy 0, policy_version 77090 (0.0008) +[2023-10-08 14:50:52,410][102897] Updated weights for policy 0, policy_version 77100 (0.0008) +[2023-10-08 14:50:52,766][102897] Updated weights for policy 0, policy_version 77110 (0.0007) +[2023-10-08 14:50:53,139][102897] Updated weights for policy 0, policy_version 77120 (0.0007) +[2023-10-08 14:50:53,663][102898] Updated weights for policy 1, policy_version 77190 (0.0010) +[2023-10-08 14:50:54,024][102898] Updated weights for policy 1, policy_version 77200 (0.0007) +[2023-10-08 14:50:54,396][102898] Updated weights for policy 1, policy_version 77210 (0.0007) +[2023-10-08 14:50:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 158040064. Throughput: 0: 1784.8, 1: 1787.2. Samples: 39520452. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:50:56,875][101941] Avg episode reward: [(0, '8.150'), (1, '11.300')] +[2023-10-08 14:50:57,022][102897] Updated weights for policy 0, policy_version 77130 (0.0008) +[2023-10-08 14:50:57,388][102897] Updated weights for policy 0, policy_version 77140 (0.0008) +[2023-10-08 14:50:57,764][102897] Updated weights for policy 0, policy_version 77150 (0.0009) +[2023-10-08 14:50:58,071][102898] Updated weights for policy 1, policy_version 77220 (0.0009) +[2023-10-08 14:50:58,438][102898] Updated weights for policy 1, policy_version 77230 (0.0009) +[2023-10-08 14:50:58,796][102898] Updated weights for policy 1, policy_version 77240 (0.0010) +[2023-10-08 14:51:01,511][102897] Updated weights for policy 0, policy_version 77160 (0.0011) +[2023-10-08 14:51:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 158105600. Throughput: 0: 1801.1, 1: 1785.7. Samples: 39542608. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:51:01,876][101941] Avg episode reward: [(0, '7.800'), (1, '9.780')] +[2023-10-08 14:51:01,886][102897] Updated weights for policy 0, policy_version 77170 (0.0009) +[2023-10-08 14:51:02,252][102897] Updated weights for policy 0, policy_version 77180 (0.0007) +[2023-10-08 14:51:02,586][102898] Updated weights for policy 1, policy_version 77250 (0.0009) +[2023-10-08 14:51:02,960][102898] Updated weights for policy 1, policy_version 77260 (0.0007) +[2023-10-08 14:51:03,316][102898] Updated weights for policy 1, policy_version 77270 (0.0007) +[2023-10-08 14:51:03,694][102898] Updated weights for policy 1, policy_version 77280 (0.0008) +[2023-10-08 14:51:06,051][102897] Updated weights for policy 0, policy_version 77190 (0.0009) +[2023-10-08 14:51:06,419][102897] Updated weights for policy 0, policy_version 77200 (0.0011) +[2023-10-08 14:51:06,796][102897] Updated weights for policy 0, policy_version 77210 (0.0008) +[2023-10-08 14:51:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 158171136. Throughput: 0: 1781.7, 1: 1792.9. Samples: 39552722. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:51:06,875][101941] Avg episode reward: [(0, '8.300'), (1, '9.950')] +[2023-10-08 14:51:07,422][102898] Updated weights for policy 1, policy_version 77290 (0.0008) +[2023-10-08 14:51:07,799][102898] Updated weights for policy 1, policy_version 77300 (0.0007) +[2023-10-08 14:51:08,161][102898] Updated weights for policy 1, policy_version 77310 (0.0008) +[2023-10-08 14:51:10,462][102897] Updated weights for policy 0, policy_version 77220 (0.0009) +[2023-10-08 14:51:10,835][102897] Updated weights for policy 0, policy_version 77230 (0.0008) +[2023-10-08 14:51:11,199][102897] Updated weights for policy 0, policy_version 77240 (0.0009) +[2023-10-08 14:51:11,826][102898] Updated weights for policy 1, policy_version 77320 (0.0009) +[2023-10-08 14:51:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 158269440. Throughput: 0: 1800.2, 1: 1786.0. Samples: 39575032. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:11,876][101941] Avg episode reward: [(0, '8.870'), (1, '10.080')] +[2023-10-08 14:51:12,200][102898] Updated weights for policy 1, policy_version 77330 (0.0008) +[2023-10-08 14:51:12,574][102898] Updated weights for policy 1, policy_version 77340 (0.0009) +[2023-10-08 14:51:15,019][102897] Updated weights for policy 0, policy_version 77250 (0.0007) +[2023-10-08 14:51:15,392][102897] Updated weights for policy 0, policy_version 77260 (0.0008) +[2023-10-08 14:51:15,755][102897] Updated weights for policy 0, policy_version 77270 (0.0008) +[2023-10-08 14:51:16,132][102897] Updated weights for policy 0, policy_version 77280 (0.0008) +[2023-10-08 14:51:16,289][102898] Updated weights for policy 1, policy_version 77350 (0.0009) +[2023-10-08 14:51:16,661][102898] Updated weights for policy 1, policy_version 77360 (0.0011) +[2023-10-08 14:51:16,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 158334976. Throughput: 0: 1774.2, 1: 1800.4. Samples: 39595256. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:16,876][101941] Avg episode reward: [(0, '9.060'), (1, '10.940')] +[2023-10-08 14:51:17,019][102898] Updated weights for policy 1, policy_version 77370 (0.0010) +[2023-10-08 14:51:19,677][102897] Updated weights for policy 0, policy_version 77290 (0.0010) +[2023-10-08 14:51:20,058][102897] Updated weights for policy 0, policy_version 77300 (0.0010) +[2023-10-08 14:51:20,427][102897] Updated weights for policy 0, policy_version 77310 (0.0007) +[2023-10-08 14:51:20,946][102898] Updated weights for policy 1, policy_version 77380 (0.0009) +[2023-10-08 14:51:21,346][102898] Updated weights for policy 1, policy_version 77390 (0.0008) +[2023-10-08 14:51:21,715][102898] Updated weights for policy 1, policy_version 77400 (0.0009) +[2023-10-08 14:51:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 158400512. Throughput: 0: 1794.9, 1: 1783.5. Samples: 39607040. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:21,876][101941] Avg episode reward: [(0, '9.290'), (1, '10.260')] +[2023-10-08 14:51:24,219][102897] Updated weights for policy 0, policy_version 77320 (0.0010) +[2023-10-08 14:51:24,588][102897] Updated weights for policy 0, policy_version 77330 (0.0010) +[2023-10-08 14:51:24,963][102897] Updated weights for policy 0, policy_version 77340 (0.0010) +[2023-10-08 14:51:25,360][102898] Updated weights for policy 1, policy_version 77410 (0.0008) +[2023-10-08 14:51:25,725][102898] Updated weights for policy 1, policy_version 77420 (0.0007) +[2023-10-08 14:51:26,091][102898] Updated weights for policy 1, policy_version 77430 (0.0007) +[2023-10-08 14:51:26,460][102898] Updated weights for policy 1, policy_version 77440 (0.0009) +[2023-10-08 14:51:26,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 158498816. Throughput: 0: 1774.8, 1: 1801.5. Samples: 39627876. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:26,876][101941] Avg episode reward: [(0, '8.220'), (1, '10.670')] +[2023-10-08 14:51:28,706][102897] Updated weights for policy 0, policy_version 77350 (0.0008) +[2023-10-08 14:51:29,071][102897] Updated weights for policy 0, policy_version 77360 (0.0009) +[2023-10-08 14:51:29,441][102897] Updated weights for policy 0, policy_version 77370 (0.0008) +[2023-10-08 14:51:30,260][102898] Updated weights for policy 1, policy_version 77450 (0.0009) +[2023-10-08 14:51:30,634][102898] Updated weights for policy 1, policy_version 77460 (0.0007) +[2023-10-08 14:51:30,995][102898] Updated weights for policy 1, policy_version 77470 (0.0007) +[2023-10-08 14:51:31,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 158564352. Throughput: 0: 1782.2, 1: 1787.5. Samples: 39649232. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:31,876][101941] Avg episode reward: [(0, '8.060'), (1, '10.730')] +[2023-10-08 14:51:33,240][102897] Updated weights for policy 0, policy_version 77380 (0.0007) +[2023-10-08 14:51:33,628][102897] Updated weights for policy 0, policy_version 77390 (0.0007) +[2023-10-08 14:51:33,991][102897] Updated weights for policy 0, policy_version 77400 (0.0007) +[2023-10-08 14:51:34,806][102898] Updated weights for policy 1, policy_version 77480 (0.0007) +[2023-10-08 14:51:35,180][102898] Updated weights for policy 1, policy_version 77490 (0.0008) +[2023-10-08 14:51:35,541][102898] Updated weights for policy 1, policy_version 77500 (0.0009) +[2023-10-08 14:51:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 158629888. Throughput: 0: 1778.5, 1: 1809.7. Samples: 39660498. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:36,876][101941] Avg episode reward: [(0, '7.780'), (1, '10.670')] +[2023-10-08 14:51:37,602][102897] Updated weights for policy 0, policy_version 77410 (0.0010) +[2023-10-08 14:51:37,974][102897] Updated weights for policy 0, policy_version 77420 (0.0007) +[2023-10-08 14:51:38,345][102897] Updated weights for policy 0, policy_version 77430 (0.0008) +[2023-10-08 14:51:38,721][102897] Updated weights for policy 0, policy_version 77440 (0.0007) +[2023-10-08 14:51:39,277][102898] Updated weights for policy 1, policy_version 77510 (0.0008) +[2023-10-08 14:51:39,645][102898] Updated weights for policy 1, policy_version 77520 (0.0007) +[2023-10-08 14:51:40,018][102898] Updated weights for policy 1, policy_version 77530 (0.0009) +[2023-10-08 14:51:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 158695424. Throughput: 0: 1789.4, 1: 1794.2. Samples: 39681714. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:41,875][101941] Avg episode reward: [(0, '8.380'), (1, '10.410')] +[2023-10-08 14:51:42,537][102897] Updated weights for policy 0, policy_version 77450 (0.0009) +[2023-10-08 14:51:42,910][102897] Updated weights for policy 0, policy_version 77460 (0.0008) +[2023-10-08 14:51:43,269][102897] Updated weights for policy 0, policy_version 77470 (0.0007) +[2023-10-08 14:51:43,700][102898] Updated weights for policy 1, policy_version 77540 (0.0008) +[2023-10-08 14:51:44,057][102898] Updated weights for policy 1, policy_version 77550 (0.0008) +[2023-10-08 14:51:44,429][102898] Updated weights for policy 1, policy_version 77560 (0.0010) +[2023-10-08 14:51:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 158760960. Throughput: 0: 1798.4, 1: 1790.8. Samples: 39704122. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:46,876][101941] Avg episode reward: [(0, '8.460'), (1, '11.180')] +[2023-10-08 14:51:46,993][102897] Updated weights for policy 0, policy_version 77480 (0.0009) +[2023-10-08 14:51:47,359][102897] Updated weights for policy 0, policy_version 77490 (0.0007) +[2023-10-08 14:51:47,740][102897] Updated weights for policy 0, policy_version 77500 (0.0007) +[2023-10-08 14:51:48,191][102898] Updated weights for policy 1, policy_version 77570 (0.0010) +[2023-10-08 14:51:48,559][102898] Updated weights for policy 1, policy_version 77580 (0.0010) +[2023-10-08 14:51:48,924][102898] Updated weights for policy 1, policy_version 77590 (0.0009) +[2023-10-08 14:51:49,294][102898] Updated weights for policy 1, policy_version 77600 (0.0009) +[2023-10-08 14:51:51,507][102897] Updated weights for policy 0, policy_version 77510 (0.0008) +[2023-10-08 14:51:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 158826496. Throughput: 0: 1789.8, 1: 1788.7. Samples: 39713754. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:51,876][101941] Avg episode reward: [(0, '9.450'), (1, '11.200')] +[2023-10-08 14:51:51,880][102897] Updated weights for policy 0, policy_version 77520 (0.0008) +[2023-10-08 14:51:52,239][102897] Updated weights for policy 0, policy_version 77530 (0.0010) +[2023-10-08 14:51:53,090][102898] Updated weights for policy 1, policy_version 77610 (0.0007) +[2023-10-08 14:51:53,453][102898] Updated weights for policy 1, policy_version 77620 (0.0010) +[2023-10-08 14:51:53,821][102898] Updated weights for policy 1, policy_version 77630 (0.0009) +[2023-10-08 14:51:56,030][102897] Updated weights for policy 0, policy_version 77540 (0.0010) +[2023-10-08 14:51:56,401][102897] Updated weights for policy 0, policy_version 77550 (0.0009) +[2023-10-08 14:51:56,767][102897] Updated weights for policy 0, policy_version 77560 (0.0008) +[2023-10-08 14:51:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 158892032. Throughput: 0: 1792.3, 1: 1791.0. Samples: 39736282. Policy #0 lag: (min: 31.0, avg: 44.6, max: 63.0) +[2023-10-08 14:51:56,875][101941] Avg episode reward: [(0, '8.920'), (1, '11.940')] +[2023-10-08 14:51:57,381][102898] Updated weights for policy 1, policy_version 77640 (0.0010) +[2023-10-08 14:51:57,734][102898] Updated weights for policy 1, policy_version 77650 (0.0011) +[2023-10-08 14:51:58,106][102898] Updated weights for policy 1, policy_version 77660 (0.0011) +[2023-10-08 14:52:00,523][102897] Updated weights for policy 0, policy_version 77570 (0.0008) +[2023-10-08 14:52:00,886][102897] Updated weights for policy 0, policy_version 77580 (0.0008) +[2023-10-08 14:52:01,263][102897] Updated weights for policy 0, policy_version 77590 (0.0008) +[2023-10-08 14:52:01,642][102897] Updated weights for policy 0, policy_version 77600 (0.0007) +[2023-10-08 14:52:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 158990336. Throughput: 0: 1805.8, 1: 1801.4. Samples: 39757578. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:01,876][101941] Avg episode reward: [(0, '8.240'), (1, '11.490')] +[2023-10-08 14:52:02,023][102898] Updated weights for policy 1, policy_version 77670 (0.0009) +[2023-10-08 14:52:02,387][102898] Updated weights for policy 1, policy_version 77680 (0.0007) +[2023-10-08 14:52:02,766][102898] Updated weights for policy 1, policy_version 77690 (0.0007) +[2023-10-08 14:52:05,366][102897] Updated weights for policy 0, policy_version 77610 (0.0007) +[2023-10-08 14:52:05,738][102897] Updated weights for policy 0, policy_version 77620 (0.0007) +[2023-10-08 14:52:06,098][102897] Updated weights for policy 0, policy_version 77630 (0.0007) +[2023-10-08 14:52:06,659][102898] Updated weights for policy 1, policy_version 77700 (0.0007) +[2023-10-08 14:52:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 159055872. Throughput: 0: 1792.9, 1: 1793.7. Samples: 39768436. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:06,876][101941] Avg episode reward: [(0, '8.180'), (1, '10.460')] +[2023-10-08 14:52:07,054][102898] Updated weights for policy 1, policy_version 77710 (0.0008) +[2023-10-08 14:52:07,412][102898] Updated weights for policy 1, policy_version 77720 (0.0007) +[2023-10-08 14:52:09,953][102897] Updated weights for policy 0, policy_version 77640 (0.0008) +[2023-10-08 14:52:10,325][102897] Updated weights for policy 0, policy_version 77650 (0.0010) +[2023-10-08 14:52:10,696][102897] Updated weights for policy 0, policy_version 77660 (0.0009) +[2023-10-08 14:52:11,198][102898] Updated weights for policy 1, policy_version 77730 (0.0008) +[2023-10-08 14:52:11,560][102898] Updated weights for policy 1, policy_version 77740 (0.0008) +[2023-10-08 14:52:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 159121408. Throughput: 0: 1805.1, 1: 1790.5. Samples: 39789676. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:11,875][101941] Avg episode reward: [(0, '8.840'), (1, '10.500')] +[2023-10-08 14:52:11,925][102898] Updated weights for policy 1, policy_version 77750 (0.0008) +[2023-10-08 14:52:12,290][102898] Updated weights for policy 1, policy_version 77760 (0.0007) +[2023-10-08 14:52:14,415][102897] Updated weights for policy 0, policy_version 77670 (0.0008) +[2023-10-08 14:52:14,780][102897] Updated weights for policy 0, policy_version 77680 (0.0010) +[2023-10-08 14:52:15,159][102897] Updated weights for policy 0, policy_version 77690 (0.0011) +[2023-10-08 14:52:16,171][102898] Updated weights for policy 1, policy_version 77770 (0.0009) +[2023-10-08 14:52:16,544][102898] Updated weights for policy 1, policy_version 77780 (0.0007) +[2023-10-08 14:52:16,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 159186944. Throughput: 0: 1789.5, 1: 1800.1. Samples: 39810766. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:16,876][101941] Avg episode reward: [(0, '8.840'), (1, '10.980')] +[2023-10-08 14:52:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000077696_79560704.pth... +[2023-10-08 14:52:16,900][102898] Updated weights for policy 1, policy_version 77790 (0.0007) +[2023-10-08 14:52:16,916][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000076032_77856768.pth +[2023-10-08 14:52:16,971][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000077792_79659008.pth... +[2023-10-08 14:52:17,008][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000076096_77922304.pth +[2023-10-08 14:52:18,993][102897] Updated weights for policy 0, policy_version 77700 (0.0010) +[2023-10-08 14:52:19,372][102897] Updated weights for policy 0, policy_version 77710 (0.0010) +[2023-10-08 14:52:19,751][102897] Updated weights for policy 0, policy_version 77720 (0.0009) +[2023-10-08 14:52:20,750][102898] Updated weights for policy 1, policy_version 77800 (0.0009) +[2023-10-08 14:52:21,126][102898] Updated weights for policy 1, policy_version 77810 (0.0008) +[2023-10-08 14:52:21,491][102898] Updated weights for policy 1, policy_version 77820 (0.0007) +[2023-10-08 14:52:21,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 159285248. Throughput: 0: 1806.2, 1: 1777.6. Samples: 39821770. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:21,876][101941] Avg episode reward: [(0, '8.480'), (1, '10.520')] +[2023-10-08 14:52:23,583][102897] Updated weights for policy 0, policy_version 77730 (0.0007) +[2023-10-08 14:52:23,950][102897] Updated weights for policy 0, policy_version 77740 (0.0007) +[2023-10-08 14:52:24,324][102897] Updated weights for policy 0, policy_version 77750 (0.0007) +[2023-10-08 14:52:24,699][102897] Updated weights for policy 0, policy_version 77760 (0.0008) +[2023-10-08 14:52:25,159][102898] Updated weights for policy 1, policy_version 77830 (0.0008) +[2023-10-08 14:52:25,522][102898] Updated weights for policy 1, policy_version 77840 (0.0011) +[2023-10-08 14:52:25,892][102898] Updated weights for policy 1, policy_version 77850 (0.0007) +[2023-10-08 14:52:26,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 159350784. Throughput: 0: 1780.7, 1: 1795.5. Samples: 39842644. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:26,875][101941] Avg episode reward: [(0, '8.620'), (1, '10.610')] +[2023-10-08 14:52:28,359][102897] Updated weights for policy 0, policy_version 77770 (0.0007) +[2023-10-08 14:52:28,730][102897] Updated weights for policy 0, policy_version 77780 (0.0007) +[2023-10-08 14:52:29,096][102897] Updated weights for policy 0, policy_version 77790 (0.0010) +[2023-10-08 14:52:29,720][102898] Updated weights for policy 1, policy_version 77860 (0.0007) +[2023-10-08 14:52:30,090][102898] Updated weights for policy 1, policy_version 77870 (0.0008) +[2023-10-08 14:52:30,450][102898] Updated weights for policy 1, policy_version 77880 (0.0007) +[2023-10-08 14:52:31,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 159416320. Throughput: 0: 1779.0, 1: 1779.3. Samples: 39864244. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:31,875][101941] Avg episode reward: [(0, '8.180'), (1, '10.400')] +[2023-10-08 14:52:32,930][102897] Updated weights for policy 0, policy_version 77800 (0.0008) +[2023-10-08 14:52:33,302][102897] Updated weights for policy 0, policy_version 77810 (0.0007) +[2023-10-08 14:52:33,672][102897] Updated weights for policy 0, policy_version 77820 (0.0007) +[2023-10-08 14:52:34,319][102898] Updated weights for policy 1, policy_version 77890 (0.0008) +[2023-10-08 14:52:34,684][102898] Updated weights for policy 1, policy_version 77900 (0.0009) +[2023-10-08 14:52:35,050][102898] Updated weights for policy 1, policy_version 77910 (0.0008) +[2023-10-08 14:52:35,415][102898] Updated weights for policy 1, policy_version 77920 (0.0010) +[2023-10-08 14:52:36,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 159481856. Throughput: 0: 1778.7, 1: 1803.5. Samples: 39874958. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:36,876][101941] Avg episode reward: [(0, '8.020'), (1, '10.570')] +[2023-10-08 14:52:37,518][102897] Updated weights for policy 0, policy_version 77830 (0.0011) +[2023-10-08 14:52:37,890][102897] Updated weights for policy 0, policy_version 77840 (0.0009) +[2023-10-08 14:52:38,261][102897] Updated weights for policy 0, policy_version 77850 (0.0007) +[2023-10-08 14:52:39,160][102898] Updated weights for policy 1, policy_version 77930 (0.0010) +[2023-10-08 14:52:39,525][102898] Updated weights for policy 1, policy_version 77940 (0.0008) +[2023-10-08 14:52:39,898][102898] Updated weights for policy 1, policy_version 77950 (0.0008) +[2023-10-08 14:52:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 159547392. Throughput: 0: 1776.7, 1: 1774.8. Samples: 39896096. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:41,876][101941] Avg episode reward: [(0, '8.400'), (1, '10.530')] +[2023-10-08 14:52:42,150][102897] Updated weights for policy 0, policy_version 77860 (0.0007) +[2023-10-08 14:52:42,523][102897] Updated weights for policy 0, policy_version 77870 (0.0008) +[2023-10-08 14:52:42,896][102897] Updated weights for policy 0, policy_version 77880 (0.0008) +[2023-10-08 14:52:43,646][102898] Updated weights for policy 1, policy_version 77960 (0.0008) +[2023-10-08 14:52:44,014][102898] Updated weights for policy 1, policy_version 77970 (0.0009) +[2023-10-08 14:52:44,370][102898] Updated weights for policy 1, policy_version 77980 (0.0007) +[2023-10-08 14:52:46,744][102897] Updated weights for policy 0, policy_version 77890 (0.0007) +[2023-10-08 14:52:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 159612928. Throughput: 0: 1797.5, 1: 1780.0. Samples: 39918570. Policy #0 lag: (min: 4.0, avg: 9.9, max: 36.0) +[2023-10-08 14:52:46,876][101941] Avg episode reward: [(0, '8.930'), (1, '10.670')] +[2023-10-08 14:52:47,107][102897] Updated weights for policy 0, policy_version 77900 (0.0007) +[2023-10-08 14:52:47,482][102897] Updated weights for policy 0, policy_version 77910 (0.0007) +[2023-10-08 14:52:47,849][102897] Updated weights for policy 0, policy_version 77920 (0.0009) +[2023-10-08 14:52:48,026][102898] Updated weights for policy 1, policy_version 77990 (0.0008) +[2023-10-08 14:52:48,393][102898] Updated weights for policy 1, policy_version 78000 (0.0009) +[2023-10-08 14:52:48,765][102898] Updated weights for policy 1, policy_version 78010 (0.0009) +[2023-10-08 14:52:51,641][102897] Updated weights for policy 0, policy_version 77930 (0.0008) +[2023-10-08 14:52:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 159678464. Throughput: 0: 1774.7, 1: 1778.9. Samples: 39928346. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:52:51,875][101941] Avg episode reward: [(0, '8.940'), (1, '10.970')] +[2023-10-08 14:52:52,011][102897] Updated weights for policy 0, policy_version 77940 (0.0008) +[2023-10-08 14:52:52,386][102897] Updated weights for policy 0, policy_version 77950 (0.0009) +[2023-10-08 14:52:52,523][102898] Updated weights for policy 1, policy_version 78020 (0.0007) +[2023-10-08 14:52:52,884][102898] Updated weights for policy 1, policy_version 78030 (0.0007) +[2023-10-08 14:52:53,253][102898] Updated weights for policy 1, policy_version 78040 (0.0007) +[2023-10-08 14:52:56,193][102897] Updated weights for policy 0, policy_version 77960 (0.0007) +[2023-10-08 14:52:56,559][102897] Updated weights for policy 0, policy_version 77970 (0.0008) +[2023-10-08 14:52:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 159744000. Throughput: 0: 1794.6, 1: 1784.8. Samples: 39950750. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:52:56,875][101941] Avg episode reward: [(0, '9.410'), (1, '11.530')] +[2023-10-08 14:52:56,925][102897] Updated weights for policy 0, policy_version 77980 (0.0009) +[2023-10-08 14:52:56,991][102898] Updated weights for policy 1, policy_version 78050 (0.0008) +[2023-10-08 14:52:57,401][102898] Updated weights for policy 1, policy_version 78060 (0.0009) +[2023-10-08 14:52:57,764][102898] Updated weights for policy 1, policy_version 78070 (0.0010) +[2023-10-08 14:52:58,125][102898] Updated weights for policy 1, policy_version 78080 (0.0010) +[2023-10-08 14:53:00,608][102897] Updated weights for policy 0, policy_version 77990 (0.0010) +[2023-10-08 14:53:00,974][102897] Updated weights for policy 0, policy_version 78000 (0.0007) +[2023-10-08 14:53:01,338][102897] Updated weights for policy 0, policy_version 78010 (0.0007) +[2023-10-08 14:53:01,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 159842304. Throughput: 0: 1783.3, 1: 1800.4. Samples: 39972034. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:01,876][101941] Avg episode reward: [(0, '9.370'), (1, '11.820')] +[2023-10-08 14:53:01,948][102898] Updated weights for policy 1, policy_version 78090 (0.0010) +[2023-10-08 14:53:02,305][102898] Updated weights for policy 1, policy_version 78100 (0.0009) +[2023-10-08 14:53:02,676][102898] Updated weights for policy 1, policy_version 78110 (0.0009) +[2023-10-08 14:53:05,169][102897] Updated weights for policy 0, policy_version 78020 (0.0008) +[2023-10-08 14:53:05,564][102897] Updated weights for policy 0, policy_version 78030 (0.0007) +[2023-10-08 14:53:05,929][102897] Updated weights for policy 0, policy_version 78040 (0.0007) +[2023-10-08 14:53:06,390][102898] Updated weights for policy 1, policy_version 78120 (0.0008) +[2023-10-08 14:53:06,742][102898] Updated weights for policy 1, policy_version 78130 (0.0010) +[2023-10-08 14:53:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 159907840. Throughput: 0: 1790.7, 1: 1784.8. Samples: 39982666. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:06,875][101941] Avg episode reward: [(0, '8.450'), (1, '11.250')] +[2023-10-08 14:53:07,106][102898] Updated weights for policy 1, policy_version 78140 (0.0010) +[2023-10-08 14:53:09,650][102897] Updated weights for policy 0, policy_version 78050 (0.0009) +[2023-10-08 14:53:10,016][102897] Updated weights for policy 0, policy_version 78060 (0.0007) +[2023-10-08 14:53:10,389][102897] Updated weights for policy 0, policy_version 78070 (0.0010) +[2023-10-08 14:53:10,761][102897] Updated weights for policy 0, policy_version 78080 (0.0007) +[2023-10-08 14:53:10,985][102898] Updated weights for policy 1, policy_version 78150 (0.0010) +[2023-10-08 14:53:11,358][102898] Updated weights for policy 1, policy_version 78160 (0.0010) +[2023-10-08 14:53:11,722][102898] Updated weights for policy 1, policy_version 78170 (0.0009) +[2023-10-08 14:53:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 159973376. Throughput: 0: 1782.0, 1: 1797.4. Samples: 40003716. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:11,875][101941] Avg episode reward: [(0, '8.670'), (1, '10.900')] +[2023-10-08 14:53:14,722][102897] Updated weights for policy 0, policy_version 78090 (0.0009) +[2023-10-08 14:53:15,091][102897] Updated weights for policy 0, policy_version 78100 (0.0011) +[2023-10-08 14:53:15,447][102898] Updated weights for policy 1, policy_version 78180 (0.0009) +[2023-10-08 14:53:15,468][102897] Updated weights for policy 0, policy_version 78110 (0.0009) +[2023-10-08 14:53:15,808][102898] Updated weights for policy 1, policy_version 78190 (0.0009) +[2023-10-08 14:53:16,171][102898] Updated weights for policy 1, policy_version 78200 (0.0009) +[2023-10-08 14:53:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 160071680. Throughput: 0: 1764.6, 1: 1788.7. Samples: 40024142. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:16,875][101941] Avg episode reward: [(0, '9.160'), (1, '10.670')] +[2023-10-08 14:53:19,169][102897] Updated weights for policy 0, policy_version 78120 (0.0010) +[2023-10-08 14:53:19,557][102897] Updated weights for policy 0, policy_version 78130 (0.0008) +[2023-10-08 14:53:19,917][102898] Updated weights for policy 1, policy_version 78210 (0.0007) +[2023-10-08 14:53:19,929][102897] Updated weights for policy 0, policy_version 78140 (0.0008) +[2023-10-08 14:53:20,289][102898] Updated weights for policy 1, policy_version 78220 (0.0008) +[2023-10-08 14:53:20,652][102898] Updated weights for policy 1, policy_version 78230 (0.0009) +[2023-10-08 14:53:21,019][102898] Updated weights for policy 1, policy_version 78240 (0.0007) +[2023-10-08 14:53:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 160137216. Throughput: 0: 1789.1, 1: 1795.2. Samples: 40036250. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:21,875][101941] Avg episode reward: [(0, '8.510'), (1, '10.650')] +[2023-10-08 14:53:23,740][102897] Updated weights for policy 0, policy_version 78150 (0.0008) +[2023-10-08 14:53:24,119][102897] Updated weights for policy 0, policy_version 78160 (0.0011) +[2023-10-08 14:53:24,491][102897] Updated weights for policy 0, policy_version 78170 (0.0011) +[2023-10-08 14:53:24,757][102898] Updated weights for policy 1, policy_version 78250 (0.0007) +[2023-10-08 14:53:25,125][102898] Updated weights for policy 1, policy_version 78260 (0.0007) +[2023-10-08 14:53:25,500][102898] Updated weights for policy 1, policy_version 78270 (0.0007) +[2023-10-08 14:53:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 160202752. Throughput: 0: 1768.7, 1: 1794.7. Samples: 40056452. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:26,876][101941] Avg episode reward: [(0, '9.040'), (1, '10.540')] +[2023-10-08 14:53:28,315][102897] Updated weights for policy 0, policy_version 78180 (0.0008) +[2023-10-08 14:53:28,695][102897] Updated weights for policy 0, policy_version 78190 (0.0010) +[2023-10-08 14:53:29,063][102897] Updated weights for policy 0, policy_version 78200 (0.0010) +[2023-10-08 14:53:29,113][102898] Updated weights for policy 1, policy_version 78280 (0.0009) +[2023-10-08 14:53:29,474][102898] Updated weights for policy 1, policy_version 78290 (0.0009) +[2023-10-08 14:53:29,842][102898] Updated weights for policy 1, policy_version 78300 (0.0008) +[2023-10-08 14:53:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 160268288. Throughput: 0: 1770.5, 1: 1784.0. Samples: 40078520. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:31,876][101941] Avg episode reward: [(0, '8.830'), (1, '10.230')] +[2023-10-08 14:53:32,782][102897] Updated weights for policy 0, policy_version 78210 (0.0008) +[2023-10-08 14:53:33,143][102897] Updated weights for policy 0, policy_version 78220 (0.0008) +[2023-10-08 14:53:33,506][102897] Updated weights for policy 0, policy_version 78230 (0.0007) +[2023-10-08 14:53:33,780][102898] Updated weights for policy 1, policy_version 78310 (0.0009) +[2023-10-08 14:53:33,872][102897] Updated weights for policy 0, policy_version 78240 (0.0009) +[2023-10-08 14:53:34,144][102898] Updated weights for policy 1, policy_version 78320 (0.0007) +[2023-10-08 14:53:34,511][102898] Updated weights for policy 1, policy_version 78330 (0.0009) +[2023-10-08 14:53:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 160333824. Throughput: 0: 1770.2, 1: 1792.4. Samples: 40088664. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 14:53:36,876][101941] Avg episode reward: [(0, '8.780'), (1, '10.580')] +[2023-10-08 14:53:37,595][102897] Updated weights for policy 0, policy_version 78250 (0.0008) +[2023-10-08 14:53:37,956][102897] Updated weights for policy 0, policy_version 78260 (0.0008) +[2023-10-08 14:53:38,322][102897] Updated weights for policy 0, policy_version 78270 (0.0010) +[2023-10-08 14:53:38,435][102898] Updated weights for policy 1, policy_version 78340 (0.0010) +[2023-10-08 14:53:38,795][102898] Updated weights for policy 1, policy_version 78350 (0.0007) +[2023-10-08 14:53:39,171][102898] Updated weights for policy 1, policy_version 78360 (0.0008) +[2023-10-08 14:53:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 160399360. Throughput: 0: 1774.0, 1: 1777.1. Samples: 40110548. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:53:41,876][101941] Avg episode reward: [(0, '8.650'), (1, '11.200')] +[2023-10-08 14:53:42,009][102897] Updated weights for policy 0, policy_version 78280 (0.0010) +[2023-10-08 14:53:42,373][102897] Updated weights for policy 0, policy_version 78290 (0.0009) +[2023-10-08 14:53:42,746][102897] Updated weights for policy 0, policy_version 78300 (0.0008) +[2023-10-08 14:53:43,026][102898] Updated weights for policy 1, policy_version 78370 (0.0009) +[2023-10-08 14:53:43,429][102898] Updated weights for policy 1, policy_version 78380 (0.0007) +[2023-10-08 14:53:43,807][102898] Updated weights for policy 1, policy_version 78390 (0.0008) +[2023-10-08 14:53:44,173][102898] Updated weights for policy 1, policy_version 78400 (0.0008) +[2023-10-08 14:53:46,420][102897] Updated weights for policy 0, policy_version 78310 (0.0008) +[2023-10-08 14:53:46,787][102897] Updated weights for policy 0, policy_version 78320 (0.0010) +[2023-10-08 14:53:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 160464896. Throughput: 0: 1794.8, 1: 1775.4. Samples: 40132694. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:53:46,876][101941] Avg episode reward: [(0, '8.640'), (1, '9.620')] +[2023-10-08 14:53:47,150][102897] Updated weights for policy 0, policy_version 78330 (0.0008) +[2023-10-08 14:53:47,744][102898] Updated weights for policy 1, policy_version 78410 (0.0009) +[2023-10-08 14:53:48,119][102898] Updated weights for policy 1, policy_version 78420 (0.0007) +[2023-10-08 14:53:48,477][102898] Updated weights for policy 1, policy_version 78430 (0.0008) +[2023-10-08 14:53:51,042][102897] Updated weights for policy 0, policy_version 78340 (0.0007) +[2023-10-08 14:53:51,435][102897] Updated weights for policy 0, policy_version 78350 (0.0009) +[2023-10-08 14:53:51,807][102897] Updated weights for policy 0, policy_version 78360 (0.0008) +[2023-10-08 14:53:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 160530432. Throughput: 0: 1776.5, 1: 1775.7. Samples: 40142518. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:53:51,875][101941] Avg episode reward: [(0, '7.890'), (1, '10.410')] +[2023-10-08 14:53:52,411][102898] Updated weights for policy 1, policy_version 78440 (0.0011) +[2023-10-08 14:53:52,772][102898] Updated weights for policy 1, policy_version 78450 (0.0011) +[2023-10-08 14:53:53,135][102898] Updated weights for policy 1, policy_version 78460 (0.0010) +[2023-10-08 14:53:55,505][102897] Updated weights for policy 0, policy_version 78370 (0.0009) +[2023-10-08 14:53:55,870][102897] Updated weights for policy 0, policy_version 78380 (0.0010) +[2023-10-08 14:53:56,245][102897] Updated weights for policy 0, policy_version 78390 (0.0008) +[2023-10-08 14:53:56,618][102897] Updated weights for policy 0, policy_version 78400 (0.0008) +[2023-10-08 14:53:56,865][102898] Updated weights for policy 1, policy_version 78470 (0.0007) +[2023-10-08 14:53:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 160628736. Throughput: 0: 1798.4, 1: 1772.7. Samples: 40164414. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:53:56,876][101941] Avg episode reward: [(0, '8.630'), (1, '10.870')] +[2023-10-08 14:53:57,233][102898] Updated weights for policy 1, policy_version 78480 (0.0007) +[2023-10-08 14:53:57,608][102898] Updated weights for policy 1, policy_version 78490 (0.0007) +[2023-10-08 14:54:00,423][102897] Updated weights for policy 0, policy_version 78410 (0.0010) +[2023-10-08 14:54:00,798][102897] Updated weights for policy 0, policy_version 78420 (0.0008) +[2023-10-08 14:54:01,166][102897] Updated weights for policy 0, policy_version 78430 (0.0007) +[2023-10-08 14:54:01,344][102898] Updated weights for policy 1, policy_version 78500 (0.0008) +[2023-10-08 14:54:01,710][102898] Updated weights for policy 1, policy_version 78510 (0.0010) +[2023-10-08 14:54:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 160694272. Throughput: 0: 1782.0, 1: 1800.3. Samples: 40185344. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:54:01,876][101941] Avg episode reward: [(0, '9.230'), (1, '10.440')] +[2023-10-08 14:54:02,075][102898] Updated weights for policy 1, policy_version 78520 (0.0009) +[2023-10-08 14:54:04,855][102897] Updated weights for policy 0, policy_version 78440 (0.0007) +[2023-10-08 14:54:05,228][102897] Updated weights for policy 0, policy_version 78450 (0.0007) +[2023-10-08 14:54:05,595][102897] Updated weights for policy 0, policy_version 78460 (0.0007) +[2023-10-08 14:54:05,877][102898] Updated weights for policy 1, policy_version 78530 (0.0007) +[2023-10-08 14:54:06,248][102898] Updated weights for policy 1, policy_version 78540 (0.0008) +[2023-10-08 14:54:06,611][102898] Updated weights for policy 1, policy_version 78550 (0.0007) +[2023-10-08 14:54:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 160759808. Throughput: 0: 1794.2, 1: 1773.3. Samples: 40196786. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:54:06,876][101941] Avg episode reward: [(0, '8.620'), (1, '10.570')] +[2023-10-08 14:54:06,984][102898] Updated weights for policy 1, policy_version 78560 (0.0011) +[2023-10-08 14:54:09,466][102897] Updated weights for policy 0, policy_version 78470 (0.0008) +[2023-10-08 14:54:09,833][102897] Updated weights for policy 0, policy_version 78480 (0.0007) +[2023-10-08 14:54:10,198][102897] Updated weights for policy 0, policy_version 78490 (0.0008) +[2023-10-08 14:54:10,557][102898] Updated weights for policy 1, policy_version 78570 (0.0008) +[2023-10-08 14:54:10,916][102898] Updated weights for policy 1, policy_version 78580 (0.0010) +[2023-10-08 14:54:11,281][102898] Updated weights for policy 1, policy_version 78590 (0.0009) +[2023-10-08 14:54:11,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 160858112. Throughput: 0: 1785.0, 1: 1801.1. Samples: 40217826. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:54:11,876][101941] Avg episode reward: [(0, '7.550'), (1, '10.950')] +[2023-10-08 14:54:14,006][102897] Updated weights for policy 0, policy_version 78500 (0.0008) +[2023-10-08 14:54:14,359][102897] Updated weights for policy 0, policy_version 78510 (0.0009) +[2023-10-08 14:54:14,738][102897] Updated weights for policy 0, policy_version 78520 (0.0009) +[2023-10-08 14:54:15,185][102898] Updated weights for policy 1, policy_version 78600 (0.0007) +[2023-10-08 14:54:15,558][102898] Updated weights for policy 1, policy_version 78610 (0.0009) +[2023-10-08 14:54:15,924][102898] Updated weights for policy 1, policy_version 78620 (0.0008) +[2023-10-08 14:54:16,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 160923648. Throughput: 0: 1783.8, 1: 1783.9. Samples: 40239064. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:54:16,876][101941] Avg episode reward: [(0, '8.030'), (1, '10.780')] +[2023-10-08 14:54:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000078528_80412672.pth... +[2023-10-08 14:54:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000078624_80510976.pth... +[2023-10-08 14:54:16,914][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000076864_78708736.pth +[2023-10-08 14:54:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000076960_78807040.pth +[2023-10-08 14:54:18,452][102897] Updated weights for policy 0, policy_version 78530 (0.0009) +[2023-10-08 14:54:18,822][102897] Updated weights for policy 0, policy_version 78540 (0.0007) +[2023-10-08 14:54:19,200][102897] Updated weights for policy 0, policy_version 78550 (0.0007) +[2023-10-08 14:54:19,554][102898] Updated weights for policy 1, policy_version 78630 (0.0009) +[2023-10-08 14:54:19,563][102897] Updated weights for policy 0, policy_version 78560 (0.0008) +[2023-10-08 14:54:19,915][102898] Updated weights for policy 1, policy_version 78640 (0.0009) +[2023-10-08 14:54:20,279][102898] Updated weights for policy 1, policy_version 78650 (0.0008) +[2023-10-08 14:54:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 160989184. Throughput: 0: 1788.2, 1: 1805.4. Samples: 40250376. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:54:21,876][101941] Avg episode reward: [(0, '8.070'), (1, '10.910')] +[2023-10-08 14:54:23,445][102897] Updated weights for policy 0, policy_version 78570 (0.0008) +[2023-10-08 14:54:23,820][102897] Updated weights for policy 0, policy_version 78580 (0.0008) +[2023-10-08 14:54:23,981][102898] Updated weights for policy 1, policy_version 78660 (0.0010) +[2023-10-08 14:54:24,195][102897] Updated weights for policy 0, policy_version 78590 (0.0008) +[2023-10-08 14:54:24,349][102898] Updated weights for policy 1, policy_version 78670 (0.0009) +[2023-10-08 14:54:24,723][102898] Updated weights for policy 1, policy_version 78680 (0.0010) +[2023-10-08 14:54:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 161054720. Throughput: 0: 1776.2, 1: 1792.5. Samples: 40271140. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:54:26,875][101941] Avg episode reward: [(0, '8.770'), (1, '10.980')] +[2023-10-08 14:54:27,996][102897] Updated weights for policy 0, policy_version 78600 (0.0008) +[2023-10-08 14:54:28,365][102897] Updated weights for policy 0, policy_version 78610 (0.0009) +[2023-10-08 14:54:28,619][102898] Updated weights for policy 1, policy_version 78690 (0.0010) +[2023-10-08 14:54:28,740][102897] Updated weights for policy 0, policy_version 78620 (0.0007) +[2023-10-08 14:54:28,988][102898] Updated weights for policy 1, policy_version 78700 (0.0010) +[2023-10-08 14:54:29,353][102898] Updated weights for policy 1, policy_version 78710 (0.0009) +[2023-10-08 14:54:29,717][102898] Updated weights for policy 1, policy_version 78720 (0.0008) +[2023-10-08 14:54:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 161120256. Throughput: 0: 1777.6, 1: 1790.7. Samples: 40293268. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:54:31,876][101941] Avg episode reward: [(0, '8.700'), (1, '11.590')] +[2023-10-08 14:54:32,455][102897] Updated weights for policy 0, policy_version 78630 (0.0008) +[2023-10-08 14:54:32,824][102897] Updated weights for policy 0, policy_version 78640 (0.0008) +[2023-10-08 14:54:33,193][102897] Updated weights for policy 0, policy_version 78650 (0.0007) +[2023-10-08 14:54:33,500][102898] Updated weights for policy 1, policy_version 78730 (0.0009) +[2023-10-08 14:54:33,870][102898] Updated weights for policy 1, policy_version 78740 (0.0009) +[2023-10-08 14:54:34,232][102898] Updated weights for policy 1, policy_version 78750 (0.0008) +[2023-10-08 14:54:36,801][102897] Updated weights for policy 0, policy_version 78660 (0.0008) +[2023-10-08 14:54:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 161185792. Throughput: 0: 1773.5, 1: 1794.7. Samples: 40303086. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:54:36,875][101941] Avg episode reward: [(0, '7.760'), (1, '12.280')] +[2023-10-08 14:54:36,876][102760] Saving new best policy, reward=12.280! +[2023-10-08 14:54:37,189][102897] Updated weights for policy 0, policy_version 78670 (0.0009) +[2023-10-08 14:54:37,556][102897] Updated weights for policy 0, policy_version 78680 (0.0008) +[2023-10-08 14:54:37,772][102898] Updated weights for policy 1, policy_version 78760 (0.0008) +[2023-10-08 14:54:38,141][102898] Updated weights for policy 1, policy_version 78770 (0.0009) +[2023-10-08 14:54:38,515][102898] Updated weights for policy 1, policy_version 78780 (0.0008) +[2023-10-08 14:54:41,321][102897] Updated weights for policy 0, policy_version 78690 (0.0008) +[2023-10-08 14:54:41,701][102897] Updated weights for policy 0, policy_version 78700 (0.0008) +[2023-10-08 14:54:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 161251328. Throughput: 0: 1780.1, 1: 1802.6. Samples: 40325634. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:54:41,876][101941] Avg episode reward: [(0, '8.090'), (1, '13.120')] +[2023-10-08 14:54:41,878][102760] Saving new best policy, reward=13.120! +[2023-10-08 14:54:42,074][102897] Updated weights for policy 0, policy_version 78710 (0.0008) +[2023-10-08 14:54:42,372][102898] Updated weights for policy 1, policy_version 78790 (0.0008) +[2023-10-08 14:54:42,445][102897] Updated weights for policy 0, policy_version 78720 (0.0007) +[2023-10-08 14:54:42,739][102898] Updated weights for policy 1, policy_version 78800 (0.0007) +[2023-10-08 14:54:43,103][102898] Updated weights for policy 1, policy_version 78810 (0.0009) +[2023-10-08 14:54:46,183][102897] Updated weights for policy 0, policy_version 78730 (0.0008) +[2023-10-08 14:54:46,560][102897] Updated weights for policy 0, policy_version 78740 (0.0007) +[2023-10-08 14:54:46,794][102898] Updated weights for policy 1, policy_version 78820 (0.0008) +[2023-10-08 14:54:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 161316864. Throughput: 0: 1796.4, 1: 1801.8. Samples: 40347264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:54:46,875][101941] Avg episode reward: [(0, '8.020'), (1, '12.040')] +[2023-10-08 14:54:46,929][102897] Updated weights for policy 0, policy_version 78750 (0.0007) +[2023-10-08 14:54:47,152][102898] Updated weights for policy 1, policy_version 78830 (0.0008) +[2023-10-08 14:54:47,518][102898] Updated weights for policy 1, policy_version 78840 (0.0009) +[2023-10-08 14:54:50,871][102897] Updated weights for policy 0, policy_version 78760 (0.0008) +[2023-10-08 14:54:51,240][102897] Updated weights for policy 0, policy_version 78770 (0.0008) +[2023-10-08 14:54:51,416][102898] Updated weights for policy 1, policy_version 78850 (0.0008) +[2023-10-08 14:54:51,606][102897] Updated weights for policy 0, policy_version 78780 (0.0007) +[2023-10-08 14:54:51,776][102898] Updated weights for policy 1, policy_version 78860 (0.0008) +[2023-10-08 14:54:51,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 161415168. Throughput: 0: 1775.7, 1: 1793.7. Samples: 40357412. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:54:51,875][101941] Avg episode reward: [(0, '8.750'), (1, '10.080')] +[2023-10-08 14:54:52,145][102898] Updated weights for policy 1, policy_version 78870 (0.0008) +[2023-10-08 14:54:52,512][102898] Updated weights for policy 1, policy_version 78880 (0.0008) +[2023-10-08 14:54:55,398][102897] Updated weights for policy 0, policy_version 78790 (0.0008) +[2023-10-08 14:54:55,765][102897] Updated weights for policy 0, policy_version 78800 (0.0010) +[2023-10-08 14:54:56,138][102897] Updated weights for policy 0, policy_version 78810 (0.0009) +[2023-10-08 14:54:56,260][102898] Updated weights for policy 1, policy_version 78890 (0.0007) +[2023-10-08 14:54:56,617][102898] Updated weights for policy 1, policy_version 78900 (0.0010) +[2023-10-08 14:54:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 161480704. Throughput: 0: 1794.4, 1: 1795.3. Samples: 40379362. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:54:56,875][101941] Avg episode reward: [(0, '9.380'), (1, '11.200')] +[2023-10-08 14:54:56,984][102898] Updated weights for policy 1, policy_version 78910 (0.0011) +[2023-10-08 14:55:00,026][102897] Updated weights for policy 0, policy_version 78820 (0.0007) +[2023-10-08 14:55:00,393][102897] Updated weights for policy 0, policy_version 78830 (0.0008) +[2023-10-08 14:55:00,758][102897] Updated weights for policy 0, policy_version 78840 (0.0008) +[2023-10-08 14:55:00,908][102898] Updated weights for policy 1, policy_version 78920 (0.0009) +[2023-10-08 14:55:01,275][102898] Updated weights for policy 1, policy_version 78930 (0.0009) +[2023-10-08 14:55:01,638][102898] Updated weights for policy 1, policy_version 78940 (0.0009) +[2023-10-08 14:55:01,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 161579008. Throughput: 0: 1767.4, 1: 1787.8. Samples: 40399048. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:55:01,876][101941] Avg episode reward: [(0, '8.630'), (1, '12.090')] +[2023-10-08 14:55:04,550][102897] Updated weights for policy 0, policy_version 78850 (0.0008) +[2023-10-08 14:55:04,926][102897] Updated weights for policy 0, policy_version 78860 (0.0008) +[2023-10-08 14:55:05,298][102897] Updated weights for policy 0, policy_version 78870 (0.0007) +[2023-10-08 14:55:05,454][102898] Updated weights for policy 1, policy_version 78950 (0.0009) +[2023-10-08 14:55:05,662][102897] Updated weights for policy 0, policy_version 78880 (0.0008) +[2023-10-08 14:55:05,827][102898] Updated weights for policy 1, policy_version 78960 (0.0009) +[2023-10-08 14:55:06,201][102898] Updated weights for policy 1, policy_version 78970 (0.0009) +[2023-10-08 14:55:06,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 161644544. Throughput: 0: 1792.6, 1: 1782.1. Samples: 40411238. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:55:06,876][101941] Avg episode reward: [(0, '8.360'), (1, '11.430')] +[2023-10-08 14:55:09,492][102897] Updated weights for policy 0, policy_version 78890 (0.0008) +[2023-10-08 14:55:09,858][102897] Updated weights for policy 0, policy_version 78900 (0.0008) +[2023-10-08 14:55:09,933][102898] Updated weights for policy 1, policy_version 78980 (0.0008) +[2023-10-08 14:55:10,224][102897] Updated weights for policy 0, policy_version 78910 (0.0010) +[2023-10-08 14:55:10,301][102898] Updated weights for policy 1, policy_version 78990 (0.0007) +[2023-10-08 14:55:10,666][102898] Updated weights for policy 1, policy_version 79000 (0.0007) +[2023-10-08 14:55:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 161710080. Throughput: 0: 1768.8, 1: 1793.5. Samples: 40431446. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:55:11,875][101941] Avg episode reward: [(0, '8.190'), (1, '10.890')] +[2023-10-08 14:55:14,031][102897] Updated weights for policy 0, policy_version 78920 (0.0009) +[2023-10-08 14:55:14,366][102898] Updated weights for policy 1, policy_version 79010 (0.0008) +[2023-10-08 14:55:14,404][102897] Updated weights for policy 0, policy_version 78930 (0.0009) +[2023-10-08 14:55:14,751][102898] Updated weights for policy 1, policy_version 79020 (0.0007) +[2023-10-08 14:55:14,777][102897] Updated weights for policy 0, policy_version 78940 (0.0007) +[2023-10-08 14:55:15,120][102898] Updated weights for policy 1, policy_version 79030 (0.0007) +[2023-10-08 14:55:15,487][102898] Updated weights for policy 1, policy_version 79040 (0.0009) +[2023-10-08 14:55:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 161775616. Throughput: 0: 1768.4, 1: 1782.0. Samples: 40453036. Policy #0 lag: (min: 31.0, avg: 31.0, max: 32.0) +[2023-10-08 14:55:16,876][101941] Avg episode reward: [(0, '8.790'), (1, '11.270')] +[2023-10-08 14:55:18,494][102897] Updated weights for policy 0, policy_version 78950 (0.0007) +[2023-10-08 14:55:18,875][102897] Updated weights for policy 0, policy_version 78960 (0.0007) +[2023-10-08 14:55:19,239][102897] Updated weights for policy 0, policy_version 78970 (0.0008) +[2023-10-08 14:55:19,250][102898] Updated weights for policy 1, policy_version 79050 (0.0008) +[2023-10-08 14:55:19,603][102898] Updated weights for policy 1, policy_version 79060 (0.0009) +[2023-10-08 14:55:19,968][102898] Updated weights for policy 1, policy_version 79070 (0.0009) +[2023-10-08 14:55:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 161841152. Throughput: 0: 1772.8, 1: 1795.5. Samples: 40463662. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:21,876][101941] Avg episode reward: [(0, '8.470'), (1, '11.230')] +[2023-10-08 14:55:23,015][102897] Updated weights for policy 0, policy_version 78980 (0.0008) +[2023-10-08 14:55:23,385][102897] Updated weights for policy 0, policy_version 78990 (0.0007) +[2023-10-08 14:55:23,729][102898] Updated weights for policy 1, policy_version 79080 (0.0008) +[2023-10-08 14:55:23,749][102897] Updated weights for policy 0, policy_version 79000 (0.0007) +[2023-10-08 14:55:24,099][102898] Updated weights for policy 1, policy_version 79090 (0.0009) +[2023-10-08 14:55:24,458][102898] Updated weights for policy 1, policy_version 79100 (0.0007) +[2023-10-08 14:55:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 161906688. Throughput: 0: 1768.2, 1: 1773.2. Samples: 40484998. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:26,876][101941] Avg episode reward: [(0, '8.880'), (1, '11.520')] +[2023-10-08 14:55:27,608][102897] Updated weights for policy 0, policy_version 79010 (0.0007) +[2023-10-08 14:55:28,005][102897] Updated weights for policy 0, policy_version 79020 (0.0008) +[2023-10-08 14:55:28,145][102898] Updated weights for policy 1, policy_version 79110 (0.0009) +[2023-10-08 14:55:28,363][102897] Updated weights for policy 0, policy_version 79030 (0.0007) +[2023-10-08 14:55:28,499][102898] Updated weights for policy 1, policy_version 79120 (0.0007) +[2023-10-08 14:55:28,734][102897] Updated weights for policy 0, policy_version 79040 (0.0008) +[2023-10-08 14:55:28,870][102898] Updated weights for policy 1, policy_version 79130 (0.0008) +[2023-10-08 14:55:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 161972224. Throughput: 0: 1779.2, 1: 1782.4. Samples: 40507532. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:31,876][101941] Avg episode reward: [(0, '8.560'), (1, '12.650')] +[2023-10-08 14:55:32,484][102898] Updated weights for policy 1, policy_version 79140 (0.0009) +[2023-10-08 14:55:32,580][102897] Updated weights for policy 0, policy_version 79050 (0.0007) +[2023-10-08 14:55:32,850][102898] Updated weights for policy 1, policy_version 79150 (0.0009) +[2023-10-08 14:55:32,948][102897] Updated weights for policy 0, policy_version 79060 (0.0007) +[2023-10-08 14:55:33,211][102898] Updated weights for policy 1, policy_version 79160 (0.0007) +[2023-10-08 14:55:33,318][102897] Updated weights for policy 0, policy_version 79070 (0.0007) +[2023-10-08 14:55:36,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162037760. Throughput: 0: 1768.6, 1: 1788.2. Samples: 40517470. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:36,875][101941] Avg episode reward: [(0, '8.060'), (1, '12.040')] +[2023-10-08 14:55:37,040][102898] Updated weights for policy 1, policy_version 79170 (0.0009) +[2023-10-08 14:55:37,120][102897] Updated weights for policy 0, policy_version 79080 (0.0008) +[2023-10-08 14:55:37,398][102898] Updated weights for policy 1, policy_version 79180 (0.0008) +[2023-10-08 14:55:37,501][102897] Updated weights for policy 0, policy_version 79090 (0.0008) +[2023-10-08 14:55:37,764][102898] Updated weights for policy 1, policy_version 79190 (0.0010) +[2023-10-08 14:55:37,866][102897] Updated weights for policy 0, policy_version 79100 (0.0008) +[2023-10-08 14:55:38,123][102898] Updated weights for policy 1, policy_version 79200 (0.0009) +[2023-10-08 14:55:41,780][102897] Updated weights for policy 0, policy_version 79110 (0.0008) +[2023-10-08 14:55:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162103296. Throughput: 0: 1774.4, 1: 1786.0. Samples: 40539578. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:41,875][101941] Avg episode reward: [(0, '8.280'), (1, '11.990')] +[2023-10-08 14:55:42,076][102898] Updated weights for policy 1, policy_version 79210 (0.0009) +[2023-10-08 14:55:42,144][102897] Updated weights for policy 0, policy_version 79120 (0.0007) +[2023-10-08 14:55:42,441][102898] Updated weights for policy 1, policy_version 79220 (0.0008) +[2023-10-08 14:55:42,511][102897] Updated weights for policy 0, policy_version 79130 (0.0008) +[2023-10-08 14:55:42,807][102898] Updated weights for policy 1, policy_version 79230 (0.0009) +[2023-10-08 14:55:46,353][102897] Updated weights for policy 0, policy_version 79140 (0.0007) +[2023-10-08 14:55:46,399][102898] Updated weights for policy 1, policy_version 79240 (0.0007) +[2023-10-08 14:55:46,719][102897] Updated weights for policy 0, policy_version 79150 (0.0007) +[2023-10-08 14:55:46,765][102898] Updated weights for policy 1, policy_version 79250 (0.0009) +[2023-10-08 14:55:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162168832. Throughput: 0: 1792.8, 1: 1809.4. Samples: 40561150. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:46,876][101941] Avg episode reward: [(0, '8.570'), (1, '11.020')] +[2023-10-08 14:55:47,087][102897] Updated weights for policy 0, policy_version 79160 (0.0007) +[2023-10-08 14:55:47,126][102898] Updated weights for policy 1, policy_version 79260 (0.0008) +[2023-10-08 14:55:50,924][102897] Updated weights for policy 0, policy_version 79170 (0.0009) +[2023-10-08 14:55:50,932][102898] Updated weights for policy 1, policy_version 79270 (0.0011) +[2023-10-08 14:55:51,288][102897] Updated weights for policy 0, policy_version 79180 (0.0008) +[2023-10-08 14:55:51,297][102898] Updated weights for policy 1, policy_version 79280 (0.0008) +[2023-10-08 14:55:51,665][102898] Updated weights for policy 1, policy_version 79290 (0.0008) +[2023-10-08 14:55:51,675][102897] Updated weights for policy 0, policy_version 79190 (0.0007) +[2023-10-08 14:55:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 162234368. Throughput: 0: 1765.2, 1: 1792.4. Samples: 40571328. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:51,878][101941] Avg episode reward: [(0, '9.130'), (1, '11.540')] +[2023-10-08 14:55:52,037][102897] Updated weights for policy 0, policy_version 79200 (0.0009) +[2023-10-08 14:55:55,419][102898] Updated weights for policy 1, policy_version 79300 (0.0008) +[2023-10-08 14:55:55,778][102898] Updated weights for policy 1, policy_version 79310 (0.0007) +[2023-10-08 14:55:55,967][102897] Updated weights for policy 0, policy_version 79210 (0.0008) +[2023-10-08 14:55:56,142][102898] Updated weights for policy 1, policy_version 79320 (0.0009) +[2023-10-08 14:55:56,342][102897] Updated weights for policy 0, policy_version 79220 (0.0009) +[2023-10-08 14:55:56,719][102897] Updated weights for policy 0, policy_version 79230 (0.0009) +[2023-10-08 14:55:56,875][101941] Fps is (10 sec: 19660.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 162365440. Throughput: 0: 1794.2, 1: 1805.8. Samples: 40593448. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:55:56,875][101941] Avg episode reward: [(0, '9.130'), (1, '11.310')] +[2023-10-08 14:55:59,969][102898] Updated weights for policy 1, policy_version 79330 (0.0008) +[2023-10-08 14:56:00,336][102897] Updated weights for policy 0, policy_version 79240 (0.0007) +[2023-10-08 14:56:00,372][102898] Updated weights for policy 1, policy_version 79340 (0.0009) +[2023-10-08 14:56:00,706][102897] Updated weights for policy 0, policy_version 79250 (0.0008) +[2023-10-08 14:56:00,733][102898] Updated weights for policy 1, policy_version 79350 (0.0010) +[2023-10-08 14:56:01,074][102897] Updated weights for policy 0, policy_version 79260 (0.0009) +[2023-10-08 14:56:01,100][102898] Updated weights for policy 1, policy_version 79360 (0.0008) +[2023-10-08 14:56:01,875][101941] Fps is (10 sec: 19660.6, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 162430976. Throughput: 0: 1758.2, 1: 1790.0. Samples: 40612706. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:56:01,876][101941] Avg episode reward: [(0, '9.190'), (1, '11.140')] +[2023-10-08 14:56:04,771][102897] Updated weights for policy 0, policy_version 79270 (0.0008) +[2023-10-08 14:56:04,877][102898] Updated weights for policy 1, policy_version 79370 (0.0008) +[2023-10-08 14:56:05,138][102897] Updated weights for policy 0, policy_version 79280 (0.0007) +[2023-10-08 14:56:05,244][102898] Updated weights for policy 1, policy_version 79380 (0.0008) +[2023-10-08 14:56:05,506][102897] Updated weights for policy 0, policy_version 79290 (0.0007) +[2023-10-08 14:56:05,607][102898] Updated weights for policy 1, policy_version 79390 (0.0010) +[2023-10-08 14:56:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 162496512. Throughput: 0: 1789.0, 1: 1805.8. Samples: 40625428. Policy #0 lag: (min: 21.0, avg: 24.0, max: 53.0) +[2023-10-08 14:56:06,875][101941] Avg episode reward: [(0, '8.510'), (1, '11.560')] +[2023-10-08 14:56:09,248][102897] Updated weights for policy 0, policy_version 79300 (0.0008) +[2023-10-08 14:56:09,322][102898] Updated weights for policy 1, policy_version 79400 (0.0007) +[2023-10-08 14:56:09,619][102897] Updated weights for policy 0, policy_version 79310 (0.0009) +[2023-10-08 14:56:09,690][102898] Updated weights for policy 1, policy_version 79410 (0.0007) +[2023-10-08 14:56:09,983][102897] Updated weights for policy 0, policy_version 79320 (0.0007) +[2023-10-08 14:56:10,058][102898] Updated weights for policy 1, policy_version 79420 (0.0007) +[2023-10-08 14:56:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 162562048. Throughput: 0: 1760.5, 1: 1791.6. Samples: 40644840. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:11,876][101941] Avg episode reward: [(0, '8.900'), (1, '11.030')] +[2023-10-08 14:56:13,901][102897] Updated weights for policy 0, policy_version 79330 (0.0009) +[2023-10-08 14:56:13,909][102898] Updated weights for policy 1, policy_version 79430 (0.0007) +[2023-10-08 14:56:14,266][102898] Updated weights for policy 1, policy_version 79440 (0.0007) +[2023-10-08 14:56:14,312][102897] Updated weights for policy 0, policy_version 79340 (0.0008) +[2023-10-08 14:56:14,627][102898] Updated weights for policy 1, policy_version 79450 (0.0007) +[2023-10-08 14:56:14,672][102897] Updated weights for policy 0, policy_version 79350 (0.0009) +[2023-10-08 14:56:15,033][102897] Updated weights for policy 0, policy_version 79360 (0.0008) +[2023-10-08 14:56:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 162627584. Throughput: 0: 1760.7, 1: 1779.7. Samples: 40666850. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:16,876][101941] Avg episode reward: [(0, '8.960'), (1, '10.830')] +[2023-10-08 14:56:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000079360_81264640.pth... +[2023-10-08 14:56:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000079456_81362944.pth... +[2023-10-08 14:56:16,916][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000077696_79560704.pth +[2023-10-08 14:56:16,919][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000077792_79659008.pth +[2023-10-08 14:56:18,549][102898] Updated weights for policy 1, policy_version 79460 (0.0007) +[2023-10-08 14:56:18,858][102897] Updated weights for policy 0, policy_version 79370 (0.0009) +[2023-10-08 14:56:18,918][102898] Updated weights for policy 1, policy_version 79470 (0.0008) +[2023-10-08 14:56:19,234][102897] Updated weights for policy 0, policy_version 79380 (0.0008) +[2023-10-08 14:56:19,284][102898] Updated weights for policy 1, policy_version 79480 (0.0008) +[2023-10-08 14:56:19,598][102897] Updated weights for policy 0, policy_version 79390 (0.0007) +[2023-10-08 14:56:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162693120. Throughput: 0: 1767.0, 1: 1779.5. Samples: 40677064. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:21,876][101941] Avg episode reward: [(0, '8.710'), (1, '10.860')] +[2023-10-08 14:56:22,959][102898] Updated weights for policy 1, policy_version 79490 (0.0007) +[2023-10-08 14:56:23,331][102898] Updated weights for policy 1, policy_version 79500 (0.0009) +[2023-10-08 14:56:23,439][102897] Updated weights for policy 0, policy_version 79400 (0.0008) +[2023-10-08 14:56:23,693][102898] Updated weights for policy 1, policy_version 79510 (0.0008) +[2023-10-08 14:56:23,802][102897] Updated weights for policy 0, policy_version 79410 (0.0009) +[2023-10-08 14:56:24,055][102898] Updated weights for policy 1, policy_version 79520 (0.0009) +[2023-10-08 14:56:24,180][102897] Updated weights for policy 0, policy_version 79420 (0.0008) +[2023-10-08 14:56:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162758656. Throughput: 0: 1755.6, 1: 1782.0. Samples: 40698770. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:26,876][101941] Avg episode reward: [(0, '8.320'), (1, '10.840')] +[2023-10-08 14:56:27,786][102898] Updated weights for policy 1, policy_version 79530 (0.0007) +[2023-10-08 14:56:27,899][102897] Updated weights for policy 0, policy_version 79430 (0.0008) +[2023-10-08 14:56:28,164][102898] Updated weights for policy 1, policy_version 79540 (0.0010) +[2023-10-08 14:56:28,270][102897] Updated weights for policy 0, policy_version 79440 (0.0008) +[2023-10-08 14:56:28,522][102898] Updated weights for policy 1, policy_version 79550 (0.0008) +[2023-10-08 14:56:28,634][102897] Updated weights for policy 0, policy_version 79450 (0.0009) +[2023-10-08 14:56:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 162824192. Throughput: 0: 1767.6, 1: 1786.3. Samples: 40721080. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:31,876][101941] Avg episode reward: [(0, '8.190'), (1, '10.970')] +[2023-10-08 14:56:32,261][102898] Updated weights for policy 1, policy_version 79560 (0.0007) +[2023-10-08 14:56:32,475][102897] Updated weights for policy 0, policy_version 79460 (0.0008) +[2023-10-08 14:56:32,625][102898] Updated weights for policy 1, policy_version 79570 (0.0008) +[2023-10-08 14:56:32,851][102897] Updated weights for policy 0, policy_version 79470 (0.0008) +[2023-10-08 14:56:32,991][102898] Updated weights for policy 1, policy_version 79580 (0.0007) +[2023-10-08 14:56:33,214][102897] Updated weights for policy 0, policy_version 79480 (0.0008) +[2023-10-08 14:56:36,709][102898] Updated weights for policy 1, policy_version 79590 (0.0009) +[2023-10-08 14:56:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162889728. Throughput: 0: 1763.4, 1: 1777.9. Samples: 40730688. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:36,875][101941] Avg episode reward: [(0, '8.500'), (1, '11.020')] +[2023-10-08 14:56:36,957][102897] Updated weights for policy 0, policy_version 79490 (0.0008) +[2023-10-08 14:56:37,071][102898] Updated weights for policy 1, policy_version 79600 (0.0009) +[2023-10-08 14:56:37,329][102897] Updated weights for policy 0, policy_version 79500 (0.0008) +[2023-10-08 14:56:37,437][102898] Updated weights for policy 1, policy_version 79610 (0.0008) +[2023-10-08 14:56:37,708][102897] Updated weights for policy 0, policy_version 79510 (0.0009) +[2023-10-08 14:56:38,078][102897] Updated weights for policy 0, policy_version 79520 (0.0008) +[2023-10-08 14:56:41,290][102898] Updated weights for policy 1, policy_version 79620 (0.0009) +[2023-10-08 14:56:41,653][102898] Updated weights for policy 1, policy_version 79630 (0.0008) +[2023-10-08 14:56:41,864][102897] Updated weights for policy 0, policy_version 79530 (0.0009) +[2023-10-08 14:56:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 162955264. Throughput: 0: 1761.1, 1: 1787.2. Samples: 40753118. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:41,875][101941] Avg episode reward: [(0, '8.850'), (1, '11.660')] +[2023-10-08 14:56:42,010][102898] Updated weights for policy 1, policy_version 79640 (0.0008) +[2023-10-08 14:56:42,226][102897] Updated weights for policy 0, policy_version 79540 (0.0009) +[2023-10-08 14:56:42,604][102897] Updated weights for policy 0, policy_version 79550 (0.0008) +[2023-10-08 14:56:45,931][102898] Updated weights for policy 1, policy_version 79650 (0.0008) +[2023-10-08 14:56:46,318][102898] Updated weights for policy 1, policy_version 79660 (0.0008) +[2023-10-08 14:56:46,570][102897] Updated weights for policy 0, policy_version 79560 (0.0008) +[2023-10-08 14:56:46,686][102898] Updated weights for policy 1, policy_version 79670 (0.0009) +[2023-10-08 14:56:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 163020800. Throughput: 0: 1794.4, 1: 1797.1. Samples: 40774324. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:46,876][101941] Avg episode reward: [(0, '9.210'), (1, '12.390')] +[2023-10-08 14:56:46,950][102897] Updated weights for policy 0, policy_version 79570 (0.0008) +[2023-10-08 14:56:47,049][102898] Updated weights for policy 1, policy_version 79680 (0.0008) +[2023-10-08 14:56:47,323][102897] Updated weights for policy 0, policy_version 79580 (0.0009) +[2023-10-08 14:56:50,939][102898] Updated weights for policy 1, policy_version 79690 (0.0008) +[2023-10-08 14:56:51,053][102897] Updated weights for policy 0, policy_version 79590 (0.0008) +[2023-10-08 14:56:51,300][102898] Updated weights for policy 1, policy_version 79700 (0.0008) +[2023-10-08 14:56:51,424][102897] Updated weights for policy 0, policy_version 79600 (0.0010) +[2023-10-08 14:56:51,659][102898] Updated weights for policy 1, policy_version 79710 (0.0009) +[2023-10-08 14:56:51,790][102897] Updated weights for policy 0, policy_version 79610 (0.0008) +[2023-10-08 14:56:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 163119104. Throughput: 0: 1764.5, 1: 1778.3. Samples: 40784854. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:51,876][101941] Avg episode reward: [(0, '8.830'), (1, '12.970')] +[2023-10-08 14:56:55,521][102898] Updated weights for policy 1, policy_version 79720 (0.0009) +[2023-10-08 14:56:55,611][102897] Updated weights for policy 0, policy_version 79620 (0.0008) +[2023-10-08 14:56:55,878][102898] Updated weights for policy 1, policy_version 79730 (0.0008) +[2023-10-08 14:56:55,983][102897] Updated weights for policy 0, policy_version 79630 (0.0008) +[2023-10-08 14:56:56,236][102898] Updated weights for policy 1, policy_version 79740 (0.0008) +[2023-10-08 14:56:56,358][102897] Updated weights for policy 0, policy_version 79640 (0.0008) +[2023-10-08 14:56:56,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 163217408. Throughput: 0: 1800.1, 1: 1803.3. Samples: 40806994. Policy #0 lag: (min: 5.0, avg: 11.4, max: 37.0) +[2023-10-08 14:56:56,876][101941] Avg episode reward: [(0, '8.190'), (1, '13.310')] +[2023-10-08 14:56:56,877][102760] Saving new best policy, reward=13.310! +[2023-10-08 14:56:59,855][102897] Updated weights for policy 0, policy_version 79650 (0.0010) +[2023-10-08 14:56:59,939][102898] Updated weights for policy 1, policy_version 79750 (0.0007) +[2023-10-08 14:57:00,246][102897] Updated weights for policy 0, policy_version 79660 (0.0008) +[2023-10-08 14:57:00,308][102898] Updated weights for policy 1, policy_version 79760 (0.0008) +[2023-10-08 14:57:00,621][102897] Updated weights for policy 0, policy_version 79670 (0.0007) +[2023-10-08 14:57:00,670][102898] Updated weights for policy 1, policy_version 79770 (0.0008) +[2023-10-08 14:57:00,982][102897] Updated weights for policy 0, policy_version 79680 (0.0009) +[2023-10-08 14:57:01,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 163282944. Throughput: 0: 1773.3, 1: 1784.5. Samples: 40826954. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:01,875][101941] Avg episode reward: [(0, '8.470'), (1, '13.490')] +[2023-10-08 14:57:01,885][102760] Saving new best policy, reward=13.490! +[2023-10-08 14:57:04,481][102898] Updated weights for policy 1, policy_version 79780 (0.0010) +[2023-10-08 14:57:04,657][102897] Updated weights for policy 0, policy_version 79690 (0.0008) +[2023-10-08 14:57:04,854][102898] Updated weights for policy 1, policy_version 79790 (0.0009) +[2023-10-08 14:57:05,033][102897] Updated weights for policy 0, policy_version 79700 (0.0008) +[2023-10-08 14:57:05,215][102898] Updated weights for policy 1, policy_version 79800 (0.0008) +[2023-10-08 14:57:05,392][102897] Updated weights for policy 0, policy_version 79710 (0.0008) +[2023-10-08 14:57:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 163348480. Throughput: 0: 1796.5, 1: 1807.2. Samples: 40839234. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:06,876][101941] Avg episode reward: [(0, '8.280'), (1, '12.980')] +[2023-10-08 14:57:08,931][102898] Updated weights for policy 1, policy_version 79810 (0.0008) +[2023-10-08 14:57:09,298][102898] Updated weights for policy 1, policy_version 79820 (0.0007) +[2023-10-08 14:57:09,370][102897] Updated weights for policy 0, policy_version 79720 (0.0009) +[2023-10-08 14:57:09,672][102898] Updated weights for policy 1, policy_version 79830 (0.0007) +[2023-10-08 14:57:09,730][102897] Updated weights for policy 0, policy_version 79730 (0.0008) +[2023-10-08 14:57:10,030][102898] Updated weights for policy 1, policy_version 79840 (0.0007) +[2023-10-08 14:57:10,095][102897] Updated weights for policy 0, policy_version 79740 (0.0008) +[2023-10-08 14:57:11,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 163414016. Throughput: 0: 1774.3, 1: 1777.2. Samples: 40858590. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:11,876][101941] Avg episode reward: [(0, '8.110'), (1, '12.460')] +[2023-10-08 14:57:13,723][102898] Updated weights for policy 1, policy_version 79850 (0.0008) +[2023-10-08 14:57:13,913][102897] Updated weights for policy 0, policy_version 79750 (0.0009) +[2023-10-08 14:57:14,081][102898] Updated weights for policy 1, policy_version 79860 (0.0009) +[2023-10-08 14:57:14,286][102897] Updated weights for policy 0, policy_version 79760 (0.0007) +[2023-10-08 14:57:14,440][102898] Updated weights for policy 1, policy_version 79870 (0.0008) +[2023-10-08 14:57:14,652][102897] Updated weights for policy 0, policy_version 79770 (0.0007) +[2023-10-08 14:57:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 163479552. Throughput: 0: 1771.7, 1: 1784.3. Samples: 40881098. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:16,876][101941] Avg episode reward: [(0, '8.200'), (1, '11.650')] +[2023-10-08 14:57:18,103][102898] Updated weights for policy 1, policy_version 79880 (0.0009) +[2023-10-08 14:57:18,468][102898] Updated weights for policy 1, policy_version 79890 (0.0008) +[2023-10-08 14:57:18,533][102897] Updated weights for policy 0, policy_version 79780 (0.0010) +[2023-10-08 14:57:18,832][102898] Updated weights for policy 1, policy_version 79900 (0.0008) +[2023-10-08 14:57:18,904][102897] Updated weights for policy 0, policy_version 79790 (0.0009) +[2023-10-08 14:57:19,268][102897] Updated weights for policy 0, policy_version 79800 (0.0008) +[2023-10-08 14:57:21,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 163545088. Throughput: 0: 1780.9, 1: 1786.4. Samples: 40891216. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:21,875][101941] Avg episode reward: [(0, '8.290'), (1, '11.500')] +[2023-10-08 14:57:22,653][102898] Updated weights for policy 1, policy_version 79910 (0.0009) +[2023-10-08 14:57:23,021][102898] Updated weights for policy 1, policy_version 79920 (0.0007) +[2023-10-08 14:57:23,107][102897] Updated weights for policy 0, policy_version 79810 (0.0009) +[2023-10-08 14:57:23,389][102898] Updated weights for policy 1, policy_version 79930 (0.0007) +[2023-10-08 14:57:23,478][102897] Updated weights for policy 0, policy_version 79820 (0.0009) +[2023-10-08 14:57:23,843][102897] Updated weights for policy 0, policy_version 79830 (0.0009) +[2023-10-08 14:57:24,212][102897] Updated weights for policy 0, policy_version 79840 (0.0010) +[2023-10-08 14:57:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 163610624. Throughput: 0: 1779.9, 1: 1778.8. Samples: 40913260. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:26,876][101941] Avg episode reward: [(0, '8.990'), (1, '10.800')] +[2023-10-08 14:57:27,198][102898] Updated weights for policy 1, policy_version 79940 (0.0008) +[2023-10-08 14:57:27,564][102898] Updated weights for policy 1, policy_version 79950 (0.0007) +[2023-10-08 14:57:27,932][102898] Updated weights for policy 1, policy_version 79960 (0.0007) +[2023-10-08 14:57:27,970][102897] Updated weights for policy 0, policy_version 79850 (0.0008) +[2023-10-08 14:57:28,351][102897] Updated weights for policy 0, policy_version 79860 (0.0009) +[2023-10-08 14:57:28,717][102897] Updated weights for policy 0, policy_version 79870 (0.0007) +[2023-10-08 14:57:31,817][102898] Updated weights for policy 1, policy_version 79970 (0.0008) +[2023-10-08 14:57:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 163676160. Throughput: 0: 1787.2, 1: 1801.2. Samples: 40935798. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:31,876][101941] Avg episode reward: [(0, '8.790'), (1, '10.170')] +[2023-10-08 14:57:32,195][102898] Updated weights for policy 1, policy_version 79980 (0.0007) +[2023-10-08 14:57:32,366][102897] Updated weights for policy 0, policy_version 79880 (0.0008) +[2023-10-08 14:57:32,559][102898] Updated weights for policy 1, policy_version 79990 (0.0009) +[2023-10-08 14:57:32,729][102897] Updated weights for policy 0, policy_version 79890 (0.0008) +[2023-10-08 14:57:32,924][102898] Updated weights for policy 1, policy_version 80000 (0.0007) +[2023-10-08 14:57:33,096][102897] Updated weights for policy 0, policy_version 79900 (0.0009) +[2023-10-08 14:57:36,491][102898] Updated weights for policy 1, policy_version 80010 (0.0007) +[2023-10-08 14:57:36,859][102898] Updated weights for policy 1, policy_version 80020 (0.0008) +[2023-10-08 14:57:36,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 163741696. Throughput: 0: 1783.5, 1: 1787.9. Samples: 40945564. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:36,875][101941] Avg episode reward: [(0, '8.260'), (1, '11.230')] +[2023-10-08 14:57:36,938][102897] Updated weights for policy 0, policy_version 79910 (0.0008) +[2023-10-08 14:57:37,222][102898] Updated weights for policy 1, policy_version 80030 (0.0007) +[2023-10-08 14:57:37,310][102897] Updated weights for policy 0, policy_version 79920 (0.0007) +[2023-10-08 14:57:37,677][102897] Updated weights for policy 0, policy_version 79930 (0.0007) +[2023-10-08 14:57:41,056][102898] Updated weights for policy 1, policy_version 80040 (0.0010) +[2023-10-08 14:57:41,345][102897] Updated weights for policy 0, policy_version 79940 (0.0008) +[2023-10-08 14:57:41,434][102898] Updated weights for policy 1, policy_version 80050 (0.0009) +[2023-10-08 14:57:41,710][102897] Updated weights for policy 0, policy_version 79950 (0.0007) +[2023-10-08 14:57:41,799][102898] Updated weights for policy 1, policy_version 80060 (0.0009) +[2023-10-08 14:57:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 163807232. Throughput: 0: 1777.6, 1: 1793.6. Samples: 40967694. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:41,876][101941] Avg episode reward: [(0, '8.610'), (1, '12.240')] +[2023-10-08 14:57:42,088][102897] Updated weights for policy 0, policy_version 79960 (0.0007) +[2023-10-08 14:57:45,468][102898] Updated weights for policy 1, policy_version 80070 (0.0008) +[2023-10-08 14:57:45,839][102898] Updated weights for policy 1, policy_version 80080 (0.0010) +[2023-10-08 14:57:46,081][102897] Updated weights for policy 0, policy_version 79970 (0.0008) +[2023-10-08 14:57:46,195][102898] Updated weights for policy 1, policy_version 80090 (0.0007) +[2023-10-08 14:57:46,475][102897] Updated weights for policy 0, policy_version 79980 (0.0007) +[2023-10-08 14:57:46,836][102897] Updated weights for policy 0, policy_version 79990 (0.0007) +[2023-10-08 14:57:46,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 163905536. Throughput: 0: 1793.0, 1: 1786.0. Samples: 40988010. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:46,876][101941] Avg episode reward: [(0, '9.080'), (1, '12.030')] +[2023-10-08 14:57:47,204][102897] Updated weights for policy 0, policy_version 80000 (0.0010) +[2023-10-08 14:57:50,041][102898] Updated weights for policy 1, policy_version 80100 (0.0009) +[2023-10-08 14:57:50,406][102898] Updated weights for policy 1, policy_version 80110 (0.0008) +[2023-10-08 14:57:50,781][102898] Updated weights for policy 1, policy_version 80120 (0.0008) +[2023-10-08 14:57:51,065][102897] Updated weights for policy 0, policy_version 80010 (0.0008) +[2023-10-08 14:57:51,438][102897] Updated weights for policy 0, policy_version 80020 (0.0007) +[2023-10-08 14:57:51,814][102897] Updated weights for policy 0, policy_version 80030 (0.0009) +[2023-10-08 14:57:51,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 163971072. Throughput: 0: 1770.6, 1: 1792.3. Samples: 40999564. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 14:57:51,875][101941] Avg episode reward: [(0, '8.130'), (1, '11.590')] +[2023-10-08 14:57:54,540][102898] Updated weights for policy 1, policy_version 80130 (0.0007) +[2023-10-08 14:57:54,918][102898] Updated weights for policy 1, policy_version 80140 (0.0011) +[2023-10-08 14:57:55,284][102898] Updated weights for policy 1, policy_version 80150 (0.0008) +[2023-10-08 14:57:55,585][102897] Updated weights for policy 0, policy_version 80040 (0.0008) +[2023-10-08 14:57:55,644][102898] Updated weights for policy 1, policy_version 80160 (0.0008) +[2023-10-08 14:57:55,949][102897] Updated weights for policy 0, policy_version 80050 (0.0007) +[2023-10-08 14:57:56,328][102897] Updated weights for policy 0, policy_version 80060 (0.0009) +[2023-10-08 14:57:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 164069376. Throughput: 0: 1805.3, 1: 1799.2. Samples: 41020794. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:57:56,876][101941] Avg episode reward: [(0, '8.010'), (1, '11.780')] +[2023-10-08 14:57:59,462][102898] Updated weights for policy 1, policy_version 80170 (0.0009) +[2023-10-08 14:57:59,823][102898] Updated weights for policy 1, policy_version 80180 (0.0009) +[2023-10-08 14:58:00,107][102897] Updated weights for policy 0, policy_version 80070 (0.0007) +[2023-10-08 14:58:00,190][102898] Updated weights for policy 1, policy_version 80190 (0.0007) +[2023-10-08 14:58:00,471][102897] Updated weights for policy 0, policy_version 80080 (0.0008) +[2023-10-08 14:58:00,839][102897] Updated weights for policy 0, policy_version 80090 (0.0009) +[2023-10-08 14:58:01,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 164134912. Throughput: 0: 1772.4, 1: 1789.0. Samples: 41041364. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:01,876][101941] Avg episode reward: [(0, '7.840'), (1, '10.790')] +[2023-10-08 14:58:03,872][102898] Updated weights for policy 1, policy_version 80200 (0.0007) +[2023-10-08 14:58:04,237][102898] Updated weights for policy 1, policy_version 80210 (0.0009) +[2023-10-08 14:58:04,555][102897] Updated weights for policy 0, policy_version 80100 (0.0008) +[2023-10-08 14:58:04,597][102898] Updated weights for policy 1, policy_version 80220 (0.0008) +[2023-10-08 14:58:04,923][102897] Updated weights for policy 0, policy_version 80110 (0.0008) +[2023-10-08 14:58:05,288][102897] Updated weights for policy 0, policy_version 80120 (0.0007) +[2023-10-08 14:58:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 164200448. Throughput: 0: 1799.9, 1: 1800.3. Samples: 41053228. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:06,877][101941] Avg episode reward: [(0, '7.760'), (1, '10.620')] +[2023-10-08 14:58:08,336][102898] Updated weights for policy 1, policy_version 80230 (0.0009) +[2023-10-08 14:58:08,703][102898] Updated weights for policy 1, policy_version 80240 (0.0007) +[2023-10-08 14:58:08,988][102897] Updated weights for policy 0, policy_version 80130 (0.0008) +[2023-10-08 14:58:09,059][102898] Updated weights for policy 1, policy_version 80250 (0.0009) +[2023-10-08 14:58:09,362][102897] Updated weights for policy 0, policy_version 80140 (0.0008) +[2023-10-08 14:58:09,735][102897] Updated weights for policy 0, policy_version 80150 (0.0010) +[2023-10-08 14:58:10,103][102897] Updated weights for policy 0, policy_version 80160 (0.0010) +[2023-10-08 14:58:11,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 164265984. Throughput: 0: 1776.6, 1: 1787.7. Samples: 41073654. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:11,875][101941] Avg episode reward: [(0, '8.550'), (1, '11.130')] +[2023-10-08 14:58:12,780][102898] Updated weights for policy 1, policy_version 80260 (0.0009) +[2023-10-08 14:58:13,144][102898] Updated weights for policy 1, policy_version 80270 (0.0008) +[2023-10-08 14:58:13,506][102898] Updated weights for policy 1, policy_version 80280 (0.0007) +[2023-10-08 14:58:13,799][102897] Updated weights for policy 0, policy_version 80170 (0.0009) +[2023-10-08 14:58:14,173][102897] Updated weights for policy 0, policy_version 80180 (0.0010) +[2023-10-08 14:58:14,550][102897] Updated weights for policy 0, policy_version 80190 (0.0010) +[2023-10-08 14:58:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 164331520. Throughput: 0: 1768.3, 1: 1788.0. Samples: 41095832. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:16,876][101941] Avg episode reward: [(0, '8.410'), (1, '11.700')] +[2023-10-08 14:58:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000080192_82116608.pth... +[2023-10-08 14:58:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000080288_82214912.pth... +[2023-10-08 14:58:16,922][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000078624_80510976.pth +[2023-10-08 14:58:16,925][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000078528_80412672.pth +[2023-10-08 14:58:17,304][102898] Updated weights for policy 1, policy_version 80290 (0.0008) +[2023-10-08 14:58:17,702][102898] Updated weights for policy 1, policy_version 80300 (0.0009) +[2023-10-08 14:58:18,066][102898] Updated weights for policy 1, policy_version 80310 (0.0008) +[2023-10-08 14:58:18,407][102897] Updated weights for policy 0, policy_version 80200 (0.0009) +[2023-10-08 14:58:18,429][102898] Updated weights for policy 1, policy_version 80320 (0.0007) +[2023-10-08 14:58:18,777][102897] Updated weights for policy 0, policy_version 80210 (0.0009) +[2023-10-08 14:58:19,150][102897] Updated weights for policy 0, policy_version 80220 (0.0008) +[2023-10-08 14:58:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 164397056. Throughput: 0: 1769.8, 1: 1786.0. Samples: 41105576. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:21,876][101941] Avg episode reward: [(0, '7.770'), (1, '11.520')] +[2023-10-08 14:58:22,256][102898] Updated weights for policy 1, policy_version 80330 (0.0010) +[2023-10-08 14:58:22,623][102898] Updated weights for policy 1, policy_version 80340 (0.0007) +[2023-10-08 14:58:22,883][102897] Updated weights for policy 0, policy_version 80230 (0.0007) +[2023-10-08 14:58:22,987][102898] Updated weights for policy 1, policy_version 80350 (0.0007) +[2023-10-08 14:58:23,246][102897] Updated weights for policy 0, policy_version 80240 (0.0007) +[2023-10-08 14:58:23,609][102897] Updated weights for policy 0, policy_version 80250 (0.0007) +[2023-10-08 14:58:26,675][102898] Updated weights for policy 1, policy_version 80360 (0.0007) +[2023-10-08 14:58:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 164462592. Throughput: 0: 1770.5, 1: 1791.6. Samples: 41127984. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:26,876][101941] Avg episode reward: [(0, '8.510'), (1, '11.240')] +[2023-10-08 14:58:27,038][102898] Updated weights for policy 1, policy_version 80370 (0.0007) +[2023-10-08 14:58:27,398][102897] Updated weights for policy 0, policy_version 80260 (0.0009) +[2023-10-08 14:58:27,399][102898] Updated weights for policy 1, policy_version 80380 (0.0007) +[2023-10-08 14:58:27,764][102897] Updated weights for policy 0, policy_version 80270 (0.0007) +[2023-10-08 14:58:28,132][102897] Updated weights for policy 0, policy_version 80280 (0.0009) +[2023-10-08 14:58:31,238][102898] Updated weights for policy 1, policy_version 80390 (0.0010) +[2023-10-08 14:58:31,601][102898] Updated weights for policy 1, policy_version 80400 (0.0010) +[2023-10-08 14:58:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 164528128. Throughput: 0: 1787.2, 1: 1807.3. Samples: 41149764. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:31,876][101941] Avg episode reward: [(0, '8.750'), (1, '11.410')] +[2023-10-08 14:58:31,971][102898] Updated weights for policy 1, policy_version 80410 (0.0010) +[2023-10-08 14:58:32,036][102897] Updated weights for policy 0, policy_version 80290 (0.0008) +[2023-10-08 14:58:32,438][102897] Updated weights for policy 0, policy_version 80300 (0.0008) +[2023-10-08 14:58:32,821][102897] Updated weights for policy 0, policy_version 80310 (0.0008) +[2023-10-08 14:58:33,184][102897] Updated weights for policy 0, policy_version 80320 (0.0008) +[2023-10-08 14:58:35,695][102898] Updated weights for policy 1, policy_version 80420 (0.0007) +[2023-10-08 14:58:36,069][102898] Updated weights for policy 1, policy_version 80430 (0.0007) +[2023-10-08 14:58:36,429][102898] Updated weights for policy 1, policy_version 80440 (0.0008) +[2023-10-08 14:58:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 164626432. Throughput: 0: 1772.8, 1: 1789.2. Samples: 41159850. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:36,875][101941] Avg episode reward: [(0, '8.970'), (1, '11.360')] +[2023-10-08 14:58:37,038][102897] Updated weights for policy 0, policy_version 80330 (0.0007) +[2023-10-08 14:58:37,405][102897] Updated weights for policy 0, policy_version 80340 (0.0007) +[2023-10-08 14:58:37,787][102897] Updated weights for policy 0, policy_version 80350 (0.0009) +[2023-10-08 14:58:40,098][102898] Updated weights for policy 1, policy_version 80450 (0.0007) +[2023-10-08 14:58:40,459][102898] Updated weights for policy 1, policy_version 80460 (0.0009) +[2023-10-08 14:58:40,825][102898] Updated weights for policy 1, policy_version 80470 (0.0007) +[2023-10-08 14:58:41,187][102898] Updated weights for policy 1, policy_version 80480 (0.0008) +[2023-10-08 14:58:41,691][102897] Updated weights for policy 0, policy_version 80360 (0.0010) +[2023-10-08 14:58:41,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 164691968. Throughput: 0: 1773.3, 1: 1803.1. Samples: 41181732. Policy #0 lag: (min: 28.0, avg: 32.2, max: 60.0) +[2023-10-08 14:58:41,876][101941] Avg episode reward: [(0, '8.470'), (1, '10.130')] +[2023-10-08 14:58:42,066][102897] Updated weights for policy 0, policy_version 80370 (0.0010) +[2023-10-08 14:58:42,425][102897] Updated weights for policy 0, policy_version 80380 (0.0008) +[2023-10-08 14:58:44,960][102898] Updated weights for policy 1, policy_version 80490 (0.0009) +[2023-10-08 14:58:45,325][102898] Updated weights for policy 1, policy_version 80500 (0.0010) +[2023-10-08 14:58:45,691][102898] Updated weights for policy 1, policy_version 80510 (0.0010) +[2023-10-08 14:58:46,079][102897] Updated weights for policy 0, policy_version 80390 (0.0009) +[2023-10-08 14:58:46,450][102897] Updated weights for policy 0, policy_version 80400 (0.0009) +[2023-10-08 14:58:46,834][102897] Updated weights for policy 0, policy_version 80410 (0.0010) +[2023-10-08 14:58:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 164757504. Throughput: 0: 1794.8, 1: 1792.9. Samples: 41202808. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:58:46,875][101941] Avg episode reward: [(0, '7.990'), (1, '10.110')] +[2023-10-08 14:58:49,453][102898] Updated weights for policy 1, policy_version 80520 (0.0011) +[2023-10-08 14:58:49,820][102898] Updated weights for policy 1, policy_version 80530 (0.0008) +[2023-10-08 14:58:50,187][102898] Updated weights for policy 1, policy_version 80540 (0.0010) +[2023-10-08 14:58:50,599][102897] Updated weights for policy 0, policy_version 80420 (0.0009) +[2023-10-08 14:58:50,973][102897] Updated weights for policy 0, policy_version 80430 (0.0009) +[2023-10-08 14:58:51,348][102897] Updated weights for policy 0, policy_version 80440 (0.0008) +[2023-10-08 14:58:51,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 164855808. Throughput: 0: 1774.2, 1: 1802.2. Samples: 41214166. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:58:51,876][101941] Avg episode reward: [(0, '7.490'), (1, '11.260')] +[2023-10-08 14:58:54,149][102898] Updated weights for policy 1, policy_version 80550 (0.0008) +[2023-10-08 14:58:54,517][102898] Updated weights for policy 1, policy_version 80560 (0.0008) +[2023-10-08 14:58:54,879][102898] Updated weights for policy 1, policy_version 80570 (0.0009) +[2023-10-08 14:58:55,068][102897] Updated weights for policy 0, policy_version 80450 (0.0008) +[2023-10-08 14:58:55,429][102897] Updated weights for policy 0, policy_version 80460 (0.0009) +[2023-10-08 14:58:55,805][102897] Updated weights for policy 0, policy_version 80470 (0.0009) +[2023-10-08 14:58:56,181][102897] Updated weights for policy 0, policy_version 80480 (0.0007) +[2023-10-08 14:58:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 164921344. Throughput: 0: 1798.5, 1: 1785.3. Samples: 41234928. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:58:56,875][101941] Avg episode reward: [(0, '8.380'), (1, '12.470')] +[2023-10-08 14:58:58,466][102898] Updated weights for policy 1, policy_version 80580 (0.0008) +[2023-10-08 14:58:58,831][102898] Updated weights for policy 1, policy_version 80590 (0.0008) +[2023-10-08 14:58:59,201][102898] Updated weights for policy 1, policy_version 80600 (0.0007) +[2023-10-08 14:58:59,920][102897] Updated weights for policy 0, policy_version 80490 (0.0007) +[2023-10-08 14:59:00,297][102897] Updated weights for policy 0, policy_version 80500 (0.0009) +[2023-10-08 14:59:00,667][102897] Updated weights for policy 0, policy_version 80510 (0.0007) +[2023-10-08 14:59:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 164986880. Throughput: 0: 1783.5, 1: 1789.4. Samples: 41256612. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:01,876][101941] Avg episode reward: [(0, '9.120'), (1, '12.260')] +[2023-10-08 14:59:03,130][102898] Updated weights for policy 1, policy_version 80610 (0.0008) +[2023-10-08 14:59:03,546][102898] Updated weights for policy 1, policy_version 80620 (0.0007) +[2023-10-08 14:59:03,914][102898] Updated weights for policy 1, policy_version 80630 (0.0007) +[2023-10-08 14:59:04,272][102898] Updated weights for policy 1, policy_version 80640 (0.0007) +[2023-10-08 14:59:04,307][102897] Updated weights for policy 0, policy_version 80520 (0.0008) +[2023-10-08 14:59:04,677][102897] Updated weights for policy 0, policy_version 80530 (0.0007) +[2023-10-08 14:59:05,050][102897] Updated weights for policy 0, policy_version 80540 (0.0007) +[2023-10-08 14:59:06,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 165052416. Throughput: 0: 1805.9, 1: 1785.9. Samples: 41267208. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:06,876][101941] Avg episode reward: [(0, '8.700'), (1, '12.020')] +[2023-10-08 14:59:08,092][102898] Updated weights for policy 1, policy_version 80650 (0.0008) +[2023-10-08 14:59:08,455][102898] Updated weights for policy 1, policy_version 80660 (0.0009) +[2023-10-08 14:59:08,673][102897] Updated weights for policy 0, policy_version 80550 (0.0008) +[2023-10-08 14:59:08,817][102898] Updated weights for policy 1, policy_version 80670 (0.0009) +[2023-10-08 14:59:09,041][102897] Updated weights for policy 0, policy_version 80560 (0.0008) +[2023-10-08 14:59:09,410][102897] Updated weights for policy 0, policy_version 80570 (0.0008) +[2023-10-08 14:59:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 165117952. Throughput: 0: 1787.5, 1: 1783.6. Samples: 41288684. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:11,876][101941] Avg episode reward: [(0, '8.850'), (1, '11.940')] +[2023-10-08 14:59:12,777][102898] Updated weights for policy 1, policy_version 80680 (0.0007) +[2023-10-08 14:59:13,148][102898] Updated weights for policy 1, policy_version 80690 (0.0009) +[2023-10-08 14:59:13,240][102897] Updated weights for policy 0, policy_version 80580 (0.0008) +[2023-10-08 14:59:13,501][102898] Updated weights for policy 1, policy_version 80700 (0.0009) +[2023-10-08 14:59:13,609][102897] Updated weights for policy 0, policy_version 80590 (0.0007) +[2023-10-08 14:59:13,984][102897] Updated weights for policy 0, policy_version 80600 (0.0010) +[2023-10-08 14:59:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 165183488. Throughput: 0: 1787.0, 1: 1792.3. Samples: 41310836. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:16,876][101941] Avg episode reward: [(0, '9.430'), (1, '12.120')] +[2023-10-08 14:59:17,205][102898] Updated weights for policy 1, policy_version 80710 (0.0009) +[2023-10-08 14:59:17,570][102898] Updated weights for policy 1, policy_version 80720 (0.0010) +[2023-10-08 14:59:17,763][102897] Updated weights for policy 0, policy_version 80610 (0.0011) +[2023-10-08 14:59:17,939][102898] Updated weights for policy 1, policy_version 80730 (0.0009) +[2023-10-08 14:59:18,172][102897] Updated weights for policy 0, policy_version 80620 (0.0009) +[2023-10-08 14:59:18,532][102897] Updated weights for policy 0, policy_version 80630 (0.0009) +[2023-10-08 14:59:18,905][102897] Updated weights for policy 0, policy_version 80640 (0.0008) +[2023-10-08 14:59:21,753][102898] Updated weights for policy 1, policy_version 80740 (0.0009) +[2023-10-08 14:59:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 165249024. Throughput: 0: 1787.2, 1: 1780.2. Samples: 41320384. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:21,876][101941] Avg episode reward: [(0, '9.760'), (1, '12.140')] +[2023-10-08 14:59:22,119][102898] Updated weights for policy 1, policy_version 80750 (0.0008) +[2023-10-08 14:59:22,495][102898] Updated weights for policy 1, policy_version 80760 (0.0009) +[2023-10-08 14:59:22,769][102897] Updated weights for policy 0, policy_version 80650 (0.0008) +[2023-10-08 14:59:23,146][102897] Updated weights for policy 0, policy_version 80660 (0.0009) +[2023-10-08 14:59:23,513][102897] Updated weights for policy 0, policy_version 80670 (0.0008) +[2023-10-08 14:59:26,107][102898] Updated weights for policy 1, policy_version 80770 (0.0010) +[2023-10-08 14:59:26,479][102898] Updated weights for policy 1, policy_version 80780 (0.0009) +[2023-10-08 14:59:26,853][102898] Updated weights for policy 1, policy_version 80790 (0.0008) +[2023-10-08 14:59:26,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 165314560. Throughput: 0: 1784.0, 1: 1789.6. Samples: 41342544. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:26,876][101941] Avg episode reward: [(0, '8.680'), (1, '11.960')] +[2023-10-08 14:59:27,219][102898] Updated weights for policy 1, policy_version 80800 (0.0007) +[2023-10-08 14:59:27,302][102897] Updated weights for policy 0, policy_version 80680 (0.0010) +[2023-10-08 14:59:27,668][102897] Updated weights for policy 0, policy_version 80690 (0.0009) +[2023-10-08 14:59:28,041][102897] Updated weights for policy 0, policy_version 80700 (0.0009) +[2023-10-08 14:59:31,023][102898] Updated weights for policy 1, policy_version 80810 (0.0007) +[2023-10-08 14:59:31,389][102898] Updated weights for policy 1, policy_version 80820 (0.0007) +[2023-10-08 14:59:31,763][102898] Updated weights for policy 1, policy_version 80830 (0.0008) +[2023-10-08 14:59:31,834][102897] Updated weights for policy 0, policy_version 80710 (0.0008) +[2023-10-08 14:59:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 165412864. Throughput: 0: 1794.5, 1: 1783.0. Samples: 41363794. Policy #0 lag: (min: 31.0, avg: 33.3, max: 63.0) +[2023-10-08 14:59:31,876][101941] Avg episode reward: [(0, '8.010'), (1, '11.920')] +[2023-10-08 14:59:32,211][102897] Updated weights for policy 0, policy_version 80720 (0.0007) +[2023-10-08 14:59:32,568][102897] Updated weights for policy 0, policy_version 80730 (0.0009) +[2023-10-08 14:59:35,416][102898] Updated weights for policy 1, policy_version 80840 (0.0010) +[2023-10-08 14:59:35,787][102898] Updated weights for policy 1, policy_version 80850 (0.0010) +[2023-10-08 14:59:36,157][102898] Updated weights for policy 1, policy_version 80860 (0.0008) +[2023-10-08 14:59:36,297][102897] Updated weights for policy 0, policy_version 80740 (0.0008) +[2023-10-08 14:59:36,657][102897] Updated weights for policy 0, policy_version 80750 (0.0008) +[2023-10-08 14:59:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 165478400. Throughput: 0: 1782.8, 1: 1784.0. Samples: 41374672. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 14:59:36,876][101941] Avg episode reward: [(0, '8.130'), (1, '12.220')] +[2023-10-08 14:59:37,026][102897] Updated weights for policy 0, policy_version 80760 (0.0008) +[2023-10-08 14:59:39,850][102898] Updated weights for policy 1, policy_version 80870 (0.0008) +[2023-10-08 14:59:40,214][102898] Updated weights for policy 1, policy_version 80880 (0.0008) +[2023-10-08 14:59:40,570][102898] Updated weights for policy 1, policy_version 80890 (0.0008) +[2023-10-08 14:59:40,909][102897] Updated weights for policy 0, policy_version 80770 (0.0009) +[2023-10-08 14:59:41,278][102897] Updated weights for policy 0, policy_version 80780 (0.0010) +[2023-10-08 14:59:41,649][102897] Updated weights for policy 0, policy_version 80790 (0.0011) +[2023-10-08 14:59:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 165543936. Throughput: 0: 1783.1, 1: 1794.8. Samples: 41395930. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 14:59:41,876][101941] Avg episode reward: [(0, '8.360'), (1, '12.600')] +[2023-10-08 14:59:42,020][102897] Updated weights for policy 0, policy_version 80800 (0.0008) +[2023-10-08 14:59:44,341][102898] Updated weights for policy 1, policy_version 80900 (0.0010) +[2023-10-08 14:59:44,703][102898] Updated weights for policy 1, policy_version 80910 (0.0009) +[2023-10-08 14:59:45,066][102898] Updated weights for policy 1, policy_version 80920 (0.0008) +[2023-10-08 14:59:45,801][102897] Updated weights for policy 0, policy_version 80810 (0.0008) +[2023-10-08 14:59:46,169][102897] Updated weights for policy 0, policy_version 80820 (0.0007) +[2023-10-08 14:59:46,545][102897] Updated weights for policy 0, policy_version 80830 (0.0008) +[2023-10-08 14:59:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 165642240. Throughput: 0: 1781.0, 1: 1775.7. Samples: 41416664. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 14:59:46,876][101941] Avg episode reward: [(0, '8.700'), (1, '12.210')] +[2023-10-08 14:59:49,172][102898] Updated weights for policy 1, policy_version 80930 (0.0008) +[2023-10-08 14:59:49,580][102898] Updated weights for policy 1, policy_version 80940 (0.0007) +[2023-10-08 14:59:49,942][102898] Updated weights for policy 1, policy_version 80950 (0.0007) +[2023-10-08 14:59:50,275][102897] Updated weights for policy 0, policy_version 80840 (0.0007) +[2023-10-08 14:59:50,305][102898] Updated weights for policy 1, policy_version 80960 (0.0008) +[2023-10-08 14:59:50,641][102897] Updated weights for policy 0, policy_version 80850 (0.0009) +[2023-10-08 14:59:51,007][102897] Updated weights for policy 0, policy_version 80860 (0.0009) +[2023-10-08 14:59:51,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 165707776. Throughput: 0: 1782.6, 1: 1798.2. Samples: 41428344. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 14:59:51,877][101941] Avg episode reward: [(0, '9.170'), (1, '12.470')] +[2023-10-08 14:59:53,876][102898] Updated weights for policy 1, policy_version 80970 (0.0009) +[2023-10-08 14:59:54,253][102898] Updated weights for policy 1, policy_version 80980 (0.0009) +[2023-10-08 14:59:54,617][102898] Updated weights for policy 1, policy_version 80990 (0.0007) +[2023-10-08 14:59:54,795][102897] Updated weights for policy 0, policy_version 80870 (0.0009) +[2023-10-08 14:59:55,166][102897] Updated weights for policy 0, policy_version 80880 (0.0010) +[2023-10-08 14:59:55,544][102897] Updated weights for policy 0, policy_version 80890 (0.0009) +[2023-10-08 14:59:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 165773312. Throughput: 0: 1784.0, 1: 1776.9. Samples: 41448926. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 14:59:56,876][101941] Avg episode reward: [(0, '8.940'), (1, '12.090')] +[2023-10-08 14:59:58,295][102898] Updated weights for policy 1, policy_version 81000 (0.0008) +[2023-10-08 14:59:58,665][102898] Updated weights for policy 1, policy_version 81010 (0.0008) +[2023-10-08 14:59:59,025][102898] Updated weights for policy 1, policy_version 81020 (0.0008) +[2023-10-08 14:59:59,409][102897] Updated weights for policy 0, policy_version 80900 (0.0008) +[2023-10-08 14:59:59,782][102897] Updated weights for policy 0, policy_version 80910 (0.0007) +[2023-10-08 15:00:00,164][102897] Updated weights for policy 0, policy_version 80920 (0.0008) +[2023-10-08 15:00:01,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 165838848. Throughput: 0: 1766.9, 1: 1788.2. Samples: 41470816. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 15:00:01,875][101941] Avg episode reward: [(0, '8.000'), (1, '12.320')] +[2023-10-08 15:00:02,765][102898] Updated weights for policy 1, policy_version 81030 (0.0008) +[2023-10-08 15:00:03,124][102898] Updated weights for policy 1, policy_version 81040 (0.0007) +[2023-10-08 15:00:03,496][102898] Updated weights for policy 1, policy_version 81050 (0.0007) +[2023-10-08 15:00:03,965][102897] Updated weights for policy 0, policy_version 80930 (0.0009) +[2023-10-08 15:00:04,366][102897] Updated weights for policy 0, policy_version 80940 (0.0008) +[2023-10-08 15:00:04,752][102897] Updated weights for policy 0, policy_version 80950 (0.0009) +[2023-10-08 15:00:05,108][102897] Updated weights for policy 0, policy_version 80960 (0.0008) +[2023-10-08 15:00:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 165904384. Throughput: 0: 1791.4, 1: 1788.0. Samples: 41481454. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 15:00:06,876][101941] Avg episode reward: [(0, '8.560'), (1, '12.380')] +[2023-10-08 15:00:07,285][102898] Updated weights for policy 1, policy_version 81060 (0.0008) +[2023-10-08 15:00:07,643][102898] Updated weights for policy 1, policy_version 81070 (0.0010) +[2023-10-08 15:00:08,017][102898] Updated weights for policy 1, policy_version 81080 (0.0011) +[2023-10-08 15:00:08,911][102897] Updated weights for policy 0, policy_version 80970 (0.0009) +[2023-10-08 15:00:09,286][102897] Updated weights for policy 0, policy_version 80980 (0.0009) +[2023-10-08 15:00:09,660][102897] Updated weights for policy 0, policy_version 80990 (0.0008) +[2023-10-08 15:00:11,776][102898] Updated weights for policy 1, policy_version 81090 (0.0010) +[2023-10-08 15:00:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 165969920. Throughput: 0: 1774.1, 1: 1790.9. Samples: 41502972. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 15:00:11,876][101941] Avg episode reward: [(0, '8.840'), (1, '12.560')] +[2023-10-08 15:00:12,141][102898] Updated weights for policy 1, policy_version 81100 (0.0009) +[2023-10-08 15:00:12,508][102898] Updated weights for policy 1, policy_version 81110 (0.0007) +[2023-10-08 15:00:12,871][102898] Updated weights for policy 1, policy_version 81120 (0.0009) +[2023-10-08 15:00:13,422][102897] Updated weights for policy 0, policy_version 81000 (0.0009) +[2023-10-08 15:00:13,791][102897] Updated weights for policy 0, policy_version 81010 (0.0008) +[2023-10-08 15:00:14,163][102897] Updated weights for policy 0, policy_version 81020 (0.0007) +[2023-10-08 15:00:16,643][102898] Updated weights for policy 1, policy_version 81130 (0.0009) +[2023-10-08 15:00:16,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.6, 300 sec: 14218.0). Total num frames: 166035456. Throughput: 0: 1777.9, 1: 1806.7. Samples: 41525102. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 15:00:16,875][101941] Avg episode reward: [(0, '8.130'), (1, '13.430')] +[2023-10-08 15:00:16,884][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000081024_82968576.pth... +[2023-10-08 15:00:16,918][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000079360_81264640.pth +[2023-10-08 15:00:17,010][102898] Updated weights for policy 1, policy_version 81140 (0.0008) +[2023-10-08 15:00:17,374][102898] Updated weights for policy 1, policy_version 81150 (0.0008) +[2023-10-08 15:00:17,443][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000081152_83099648.pth... +[2023-10-08 15:00:17,474][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000079456_81362944.pth +[2023-10-08 15:00:17,805][102897] Updated weights for policy 0, policy_version 81030 (0.0007) +[2023-10-08 15:00:18,171][102897] Updated weights for policy 0, policy_version 81040 (0.0007) +[2023-10-08 15:00:18,548][102897] Updated weights for policy 0, policy_version 81050 (0.0008) +[2023-10-08 15:00:21,116][102898] Updated weights for policy 1, policy_version 81160 (0.0010) +[2023-10-08 15:00:21,484][102898] Updated weights for policy 1, policy_version 81170 (0.0010) +[2023-10-08 15:00:21,845][102898] Updated weights for policy 1, policy_version 81180 (0.0009) +[2023-10-08 15:00:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 166100992. Throughput: 0: 1776.8, 1: 1789.1. Samples: 41535136. Policy #0 lag: (min: 1.0, avg: 13.1, max: 33.0) +[2023-10-08 15:00:21,876][101941] Avg episode reward: [(0, '8.230'), (1, '13.330')] +[2023-10-08 15:00:22,237][102897] Updated weights for policy 0, policy_version 81060 (0.0008) +[2023-10-08 15:00:22,598][102897] Updated weights for policy 0, policy_version 81070 (0.0008) +[2023-10-08 15:00:22,976][102897] Updated weights for policy 0, policy_version 81080 (0.0008) +[2023-10-08 15:00:25,558][102898] Updated weights for policy 1, policy_version 81190 (0.0010) +[2023-10-08 15:00:25,911][102898] Updated weights for policy 1, policy_version 81200 (0.0009) +[2023-10-08 15:00:26,285][102898] Updated weights for policy 1, policy_version 81210 (0.0008) +[2023-10-08 15:00:26,800][102897] Updated weights for policy 0, policy_version 81090 (0.0010) +[2023-10-08 15:00:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 166199296. Throughput: 0: 1783.3, 1: 1807.2. Samples: 41557502. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:26,875][101941] Avg episode reward: [(0, '8.810'), (1, '13.720')] +[2023-10-08 15:00:26,876][102760] Saving new best policy, reward=13.720! +[2023-10-08 15:00:27,166][102897] Updated weights for policy 0, policy_version 81100 (0.0008) +[2023-10-08 15:00:27,541][102897] Updated weights for policy 0, policy_version 81110 (0.0009) +[2023-10-08 15:00:27,912][102897] Updated weights for policy 0, policy_version 81120 (0.0009) +[2023-10-08 15:00:30,034][102898] Updated weights for policy 1, policy_version 81220 (0.0008) +[2023-10-08 15:00:30,400][102898] Updated weights for policy 1, policy_version 81230 (0.0010) +[2023-10-08 15:00:30,764][102898] Updated weights for policy 1, policy_version 81240 (0.0008) +[2023-10-08 15:00:31,827][102897] Updated weights for policy 0, policy_version 81130 (0.0011) +[2023-10-08 15:00:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 166264832. Throughput: 0: 1797.3, 1: 1792.4. Samples: 41578204. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:31,876][101941] Avg episode reward: [(0, '8.340'), (1, '13.340')] +[2023-10-08 15:00:32,198][102897] Updated weights for policy 0, policy_version 81140 (0.0007) +[2023-10-08 15:00:32,579][102897] Updated weights for policy 0, policy_version 81150 (0.0007) +[2023-10-08 15:00:34,532][102898] Updated weights for policy 1, policy_version 81250 (0.0008) +[2023-10-08 15:00:34,944][102898] Updated weights for policy 1, policy_version 81260 (0.0007) +[2023-10-08 15:00:35,307][102898] Updated weights for policy 1, policy_version 81270 (0.0008) +[2023-10-08 15:00:35,677][102898] Updated weights for policy 1, policy_version 81280 (0.0008) +[2023-10-08 15:00:36,295][102897] Updated weights for policy 0, policy_version 81160 (0.0009) +[2023-10-08 15:00:36,665][102897] Updated weights for policy 0, policy_version 81170 (0.0007) +[2023-10-08 15:00:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 166330368. Throughput: 0: 1770.8, 1: 1810.7. Samples: 41589510. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:36,875][101941] Avg episode reward: [(0, '7.990'), (1, '12.610')] +[2023-10-08 15:00:37,041][102897] Updated weights for policy 0, policy_version 81180 (0.0007) +[2023-10-08 15:00:39,345][102898] Updated weights for policy 1, policy_version 81290 (0.0009) +[2023-10-08 15:00:39,715][102898] Updated weights for policy 1, policy_version 81300 (0.0007) +[2023-10-08 15:00:40,084][102898] Updated weights for policy 1, policy_version 81310 (0.0007) +[2023-10-08 15:00:40,967][102897] Updated weights for policy 0, policy_version 81190 (0.0008) +[2023-10-08 15:00:41,345][102897] Updated weights for policy 0, policy_version 81200 (0.0008) +[2023-10-08 15:00:41,718][102897] Updated weights for policy 0, policy_version 81210 (0.0007) +[2023-10-08 15:00:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 166395904. Throughput: 0: 1786.8, 1: 1801.2. Samples: 41610390. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:41,876][101941] Avg episode reward: [(0, '8.470'), (1, '11.580')] +[2023-10-08 15:00:43,986][102898] Updated weights for policy 1, policy_version 81320 (0.0010) +[2023-10-08 15:00:44,354][102898] Updated weights for policy 1, policy_version 81330 (0.0007) +[2023-10-08 15:00:44,724][102898] Updated weights for policy 1, policy_version 81340 (0.0009) +[2023-10-08 15:00:45,514][102897] Updated weights for policy 0, policy_version 81220 (0.0010) +[2023-10-08 15:00:45,890][102897] Updated weights for policy 0, policy_version 81230 (0.0009) +[2023-10-08 15:00:46,257][102897] Updated weights for policy 0, policy_version 81240 (0.0007) +[2023-10-08 15:00:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 166494208. Throughput: 0: 1774.8, 1: 1792.4. Samples: 41631338. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:46,876][101941] Avg episode reward: [(0, '8.960'), (1, '11.840')] +[2023-10-08 15:00:48,560][102898] Updated weights for policy 1, policy_version 81350 (0.0009) +[2023-10-08 15:00:48,918][102898] Updated weights for policy 1, policy_version 81360 (0.0007) +[2023-10-08 15:00:49,277][102898] Updated weights for policy 1, policy_version 81370 (0.0011) +[2023-10-08 15:00:50,050][102897] Updated weights for policy 0, policy_version 81250 (0.0008) +[2023-10-08 15:00:50,452][102897] Updated weights for policy 0, policy_version 81260 (0.0007) +[2023-10-08 15:00:50,830][102897] Updated weights for policy 0, policy_version 81270 (0.0007) +[2023-10-08 15:00:51,194][102897] Updated weights for policy 0, policy_version 81280 (0.0008) +[2023-10-08 15:00:51,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 166559744. Throughput: 0: 1781.1, 1: 1791.2. Samples: 41642208. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:51,876][101941] Avg episode reward: [(0, '9.090'), (1, '11.540')] +[2023-10-08 15:00:53,121][102898] Updated weights for policy 1, policy_version 81380 (0.0009) +[2023-10-08 15:00:53,486][102898] Updated weights for policy 1, policy_version 81390 (0.0010) +[2023-10-08 15:00:53,854][102898] Updated weights for policy 1, policy_version 81400 (0.0009) +[2023-10-08 15:00:55,032][102897] Updated weights for policy 0, policy_version 81290 (0.0009) +[2023-10-08 15:00:55,397][102897] Updated weights for policy 0, policy_version 81300 (0.0011) +[2023-10-08 15:00:55,763][102897] Updated weights for policy 0, policy_version 81310 (0.0008) +[2023-10-08 15:00:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 166625280. Throughput: 0: 1780.2, 1: 1780.0. Samples: 41663180. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:00:56,875][101941] Avg episode reward: [(0, '8.600'), (1, '11.850')] +[2023-10-08 15:00:57,725][102898] Updated weights for policy 1, policy_version 81410 (0.0010) +[2023-10-08 15:00:58,091][102898] Updated weights for policy 1, policy_version 81420 (0.0008) +[2023-10-08 15:00:58,450][102898] Updated weights for policy 1, policy_version 81430 (0.0010) +[2023-10-08 15:00:58,817][102898] Updated weights for policy 1, policy_version 81440 (0.0008) +[2023-10-08 15:00:59,407][102897] Updated weights for policy 0, policy_version 81320 (0.0008) +[2023-10-08 15:00:59,778][102897] Updated weights for policy 0, policy_version 81330 (0.0007) +[2023-10-08 15:01:00,147][102897] Updated weights for policy 0, policy_version 81340 (0.0010) +[2023-10-08 15:01:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 166690816. Throughput: 0: 1765.2, 1: 1790.4. Samples: 41685104. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:01:01,876][101941] Avg episode reward: [(0, '9.110'), (1, '11.850')] +[2023-10-08 15:01:02,541][102898] Updated weights for policy 1, policy_version 81450 (0.0010) +[2023-10-08 15:01:02,902][102898] Updated weights for policy 1, policy_version 81460 (0.0010) +[2023-10-08 15:01:03,266][102898] Updated weights for policy 1, policy_version 81470 (0.0010) +[2023-10-08 15:01:04,048][102897] Updated weights for policy 0, policy_version 81350 (0.0009) +[2023-10-08 15:01:04,405][102897] Updated weights for policy 0, policy_version 81360 (0.0010) +[2023-10-08 15:01:04,781][102897] Updated weights for policy 0, policy_version 81370 (0.0008) +[2023-10-08 15:01:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 166756352. Throughput: 0: 1785.6, 1: 1786.0. Samples: 41695856. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:01:06,876][101941] Avg episode reward: [(0, '9.050'), (1, '12.060')] +[2023-10-08 15:01:06,965][102898] Updated weights for policy 1, policy_version 81480 (0.0009) +[2023-10-08 15:01:07,330][102898] Updated weights for policy 1, policy_version 81490 (0.0007) +[2023-10-08 15:01:07,689][102898] Updated weights for policy 1, policy_version 81500 (0.0007) +[2023-10-08 15:01:08,373][102897] Updated weights for policy 0, policy_version 81380 (0.0008) +[2023-10-08 15:01:08,742][102897] Updated weights for policy 0, policy_version 81390 (0.0007) +[2023-10-08 15:01:09,110][102897] Updated weights for policy 0, policy_version 81400 (0.0007) +[2023-10-08 15:01:11,590][102898] Updated weights for policy 1, policy_version 81510 (0.0009) +[2023-10-08 15:01:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 166821888. Throughput: 0: 1772.6, 1: 1783.8. Samples: 41717542. Policy #0 lag: (min: 17.0, avg: 26.5, max: 49.0) +[2023-10-08 15:01:11,875][101941] Avg episode reward: [(0, '9.250'), (1, '12.410')] +[2023-10-08 15:01:11,958][102898] Updated weights for policy 1, policy_version 81520 (0.0010) +[2023-10-08 15:01:12,322][102898] Updated weights for policy 1, policy_version 81530 (0.0009) +[2023-10-08 15:01:12,934][102897] Updated weights for policy 0, policy_version 81410 (0.0008) +[2023-10-08 15:01:13,297][102897] Updated weights for policy 0, policy_version 81420 (0.0010) +[2023-10-08 15:01:13,658][102897] Updated weights for policy 0, policy_version 81430 (0.0010) +[2023-10-08 15:01:14,028][102897] Updated weights for policy 0, policy_version 81440 (0.0010) +[2023-10-08 15:01:15,920][102898] Updated weights for policy 1, policy_version 81540 (0.0007) +[2023-10-08 15:01:16,288][102898] Updated weights for policy 1, policy_version 81550 (0.0008) +[2023-10-08 15:01:16,645][102898] Updated weights for policy 1, policy_version 81560 (0.0007) +[2023-10-08 15:01:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 166887424. Throughput: 0: 1779.4, 1: 1794.5. Samples: 41739028. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:16,876][101941] Avg episode reward: [(0, '8.910'), (1, '11.860')] +[2023-10-08 15:01:17,709][102897] Updated weights for policy 0, policy_version 81450 (0.0011) +[2023-10-08 15:01:18,072][102897] Updated weights for policy 0, policy_version 81460 (0.0009) +[2023-10-08 15:01:18,452][102897] Updated weights for policy 0, policy_version 81470 (0.0008) +[2023-10-08 15:01:20,581][102898] Updated weights for policy 1, policy_version 81570 (0.0008) +[2023-10-08 15:01:20,984][102898] Updated weights for policy 1, policy_version 81580 (0.0009) +[2023-10-08 15:01:21,353][102898] Updated weights for policy 1, policy_version 81590 (0.0007) +[2023-10-08 15:01:21,724][102898] Updated weights for policy 1, policy_version 81600 (0.0009) +[2023-10-08 15:01:21,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 166985728. Throughput: 0: 1779.5, 1: 1777.2. Samples: 41749564. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:21,876][101941] Avg episode reward: [(0, '8.450'), (1, '12.630')] +[2023-10-08 15:01:22,194][102897] Updated weights for policy 0, policy_version 81480 (0.0008) +[2023-10-08 15:01:22,575][102897] Updated weights for policy 0, policy_version 81490 (0.0008) +[2023-10-08 15:01:22,940][102897] Updated weights for policy 0, policy_version 81500 (0.0009) +[2023-10-08 15:01:25,501][102898] Updated weights for policy 1, policy_version 81610 (0.0011) +[2023-10-08 15:01:25,862][102898] Updated weights for policy 1, policy_version 81620 (0.0010) +[2023-10-08 15:01:26,230][102898] Updated weights for policy 1, policy_version 81630 (0.0008) +[2023-10-08 15:01:26,602][102897] Updated weights for policy 0, policy_version 81510 (0.0007) +[2023-10-08 15:01:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 167051264. Throughput: 0: 1784.1, 1: 1792.0. Samples: 41771318. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:26,876][101941] Avg episode reward: [(0, '9.120'), (1, '12.430')] +[2023-10-08 15:01:26,976][102897] Updated weights for policy 0, policy_version 81520 (0.0009) +[2023-10-08 15:01:27,351][102897] Updated weights for policy 0, policy_version 81530 (0.0007) +[2023-10-08 15:01:29,929][102898] Updated weights for policy 1, policy_version 81640 (0.0007) +[2023-10-08 15:01:30,285][102898] Updated weights for policy 1, policy_version 81650 (0.0008) +[2023-10-08 15:01:30,654][102898] Updated weights for policy 1, policy_version 81660 (0.0008) +[2023-10-08 15:01:31,196][102897] Updated weights for policy 0, policy_version 81540 (0.0009) +[2023-10-08 15:01:31,566][102897] Updated weights for policy 0, policy_version 81550 (0.0007) +[2023-10-08 15:01:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 167116800. Throughput: 0: 1807.1, 1: 1773.0. Samples: 41792440. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:31,876][101941] Avg episode reward: [(0, '9.200'), (1, '12.540')] +[2023-10-08 15:01:31,932][102897] Updated weights for policy 0, policy_version 81560 (0.0008) +[2023-10-08 15:01:34,309][102898] Updated weights for policy 1, policy_version 81670 (0.0010) +[2023-10-08 15:01:34,679][102898] Updated weights for policy 1, policy_version 81680 (0.0009) +[2023-10-08 15:01:35,042][102898] Updated weights for policy 1, policy_version 81690 (0.0007) +[2023-10-08 15:01:35,792][102897] Updated weights for policy 0, policy_version 81570 (0.0011) +[2023-10-08 15:01:36,199][102897] Updated weights for policy 0, policy_version 81580 (0.0008) +[2023-10-08 15:01:36,566][102897] Updated weights for policy 0, policy_version 81590 (0.0007) +[2023-10-08 15:01:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 167182336. Throughput: 0: 1788.4, 1: 1794.6. Samples: 41803446. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:36,876][101941] Avg episode reward: [(0, '9.570'), (1, '12.210')] +[2023-10-08 15:01:36,935][102897] Updated weights for policy 0, policy_version 81600 (0.0008) +[2023-10-08 15:01:38,781][102898] Updated weights for policy 1, policy_version 81700 (0.0009) +[2023-10-08 15:01:39,158][102898] Updated weights for policy 1, policy_version 81710 (0.0009) +[2023-10-08 15:01:39,530][102898] Updated weights for policy 1, policy_version 81720 (0.0009) +[2023-10-08 15:01:40,691][102897] Updated weights for policy 0, policy_version 81610 (0.0009) +[2023-10-08 15:01:41,055][102897] Updated weights for policy 0, policy_version 81620 (0.0007) +[2023-10-08 15:01:41,427][102897] Updated weights for policy 0, policy_version 81630 (0.0009) +[2023-10-08 15:01:41,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 167280640. Throughput: 0: 1812.3, 1: 1780.4. Samples: 41824852. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:41,878][101941] Avg episode reward: [(0, '9.610'), (1, '12.140')] +[2023-10-08 15:01:43,358][102898] Updated weights for policy 1, policy_version 81730 (0.0009) +[2023-10-08 15:01:43,731][102898] Updated weights for policy 1, policy_version 81740 (0.0008) +[2023-10-08 15:01:44,093][102898] Updated weights for policy 1, policy_version 81750 (0.0008) +[2023-10-08 15:01:44,465][102898] Updated weights for policy 1, policy_version 81760 (0.0010) +[2023-10-08 15:01:45,114][102897] Updated weights for policy 0, policy_version 81640 (0.0009) +[2023-10-08 15:01:45,496][102897] Updated weights for policy 0, policy_version 81650 (0.0009) +[2023-10-08 15:01:45,862][102897] Updated weights for policy 0, policy_version 81660 (0.0009) +[2023-10-08 15:01:46,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 167346176. Throughput: 0: 1792.8, 1: 1778.8. Samples: 41845822. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:46,876][101941] Avg episode reward: [(0, '9.630'), (1, '11.560')] +[2023-10-08 15:01:48,169][102898] Updated weights for policy 1, policy_version 81770 (0.0010) +[2023-10-08 15:01:48,530][102898] Updated weights for policy 1, policy_version 81780 (0.0010) +[2023-10-08 15:01:48,899][102898] Updated weights for policy 1, policy_version 81790 (0.0010) +[2023-10-08 15:01:49,560][102897] Updated weights for policy 0, policy_version 81670 (0.0007) +[2023-10-08 15:01:49,930][102897] Updated weights for policy 0, policy_version 81680 (0.0008) +[2023-10-08 15:01:50,304][102897] Updated weights for policy 0, policy_version 81690 (0.0007) +[2023-10-08 15:01:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 167411712. Throughput: 0: 1800.1, 1: 1776.7. Samples: 41856810. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:51,875][101941] Avg episode reward: [(0, '8.730'), (1, '11.540')] +[2023-10-08 15:01:52,593][102898] Updated weights for policy 1, policy_version 81800 (0.0009) +[2023-10-08 15:01:52,963][102898] Updated weights for policy 1, policy_version 81810 (0.0008) +[2023-10-08 15:01:53,323][102898] Updated weights for policy 1, policy_version 81820 (0.0008) +[2023-10-08 15:01:54,121][102897] Updated weights for policy 0, policy_version 81700 (0.0007) +[2023-10-08 15:01:54,498][102897] Updated weights for policy 0, policy_version 81710 (0.0009) +[2023-10-08 15:01:54,870][102897] Updated weights for policy 0, policy_version 81720 (0.0009) +[2023-10-08 15:01:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 167477248. Throughput: 0: 1778.0, 1: 1785.2. Samples: 41877882. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:01:56,876][101941] Avg episode reward: [(0, '8.640'), (1, '12.160')] +[2023-10-08 15:01:56,982][102898] Updated weights for policy 1, policy_version 81830 (0.0008) +[2023-10-08 15:01:57,345][102898] Updated weights for policy 1, policy_version 81840 (0.0010) +[2023-10-08 15:01:57,707][102898] Updated weights for policy 1, policy_version 81850 (0.0008) +[2023-10-08 15:01:58,649][102897] Updated weights for policy 0, policy_version 81730 (0.0010) +[2023-10-08 15:01:59,021][102897] Updated weights for policy 0, policy_version 81740 (0.0010) +[2023-10-08 15:01:59,388][102897] Updated weights for policy 0, policy_version 81750 (0.0010) +[2023-10-08 15:01:59,753][102897] Updated weights for policy 0, policy_version 81760 (0.0009) +[2023-10-08 15:02:01,702][102898] Updated weights for policy 1, policy_version 81860 (0.0009) +[2023-10-08 15:02:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 167542784. Throughput: 0: 1779.8, 1: 1800.2. Samples: 41900128. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:02:01,876][101941] Avg episode reward: [(0, '10.380'), (1, '12.800')] +[2023-10-08 15:02:01,888][102634] Saving new best policy, reward=10.380! +[2023-10-08 15:02:02,069][102898] Updated weights for policy 1, policy_version 81870 (0.0010) +[2023-10-08 15:02:02,431][102898] Updated weights for policy 1, policy_version 81880 (0.0008) +[2023-10-08 15:02:03,501][102897] Updated weights for policy 0, policy_version 81770 (0.0008) +[2023-10-08 15:02:03,883][102897] Updated weights for policy 0, policy_version 81780 (0.0008) +[2023-10-08 15:02:04,254][102897] Updated weights for policy 0, policy_version 81790 (0.0007) +[2023-10-08 15:02:06,175][102898] Updated weights for policy 1, policy_version 81890 (0.0007) +[2023-10-08 15:02:06,540][102898] Updated weights for policy 1, policy_version 81900 (0.0007) +[2023-10-08 15:02:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 167608320. Throughput: 0: 1778.8, 1: 1782.7. Samples: 41909832. Policy #0 lag: (min: 29.0, avg: 36.8, max: 61.0) +[2023-10-08 15:02:06,875][101941] Avg episode reward: [(0, '9.390'), (1, '12.890')] +[2023-10-08 15:02:06,910][102898] Updated weights for policy 1, policy_version 81910 (0.0007) +[2023-10-08 15:02:07,271][102898] Updated weights for policy 1, policy_version 81920 (0.0007) +[2023-10-08 15:02:08,035][102897] Updated weights for policy 0, policy_version 81800 (0.0008) +[2023-10-08 15:02:08,411][102897] Updated weights for policy 0, policy_version 81810 (0.0009) +[2023-10-08 15:02:08,775][102897] Updated weights for policy 0, policy_version 81820 (0.0009) +[2023-10-08 15:02:10,969][102898] Updated weights for policy 1, policy_version 81930 (0.0009) +[2023-10-08 15:02:11,331][102898] Updated weights for policy 1, policy_version 81940 (0.0007) +[2023-10-08 15:02:11,703][102898] Updated weights for policy 1, policy_version 81950 (0.0009) +[2023-10-08 15:02:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 167706624. Throughput: 0: 1775.0, 1: 1800.9. Samples: 41932232. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:11,876][101941] Avg episode reward: [(0, '9.120'), (1, '12.550')] +[2023-10-08 15:02:12,599][102897] Updated weights for policy 0, policy_version 81830 (0.0009) +[2023-10-08 15:02:12,973][102897] Updated weights for policy 0, policy_version 81840 (0.0011) +[2023-10-08 15:02:13,347][102897] Updated weights for policy 0, policy_version 81850 (0.0008) +[2023-10-08 15:02:15,621][102898] Updated weights for policy 1, policy_version 81960 (0.0010) +[2023-10-08 15:02:15,986][102898] Updated weights for policy 1, policy_version 81970 (0.0009) +[2023-10-08 15:02:16,355][102898] Updated weights for policy 1, policy_version 81980 (0.0008) +[2023-10-08 15:02:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 167772160. Throughput: 0: 1780.6, 1: 1795.7. Samples: 41953374. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:16,875][101941] Avg episode reward: [(0, '8.770'), (1, '12.720')] +[2023-10-08 15:02:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000081984_83951616.pth... +[2023-10-08 15:02:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000081856_83820544.pth... +[2023-10-08 15:02:16,923][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000080192_82116608.pth +[2023-10-08 15:02:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000080288_82214912.pth +[2023-10-08 15:02:17,192][102897] Updated weights for policy 0, policy_version 81860 (0.0009) +[2023-10-08 15:02:17,568][102897] Updated weights for policy 0, policy_version 81870 (0.0008) +[2023-10-08 15:02:17,934][102897] Updated weights for policy 0, policy_version 81880 (0.0007) +[2023-10-08 15:02:20,050][102898] Updated weights for policy 1, policy_version 81990 (0.0008) +[2023-10-08 15:02:20,410][102898] Updated weights for policy 1, policy_version 82000 (0.0008) +[2023-10-08 15:02:20,769][102898] Updated weights for policy 1, policy_version 82010 (0.0010) +[2023-10-08 15:02:21,734][102897] Updated weights for policy 0, policy_version 81890 (0.0010) +[2023-10-08 15:02:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 167837696. Throughput: 0: 1772.8, 1: 1808.1. Samples: 41964586. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:21,876][101941] Avg episode reward: [(0, '8.440'), (1, '12.560')] +[2023-10-08 15:02:22,096][102897] Updated weights for policy 0, policy_version 81900 (0.0008) +[2023-10-08 15:02:22,466][102897] Updated weights for policy 0, policy_version 81910 (0.0008) +[2023-10-08 15:02:22,839][102897] Updated weights for policy 0, policy_version 81920 (0.0007) +[2023-10-08 15:02:24,407][102898] Updated weights for policy 1, policy_version 82020 (0.0007) +[2023-10-08 15:02:24,768][102898] Updated weights for policy 1, policy_version 82030 (0.0009) +[2023-10-08 15:02:25,127][102898] Updated weights for policy 1, policy_version 82040 (0.0007) +[2023-10-08 15:02:26,594][102897] Updated weights for policy 0, policy_version 81930 (0.0007) +[2023-10-08 15:02:26,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 167903232. Throughput: 0: 1769.8, 1: 1803.3. Samples: 41985642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:26,876][101941] Avg episode reward: [(0, '8.800'), (1, '12.740')] +[2023-10-08 15:02:26,951][102897] Updated weights for policy 0, policy_version 81940 (0.0010) +[2023-10-08 15:02:27,321][102897] Updated weights for policy 0, policy_version 81950 (0.0011) +[2023-10-08 15:02:28,808][102898] Updated weights for policy 1, policy_version 82050 (0.0010) +[2023-10-08 15:02:29,173][102898] Updated weights for policy 1, policy_version 82060 (0.0007) +[2023-10-08 15:02:29,542][102898] Updated weights for policy 1, policy_version 82070 (0.0009) +[2023-10-08 15:02:29,903][102898] Updated weights for policy 1, policy_version 82080 (0.0007) +[2023-10-08 15:02:31,153][102897] Updated weights for policy 0, policy_version 81960 (0.0008) +[2023-10-08 15:02:31,528][102897] Updated weights for policy 0, policy_version 81970 (0.0007) +[2023-10-08 15:02:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 167968768. Throughput: 0: 1784.5, 1: 1800.6. Samples: 42007152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:31,875][101941] Avg episode reward: [(0, '9.210'), (1, '13.260')] +[2023-10-08 15:02:31,890][102897] Updated weights for policy 0, policy_version 81980 (0.0010) +[2023-10-08 15:02:33,566][102898] Updated weights for policy 1, policy_version 82090 (0.0008) +[2023-10-08 15:02:33,935][102898] Updated weights for policy 1, policy_version 82100 (0.0010) +[2023-10-08 15:02:34,293][102898] Updated weights for policy 1, policy_version 82110 (0.0008) +[2023-10-08 15:02:35,572][102897] Updated weights for policy 0, policy_version 81990 (0.0008) +[2023-10-08 15:02:35,951][102897] Updated weights for policy 0, policy_version 82000 (0.0009) +[2023-10-08 15:02:36,324][102897] Updated weights for policy 0, policy_version 82010 (0.0008) +[2023-10-08 15:02:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 168067072. Throughput: 0: 1770.3, 1: 1803.1. Samples: 42017614. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:36,876][101941] Avg episode reward: [(0, '8.400'), (1, '13.870')] +[2023-10-08 15:02:36,878][102760] Saving new best policy, reward=13.870! +[2023-10-08 15:02:38,029][102898] Updated weights for policy 1, policy_version 82120 (0.0009) +[2023-10-08 15:02:38,388][102898] Updated weights for policy 1, policy_version 82130 (0.0010) +[2023-10-08 15:02:38,764][102898] Updated weights for policy 1, policy_version 82140 (0.0009) +[2023-10-08 15:02:39,975][102897] Updated weights for policy 0, policy_version 82020 (0.0009) +[2023-10-08 15:02:40,334][102897] Updated weights for policy 0, policy_version 82030 (0.0009) +[2023-10-08 15:02:40,709][102897] Updated weights for policy 0, policy_version 82040 (0.0008) +[2023-10-08 15:02:41,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 168132608. Throughput: 0: 1794.3, 1: 1798.0. Samples: 42039540. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:41,876][101941] Avg episode reward: [(0, '9.400'), (1, '12.190')] +[2023-10-08 15:02:42,596][102898] Updated weights for policy 1, policy_version 82150 (0.0009) +[2023-10-08 15:02:42,954][102898] Updated weights for policy 1, policy_version 82160 (0.0011) +[2023-10-08 15:02:43,321][102898] Updated weights for policy 1, policy_version 82170 (0.0009) +[2023-10-08 15:02:44,607][102897] Updated weights for policy 0, policy_version 82050 (0.0008) +[2023-10-08 15:02:44,978][102897] Updated weights for policy 0, policy_version 82060 (0.0009) +[2023-10-08 15:02:45,340][102897] Updated weights for policy 0, policy_version 82070 (0.0009) +[2023-10-08 15:02:45,711][102897] Updated weights for policy 0, policy_version 82080 (0.0008) +[2023-10-08 15:02:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 168198144. Throughput: 0: 1771.7, 1: 1800.4. Samples: 42060874. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:46,876][101941] Avg episode reward: [(0, '8.720'), (1, '12.430')] +[2023-10-08 15:02:47,111][102898] Updated weights for policy 1, policy_version 82180 (0.0009) +[2023-10-08 15:02:47,479][102898] Updated weights for policy 1, policy_version 82190 (0.0007) +[2023-10-08 15:02:47,842][102898] Updated weights for policy 1, policy_version 82200 (0.0008) +[2023-10-08 15:02:49,579][102897] Updated weights for policy 0, policy_version 82090 (0.0010) +[2023-10-08 15:02:49,950][102897] Updated weights for policy 0, policy_version 82100 (0.0008) +[2023-10-08 15:02:50,330][102897] Updated weights for policy 0, policy_version 82110 (0.0009) +[2023-10-08 15:02:51,672][102898] Updated weights for policy 1, policy_version 82210 (0.0007) +[2023-10-08 15:02:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 168263680. Throughput: 0: 1798.7, 1: 1798.0. Samples: 42071686. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:51,875][101941] Avg episode reward: [(0, '9.090'), (1, '11.860')] +[2023-10-08 15:02:52,051][102898] Updated weights for policy 1, policy_version 82220 (0.0007) +[2023-10-08 15:02:52,423][102898] Updated weights for policy 1, policy_version 82230 (0.0007) +[2023-10-08 15:02:52,787][102898] Updated weights for policy 1, policy_version 82240 (0.0007) +[2023-10-08 15:02:54,119][102897] Updated weights for policy 0, policy_version 82120 (0.0011) +[2023-10-08 15:02:54,486][102897] Updated weights for policy 0, policy_version 82130 (0.0008) +[2023-10-08 15:02:54,863][102897] Updated weights for policy 0, policy_version 82140 (0.0007) +[2023-10-08 15:02:56,540][102898] Updated weights for policy 1, policy_version 82250 (0.0009) +[2023-10-08 15:02:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 168329216. Throughput: 0: 1771.9, 1: 1796.0. Samples: 42092788. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:02:56,875][101941] Avg episode reward: [(0, '9.260'), (1, '12.020')] +[2023-10-08 15:02:56,908][102898] Updated weights for policy 1, policy_version 82260 (0.0008) +[2023-10-08 15:02:57,267][102898] Updated weights for policy 1, policy_version 82270 (0.0011) +[2023-10-08 15:02:58,572][102897] Updated weights for policy 0, policy_version 82150 (0.0007) +[2023-10-08 15:02:58,941][102897] Updated weights for policy 0, policy_version 82160 (0.0009) +[2023-10-08 15:02:59,308][102897] Updated weights for policy 0, policy_version 82170 (0.0007) +[2023-10-08 15:03:00,865][102898] Updated weights for policy 1, policy_version 82280 (0.0009) +[2023-10-08 15:03:01,231][102898] Updated weights for policy 1, policy_version 82290 (0.0008) +[2023-10-08 15:03:01,611][102898] Updated weights for policy 1, policy_version 82300 (0.0009) +[2023-10-08 15:03:01,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 168427520. Throughput: 0: 1776.1, 1: 1802.7. Samples: 42114420. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:01,876][101941] Avg episode reward: [(0, '9.510'), (1, '11.440')] +[2023-10-08 15:03:03,058][102897] Updated weights for policy 0, policy_version 82180 (0.0008) +[2023-10-08 15:03:03,425][102897] Updated weights for policy 0, policy_version 82190 (0.0007) +[2023-10-08 15:03:03,800][102897] Updated weights for policy 0, policy_version 82200 (0.0008) +[2023-10-08 15:03:05,402][102898] Updated weights for policy 1, policy_version 82310 (0.0008) +[2023-10-08 15:03:05,760][102898] Updated weights for policy 1, policy_version 82320 (0.0008) +[2023-10-08 15:03:06,122][102898] Updated weights for policy 1, policy_version 82330 (0.0007) +[2023-10-08 15:03:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 168493056. Throughput: 0: 1779.9, 1: 1794.6. Samples: 42125438. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:06,875][101941] Avg episode reward: [(0, '9.350'), (1, '12.350')] +[2023-10-08 15:03:07,743][102897] Updated weights for policy 0, policy_version 82210 (0.0008) +[2023-10-08 15:03:08,128][102897] Updated weights for policy 0, policy_version 82220 (0.0010) +[2023-10-08 15:03:08,500][102897] Updated weights for policy 0, policy_version 82230 (0.0009) +[2023-10-08 15:03:08,867][102897] Updated weights for policy 0, policy_version 82240 (0.0008) +[2023-10-08 15:03:09,769][102898] Updated weights for policy 1, policy_version 82340 (0.0009) +[2023-10-08 15:03:10,131][102898] Updated weights for policy 1, policy_version 82350 (0.0010) +[2023-10-08 15:03:10,502][102898] Updated weights for policy 1, policy_version 82360 (0.0007) +[2023-10-08 15:03:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 168558592. Throughput: 0: 1781.6, 1: 1801.1. Samples: 42146864. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:11,876][101941] Avg episode reward: [(0, '10.190'), (1, '12.330')] +[2023-10-08 15:03:12,470][102897] Updated weights for policy 0, policy_version 82250 (0.0008) +[2023-10-08 15:03:12,835][102897] Updated weights for policy 0, policy_version 82260 (0.0009) +[2023-10-08 15:03:13,210][102897] Updated weights for policy 0, policy_version 82270 (0.0008) +[2023-10-08 15:03:14,297][102898] Updated weights for policy 1, policy_version 82370 (0.0008) +[2023-10-08 15:03:14,667][102898] Updated weights for policy 1, policy_version 82380 (0.0010) +[2023-10-08 15:03:15,029][102898] Updated weights for policy 1, policy_version 82390 (0.0009) +[2023-10-08 15:03:15,397][102898] Updated weights for policy 1, policy_version 82400 (0.0008) +[2023-10-08 15:03:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 168624128. Throughput: 0: 1800.3, 1: 1791.8. Samples: 42168798. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:16,875][101941] Avg episode reward: [(0, '10.620'), (1, '13.190')] +[2023-10-08 15:03:16,914][102897] Updated weights for policy 0, policy_version 82280 (0.0010) +[2023-10-08 15:03:17,283][102897] Updated weights for policy 0, policy_version 82290 (0.0011) +[2023-10-08 15:03:17,664][102897] Updated weights for policy 0, policy_version 82300 (0.0009) +[2023-10-08 15:03:17,804][102634] Saving new best policy, reward=10.620! +[2023-10-08 15:03:19,253][102898] Updated weights for policy 1, policy_version 82410 (0.0008) +[2023-10-08 15:03:19,626][102898] Updated weights for policy 1, policy_version 82420 (0.0008) +[2023-10-08 15:03:19,990][102898] Updated weights for policy 1, policy_version 82430 (0.0008) +[2023-10-08 15:03:21,561][102897] Updated weights for policy 0, policy_version 82310 (0.0007) +[2023-10-08 15:03:21,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 168689664. Throughput: 0: 1785.2, 1: 1806.6. Samples: 42179244. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:21,875][101941] Avg episode reward: [(0, '9.980'), (1, '12.270')] +[2023-10-08 15:03:21,938][102897] Updated weights for policy 0, policy_version 82320 (0.0008) +[2023-10-08 15:03:22,304][102897] Updated weights for policy 0, policy_version 82330 (0.0007) +[2023-10-08 15:03:23,830][102898] Updated weights for policy 1, policy_version 82440 (0.0009) +[2023-10-08 15:03:24,197][102898] Updated weights for policy 1, policy_version 82450 (0.0007) +[2023-10-08 15:03:24,568][102898] Updated weights for policy 1, policy_version 82460 (0.0008) +[2023-10-08 15:03:26,072][102897] Updated weights for policy 0, policy_version 82340 (0.0007) +[2023-10-08 15:03:26,437][102897] Updated weights for policy 0, policy_version 82350 (0.0007) +[2023-10-08 15:03:26,807][102897] Updated weights for policy 0, policy_version 82360 (0.0007) +[2023-10-08 15:03:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 168755200. Throughput: 0: 1793.1, 1: 1787.4. Samples: 42200662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:26,875][101941] Avg episode reward: [(0, '10.140'), (1, '12.950')] +[2023-10-08 15:03:28,264][102898] Updated weights for policy 1, policy_version 82470 (0.0008) +[2023-10-08 15:03:28,633][102898] Updated weights for policy 1, policy_version 82480 (0.0007) +[2023-10-08 15:03:28,994][102898] Updated weights for policy 1, policy_version 82490 (0.0011) +[2023-10-08 15:03:30,480][102897] Updated weights for policy 0, policy_version 82370 (0.0007) +[2023-10-08 15:03:30,840][102897] Updated weights for policy 0, policy_version 82380 (0.0008) +[2023-10-08 15:03:31,207][102897] Updated weights for policy 0, policy_version 82390 (0.0007) +[2023-10-08 15:03:31,580][102897] Updated weights for policy 0, policy_version 82400 (0.0007) +[2023-10-08 15:03:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 168853504. Throughput: 0: 1788.9, 1: 1795.0. Samples: 42222148. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:31,876][101941] Avg episode reward: [(0, '9.170'), (1, '12.990')] +[2023-10-08 15:03:32,713][102898] Updated weights for policy 1, policy_version 82500 (0.0008) +[2023-10-08 15:03:33,082][102898] Updated weights for policy 1, policy_version 82510 (0.0008) +[2023-10-08 15:03:33,451][102898] Updated weights for policy 1, policy_version 82520 (0.0008) +[2023-10-08 15:03:35,433][102897] Updated weights for policy 0, policy_version 82410 (0.0010) +[2023-10-08 15:03:35,805][102897] Updated weights for policy 0, policy_version 82420 (0.0007) +[2023-10-08 15:03:36,176][102897] Updated weights for policy 0, policy_version 82430 (0.0008) +[2023-10-08 15:03:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 168919040. Throughput: 0: 1789.3, 1: 1798.1. Samples: 42233120. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:36,876][101941] Avg episode reward: [(0, '8.720'), (1, '13.060')] +[2023-10-08 15:03:37,176][102898] Updated weights for policy 1, policy_version 82530 (0.0008) +[2023-10-08 15:03:37,590][102898] Updated weights for policy 1, policy_version 82540 (0.0007) +[2023-10-08 15:03:37,959][102898] Updated weights for policy 1, policy_version 82550 (0.0007) +[2023-10-08 15:03:38,314][102898] Updated weights for policy 1, policy_version 82560 (0.0007) +[2023-10-08 15:03:39,782][102897] Updated weights for policy 0, policy_version 82440 (0.0007) +[2023-10-08 15:03:40,148][102897] Updated weights for policy 0, policy_version 82450 (0.0008) +[2023-10-08 15:03:40,513][102897] Updated weights for policy 0, policy_version 82460 (0.0008) +[2023-10-08 15:03:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 168984576. Throughput: 0: 1798.4, 1: 1794.0. Samples: 42254450. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:41,876][101941] Avg episode reward: [(0, '8.730'), (1, '13.570')] +[2023-10-08 15:03:42,134][102898] Updated weights for policy 1, policy_version 82570 (0.0008) +[2023-10-08 15:03:42,493][102898] Updated weights for policy 1, policy_version 82580 (0.0009) +[2023-10-08 15:03:42,867][102898] Updated weights for policy 1, policy_version 82590 (0.0010) +[2023-10-08 15:03:44,222][102897] Updated weights for policy 0, policy_version 82470 (0.0009) +[2023-10-08 15:03:44,604][102897] Updated weights for policy 0, policy_version 82480 (0.0010) +[2023-10-08 15:03:44,982][102897] Updated weights for policy 0, policy_version 82490 (0.0011) +[2023-10-08 15:03:46,548][102898] Updated weights for policy 1, policy_version 82600 (0.0009) +[2023-10-08 15:03:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 169050112. Throughput: 0: 1786.1, 1: 1812.3. Samples: 42276346. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:46,876][101941] Avg episode reward: [(0, '8.780'), (1, '12.750')] +[2023-10-08 15:03:46,919][102898] Updated weights for policy 1, policy_version 82610 (0.0010) +[2023-10-08 15:03:47,282][102898] Updated weights for policy 1, policy_version 82620 (0.0009) +[2023-10-08 15:03:48,764][102897] Updated weights for policy 0, policy_version 82500 (0.0009) +[2023-10-08 15:03:49,136][102897] Updated weights for policy 0, policy_version 82510 (0.0007) +[2023-10-08 15:03:49,497][102897] Updated weights for policy 0, policy_version 82520 (0.0008) +[2023-10-08 15:03:51,212][102898] Updated weights for policy 1, policy_version 82630 (0.0008) +[2023-10-08 15:03:51,577][102898] Updated weights for policy 1, policy_version 82640 (0.0009) +[2023-10-08 15:03:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 169115648. Throughput: 0: 1794.3, 1: 1786.9. Samples: 42286592. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:51,876][101941] Avg episode reward: [(0, '9.670'), (1, '13.230')] +[2023-10-08 15:03:51,950][102898] Updated weights for policy 1, policy_version 82650 (0.0009) +[2023-10-08 15:03:53,363][102897] Updated weights for policy 0, policy_version 82530 (0.0011) +[2023-10-08 15:03:53,733][102897] Updated weights for policy 0, policy_version 82540 (0.0008) +[2023-10-08 15:03:54,097][102897] Updated weights for policy 0, policy_version 82550 (0.0011) +[2023-10-08 15:03:54,468][102897] Updated weights for policy 0, policy_version 82560 (0.0010) +[2023-10-08 15:03:55,511][102898] Updated weights for policy 1, policy_version 82660 (0.0009) +[2023-10-08 15:03:55,881][102898] Updated weights for policy 1, policy_version 82670 (0.0007) +[2023-10-08 15:03:56,250][102898] Updated weights for policy 1, policy_version 82680 (0.0009) +[2023-10-08 15:03:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 169213952. Throughput: 0: 1780.8, 1: 1811.0. Samples: 42308492. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:03:56,876][101941] Avg episode reward: [(0, '9.510'), (1, '12.490')] +[2023-10-08 15:03:58,458][102897] Updated weights for policy 0, policy_version 82570 (0.0010) +[2023-10-08 15:03:58,835][102897] Updated weights for policy 0, policy_version 82580 (0.0009) +[2023-10-08 15:03:59,210][102897] Updated weights for policy 0, policy_version 82590 (0.0009) +[2023-10-08 15:03:59,943][102898] Updated weights for policy 1, policy_version 82690 (0.0008) +[2023-10-08 15:04:00,315][102898] Updated weights for policy 1, policy_version 82700 (0.0008) +[2023-10-08 15:04:00,672][102898] Updated weights for policy 1, policy_version 82710 (0.0007) +[2023-10-08 15:04:01,034][102898] Updated weights for policy 1, policy_version 82720 (0.0007) +[2023-10-08 15:04:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 169279488. Throughput: 0: 1785.0, 1: 1792.9. Samples: 42329806. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:01,876][101941] Avg episode reward: [(0, '8.690'), (1, '13.000')] +[2023-10-08 15:04:02,849][102897] Updated weights for policy 0, policy_version 82600 (0.0010) +[2023-10-08 15:04:03,210][102897] Updated weights for policy 0, policy_version 82610 (0.0010) +[2023-10-08 15:04:03,587][102897] Updated weights for policy 0, policy_version 82620 (0.0007) +[2023-10-08 15:04:04,583][102898] Updated weights for policy 1, policy_version 82730 (0.0011) +[2023-10-08 15:04:04,950][102898] Updated weights for policy 1, policy_version 82740 (0.0010) +[2023-10-08 15:04:05,326][102898] Updated weights for policy 1, policy_version 82750 (0.0010) +[2023-10-08 15:04:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 169345024. Throughput: 0: 1781.6, 1: 1805.0. Samples: 42340640. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:06,876][101941] Avg episode reward: [(0, '8.050'), (1, '13.040')] +[2023-10-08 15:04:07,529][102897] Updated weights for policy 0, policy_version 82630 (0.0007) +[2023-10-08 15:04:07,906][102897] Updated weights for policy 0, policy_version 82640 (0.0007) +[2023-10-08 15:04:08,280][102897] Updated weights for policy 0, policy_version 82650 (0.0010) +[2023-10-08 15:04:09,095][102898] Updated weights for policy 1, policy_version 82760 (0.0008) +[2023-10-08 15:04:09,467][102898] Updated weights for policy 1, policy_version 82770 (0.0008) +[2023-10-08 15:04:09,824][102898] Updated weights for policy 1, policy_version 82780 (0.0007) +[2023-10-08 15:04:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 169410560. Throughput: 0: 1785.4, 1: 1801.7. Samples: 42362082. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:11,876][101941] Avg episode reward: [(0, '8.140'), (1, '13.180')] +[2023-10-08 15:04:11,911][102897] Updated weights for policy 0, policy_version 82660 (0.0008) +[2023-10-08 15:04:12,287][102897] Updated weights for policy 0, policy_version 82670 (0.0009) +[2023-10-08 15:04:12,645][102897] Updated weights for policy 0, policy_version 82680 (0.0009) +[2023-10-08 15:04:13,803][102898] Updated weights for policy 1, policy_version 82790 (0.0009) +[2023-10-08 15:04:14,164][102898] Updated weights for policy 1, policy_version 82800 (0.0010) +[2023-10-08 15:04:14,535][102898] Updated weights for policy 1, policy_version 82810 (0.0010) +[2023-10-08 15:04:16,357][102897] Updated weights for policy 0, policy_version 82690 (0.0008) +[2023-10-08 15:04:16,734][102897] Updated weights for policy 0, policy_version 82700 (0.0007) +[2023-10-08 15:04:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 169476096. Throughput: 0: 1812.9, 1: 1788.2. Samples: 42384198. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:16,876][101941] Avg episode reward: [(0, '8.210'), (1, '12.490')] +[2023-10-08 15:04:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000082816_84803584.pth... +[2023-10-08 15:04:16,916][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000081152_83099648.pth +[2023-10-08 15:04:17,104][102897] Updated weights for policy 0, policy_version 82710 (0.0007) +[2023-10-08 15:04:17,464][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000082720_84705280.pth... +[2023-10-08 15:04:17,468][102897] Updated weights for policy 0, policy_version 82720 (0.0007) +[2023-10-08 15:04:17,502][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000081024_82968576.pth +[2023-10-08 15:04:18,479][102898] Updated weights for policy 1, policy_version 82820 (0.0010) +[2023-10-08 15:04:18,846][102898] Updated weights for policy 1, policy_version 82830 (0.0007) +[2023-10-08 15:04:19,207][102898] Updated weights for policy 1, policy_version 82840 (0.0009) +[2023-10-08 15:04:21,010][102897] Updated weights for policy 0, policy_version 82730 (0.0007) +[2023-10-08 15:04:21,386][102897] Updated weights for policy 0, policy_version 82740 (0.0008) +[2023-10-08 15:04:21,753][102897] Updated weights for policy 0, policy_version 82750 (0.0008) +[2023-10-08 15:04:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 169574400. Throughput: 0: 1791.9, 1: 1789.1. Samples: 42394264. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:21,876][101941] Avg episode reward: [(0, '8.500'), (1, '12.860')] +[2023-10-08 15:04:22,948][102898] Updated weights for policy 1, policy_version 82850 (0.0010) +[2023-10-08 15:04:23,314][102898] Updated weights for policy 1, policy_version 82860 (0.0008) +[2023-10-08 15:04:23,688][102898] Updated weights for policy 1, policy_version 82870 (0.0007) +[2023-10-08 15:04:24,053][102898] Updated weights for policy 1, policy_version 82880 (0.0007) +[2023-10-08 15:04:25,546][102897] Updated weights for policy 0, policy_version 82760 (0.0010) +[2023-10-08 15:04:25,913][102897] Updated weights for policy 0, policy_version 82770 (0.0009) +[2023-10-08 15:04:26,283][102897] Updated weights for policy 0, policy_version 82780 (0.0011) +[2023-10-08 15:04:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 169639936. Throughput: 0: 1803.6, 1: 1786.3. Samples: 42415994. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:26,876][101941] Avg episode reward: [(0, '8.840'), (1, '13.180')] +[2023-10-08 15:04:27,790][102898] Updated weights for policy 1, policy_version 82890 (0.0008) +[2023-10-08 15:04:28,156][102898] Updated weights for policy 1, policy_version 82900 (0.0009) +[2023-10-08 15:04:28,527][102898] Updated weights for policy 1, policy_version 82910 (0.0008) +[2023-10-08 15:04:30,198][102897] Updated weights for policy 0, policy_version 82790 (0.0010) +[2023-10-08 15:04:30,575][102897] Updated weights for policy 0, policy_version 82800 (0.0008) +[2023-10-08 15:04:30,949][102897] Updated weights for policy 0, policy_version 82810 (0.0008) +[2023-10-08 15:04:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 169705472. Throughput: 0: 1781.2, 1: 1786.4. Samples: 42436888. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:31,876][101941] Avg episode reward: [(0, '8.740'), (1, '13.860')] +[2023-10-08 15:04:32,377][102898] Updated weights for policy 1, policy_version 82920 (0.0008) +[2023-10-08 15:04:32,749][102898] Updated weights for policy 1, policy_version 82930 (0.0009) +[2023-10-08 15:04:33,120][102898] Updated weights for policy 1, policy_version 82940 (0.0008) +[2023-10-08 15:04:34,663][102897] Updated weights for policy 0, policy_version 82820 (0.0007) +[2023-10-08 15:04:35,031][102897] Updated weights for policy 0, policy_version 82830 (0.0008) +[2023-10-08 15:04:35,405][102897] Updated weights for policy 0, policy_version 82840 (0.0007) +[2023-10-08 15:04:36,837][102898] Updated weights for policy 1, policy_version 82950 (0.0008) +[2023-10-08 15:04:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 169771008. Throughput: 0: 1806.4, 1: 1783.0. Samples: 42448114. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:36,876][101941] Avg episode reward: [(0, '9.100'), (1, '13.950')] +[2023-10-08 15:04:37,197][102898] Updated weights for policy 1, policy_version 82960 (0.0007) +[2023-10-08 15:04:37,561][102898] Updated weights for policy 1, policy_version 82970 (0.0007) +[2023-10-08 15:04:37,780][102760] Saving new best policy, reward=13.950! +[2023-10-08 15:04:39,018][102897] Updated weights for policy 0, policy_version 82850 (0.0008) +[2023-10-08 15:04:39,382][102897] Updated weights for policy 0, policy_version 82860 (0.0008) +[2023-10-08 15:04:39,745][102897] Updated weights for policy 0, policy_version 82870 (0.0008) +[2023-10-08 15:04:40,112][102897] Updated weights for policy 0, policy_version 82880 (0.0009) +[2023-10-08 15:04:41,496][102898] Updated weights for policy 1, policy_version 82980 (0.0008) +[2023-10-08 15:04:41,871][102898] Updated weights for policy 1, policy_version 82990 (0.0010) +[2023-10-08 15:04:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 169836544. Throughput: 0: 1791.2, 1: 1774.3. Samples: 42468938. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:41,876][101941] Avg episode reward: [(0, '8.900'), (1, '13.580')] +[2023-10-08 15:04:42,241][102898] Updated weights for policy 1, policy_version 83000 (0.0008) +[2023-10-08 15:04:43,967][102897] Updated weights for policy 0, policy_version 82890 (0.0009) +[2023-10-08 15:04:44,332][102897] Updated weights for policy 0, policy_version 82900 (0.0009) +[2023-10-08 15:04:44,704][102897] Updated weights for policy 0, policy_version 82910 (0.0010) +[2023-10-08 15:04:46,005][102898] Updated weights for policy 1, policy_version 83010 (0.0007) +[2023-10-08 15:04:46,367][102898] Updated weights for policy 1, policy_version 83020 (0.0007) +[2023-10-08 15:04:46,739][102898] Updated weights for policy 1, policy_version 83030 (0.0007) +[2023-10-08 15:04:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 169902080. Throughput: 0: 1784.8, 1: 1785.3. Samples: 42490460. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:46,876][101941] Avg episode reward: [(0, '8.300'), (1, '12.650')] +[2023-10-08 15:04:47,097][102898] Updated weights for policy 1, policy_version 83040 (0.0009) +[2023-10-08 15:04:48,509][102897] Updated weights for policy 0, policy_version 82920 (0.0008) +[2023-10-08 15:04:48,887][102897] Updated weights for policy 0, policy_version 82930 (0.0008) +[2023-10-08 15:04:49,259][102897] Updated weights for policy 0, policy_version 82940 (0.0007) +[2023-10-08 15:04:50,887][102898] Updated weights for policy 1, policy_version 83050 (0.0008) +[2023-10-08 15:04:51,250][102898] Updated weights for policy 1, policy_version 83060 (0.0008) +[2023-10-08 15:04:51,612][102898] Updated weights for policy 1, policy_version 83070 (0.0009) +[2023-10-08 15:04:51,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 170000384. Throughput: 0: 1787.9, 1: 1770.2. Samples: 42500752. Policy #0 lag: (min: 14.0, avg: 14.4, max: 28.0) +[2023-10-08 15:04:51,875][101941] Avg episode reward: [(0, '8.630'), (1, '12.990')] +[2023-10-08 15:04:53,078][102897] Updated weights for policy 0, policy_version 82950 (0.0007) +[2023-10-08 15:04:53,458][102897] Updated weights for policy 0, policy_version 82960 (0.0010) +[2023-10-08 15:04:53,834][102897] Updated weights for policy 0, policy_version 82970 (0.0007) +[2023-10-08 15:04:55,325][102898] Updated weights for policy 1, policy_version 83080 (0.0009) +[2023-10-08 15:04:55,688][102898] Updated weights for policy 1, policy_version 83090 (0.0010) +[2023-10-08 15:04:56,058][102898] Updated weights for policy 1, policy_version 83100 (0.0010) +[2023-10-08 15:04:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 170065920. Throughput: 0: 1781.6, 1: 1788.6. Samples: 42522742. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:04:56,876][101941] Avg episode reward: [(0, '8.810'), (1, '11.740')] +[2023-10-08 15:04:57,699][102897] Updated weights for policy 0, policy_version 82980 (0.0007) +[2023-10-08 15:04:58,064][102897] Updated weights for policy 0, policy_version 82990 (0.0009) +[2023-10-08 15:04:58,434][102897] Updated weights for policy 0, policy_version 83000 (0.0008) +[2023-10-08 15:04:59,778][102898] Updated weights for policy 1, policy_version 83110 (0.0009) +[2023-10-08 15:05:00,145][102898] Updated weights for policy 1, policy_version 83120 (0.0010) +[2023-10-08 15:05:00,510][102898] Updated weights for policy 1, policy_version 83130 (0.0007) +[2023-10-08 15:05:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 170131456. Throughput: 0: 1777.0, 1: 1775.7. Samples: 42544068. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:01,875][101941] Avg episode reward: [(0, '8.870'), (1, '12.480')] +[2023-10-08 15:05:02,217][102897] Updated weights for policy 0, policy_version 83010 (0.0007) +[2023-10-08 15:05:02,584][102897] Updated weights for policy 0, policy_version 83020 (0.0011) +[2023-10-08 15:05:02,956][102897] Updated weights for policy 0, policy_version 83030 (0.0009) +[2023-10-08 15:05:03,314][102897] Updated weights for policy 0, policy_version 83040 (0.0008) +[2023-10-08 15:05:04,183][102898] Updated weights for policy 1, policy_version 83140 (0.0008) +[2023-10-08 15:05:04,552][102898] Updated weights for policy 1, policy_version 83150 (0.0007) +[2023-10-08 15:05:04,920][102898] Updated weights for policy 1, policy_version 83160 (0.0008) +[2023-10-08 15:05:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 170196992. Throughput: 0: 1768.4, 1: 1796.7. Samples: 42554698. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:06,876][101941] Avg episode reward: [(0, '8.570'), (1, '12.220')] +[2023-10-08 15:05:07,127][102897] Updated weights for policy 0, policy_version 83050 (0.0010) +[2023-10-08 15:05:07,495][102897] Updated weights for policy 0, policy_version 83060 (0.0009) +[2023-10-08 15:05:07,862][102897] Updated weights for policy 0, policy_version 83070 (0.0007) +[2023-10-08 15:05:08,606][102898] Updated weights for policy 1, policy_version 83170 (0.0009) +[2023-10-08 15:05:08,978][102898] Updated weights for policy 1, policy_version 83180 (0.0008) +[2023-10-08 15:05:09,343][102898] Updated weights for policy 1, policy_version 83190 (0.0009) +[2023-10-08 15:05:09,705][102898] Updated weights for policy 1, policy_version 83200 (0.0008) +[2023-10-08 15:05:11,517][102897] Updated weights for policy 0, policy_version 83080 (0.0009) +[2023-10-08 15:05:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 170262528. Throughput: 0: 1781.3, 1: 1784.1. Samples: 42576436. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:11,876][101941] Avg episode reward: [(0, '8.630'), (1, '13.970')] +[2023-10-08 15:05:11,877][102760] Saving new best policy, reward=13.970! +[2023-10-08 15:05:11,879][102897] Updated weights for policy 0, policy_version 83090 (0.0010) +[2023-10-08 15:05:12,253][102897] Updated weights for policy 0, policy_version 83100 (0.0009) +[2023-10-08 15:05:13,432][102898] Updated weights for policy 1, policy_version 83210 (0.0007) +[2023-10-08 15:05:13,794][102898] Updated weights for policy 1, policy_version 83220 (0.0008) +[2023-10-08 15:05:14,168][102898] Updated weights for policy 1, policy_version 83230 (0.0008) +[2023-10-08 15:05:16,090][102897] Updated weights for policy 0, policy_version 83110 (0.0008) +[2023-10-08 15:05:16,464][102897] Updated weights for policy 0, policy_version 83120 (0.0007) +[2023-10-08 15:05:16,831][102897] Updated weights for policy 0, policy_version 83130 (0.0007) +[2023-10-08 15:05:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 170328064. Throughput: 0: 1798.8, 1: 1784.8. Samples: 42598152. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:16,876][101941] Avg episode reward: [(0, '8.680'), (1, '13.150')] +[2023-10-08 15:05:17,992][102898] Updated weights for policy 1, policy_version 83240 (0.0007) +[2023-10-08 15:05:18,355][102898] Updated weights for policy 1, policy_version 83250 (0.0008) +[2023-10-08 15:05:18,723][102898] Updated weights for policy 1, policy_version 83260 (0.0009) +[2023-10-08 15:05:20,633][102897] Updated weights for policy 0, policy_version 83140 (0.0009) +[2023-10-08 15:05:21,007][102897] Updated weights for policy 0, policy_version 83150 (0.0009) +[2023-10-08 15:05:21,375][102897] Updated weights for policy 0, policy_version 83160 (0.0008) +[2023-10-08 15:05:21,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 170426368. Throughput: 0: 1776.9, 1: 1791.2. Samples: 42608680. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:21,876][101941] Avg episode reward: [(0, '8.580'), (1, '13.450')] +[2023-10-08 15:05:22,596][102898] Updated weights for policy 1, policy_version 83270 (0.0009) +[2023-10-08 15:05:22,957][102898] Updated weights for policy 1, policy_version 83280 (0.0007) +[2023-10-08 15:05:23,327][102898] Updated weights for policy 1, policy_version 83290 (0.0008) +[2023-10-08 15:05:25,156][102897] Updated weights for policy 0, policy_version 83170 (0.0009) +[2023-10-08 15:05:25,514][102897] Updated weights for policy 0, policy_version 83180 (0.0010) +[2023-10-08 15:05:25,886][102897] Updated weights for policy 0, policy_version 83190 (0.0010) +[2023-10-08 15:05:26,248][102897] Updated weights for policy 0, policy_version 83200 (0.0010) +[2023-10-08 15:05:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 170491904. Throughput: 0: 1794.9, 1: 1792.9. Samples: 42630390. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:26,876][101941] Avg episode reward: [(0, '8.840'), (1, '12.860')] +[2023-10-08 15:05:26,962][102898] Updated weights for policy 1, policy_version 83300 (0.0009) +[2023-10-08 15:05:27,323][102898] Updated weights for policy 1, policy_version 83310 (0.0009) +[2023-10-08 15:05:27,691][102898] Updated weights for policy 1, policy_version 83320 (0.0008) +[2023-10-08 15:05:30,162][102897] Updated weights for policy 0, policy_version 83210 (0.0009) +[2023-10-08 15:05:30,538][102897] Updated weights for policy 0, policy_version 83220 (0.0007) +[2023-10-08 15:05:30,908][102897] Updated weights for policy 0, policy_version 83230 (0.0007) +[2023-10-08 15:05:31,346][102898] Updated weights for policy 1, policy_version 83330 (0.0008) +[2023-10-08 15:05:31,720][102898] Updated weights for policy 1, policy_version 83340 (0.0010) +[2023-10-08 15:05:31,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 170557440. Throughput: 0: 1766.8, 1: 1808.4. Samples: 42651340. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:31,876][101941] Avg episode reward: [(0, '8.470'), (1, '13.320')] +[2023-10-08 15:05:32,078][102898] Updated weights for policy 1, policy_version 83350 (0.0010) +[2023-10-08 15:05:32,444][102898] Updated weights for policy 1, policy_version 83360 (0.0010) +[2023-10-08 15:05:34,408][102897] Updated weights for policy 0, policy_version 83240 (0.0010) +[2023-10-08 15:05:34,790][102897] Updated weights for policy 0, policy_version 83250 (0.0007) +[2023-10-08 15:05:35,157][102897] Updated weights for policy 0, policy_version 83260 (0.0007) +[2023-10-08 15:05:36,362][102898] Updated weights for policy 1, policy_version 83370 (0.0007) +[2023-10-08 15:05:36,731][102898] Updated weights for policy 1, policy_version 83380 (0.0007) +[2023-10-08 15:05:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 170622976. Throughput: 0: 1796.6, 1: 1799.9. Samples: 42662596. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:36,875][101941] Avg episode reward: [(0, '8.170'), (1, '13.350')] +[2023-10-08 15:05:37,104][102898] Updated weights for policy 1, policy_version 83390 (0.0009) +[2023-10-08 15:05:38,939][102897] Updated weights for policy 0, policy_version 83270 (0.0010) +[2023-10-08 15:05:39,300][102897] Updated weights for policy 0, policy_version 83280 (0.0011) +[2023-10-08 15:05:39,667][102897] Updated weights for policy 0, policy_version 83290 (0.0009) +[2023-10-08 15:05:41,007][102898] Updated weights for policy 1, policy_version 83400 (0.0007) +[2023-10-08 15:05:41,380][102898] Updated weights for policy 1, policy_version 83410 (0.0009) +[2023-10-08 15:05:41,754][102898] Updated weights for policy 1, policy_version 83420 (0.0008) +[2023-10-08 15:05:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 170688512. Throughput: 0: 1772.3, 1: 1802.0. Samples: 42683584. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:41,875][101941] Avg episode reward: [(0, '8.280'), (1, '13.800')] +[2023-10-08 15:05:43,562][102897] Updated weights for policy 0, policy_version 83300 (0.0007) +[2023-10-08 15:05:43,933][102897] Updated weights for policy 0, policy_version 83310 (0.0008) +[2023-10-08 15:05:44,308][102897] Updated weights for policy 0, policy_version 83320 (0.0007) +[2023-10-08 15:05:45,574][102898] Updated weights for policy 1, policy_version 83430 (0.0009) +[2023-10-08 15:05:45,929][102898] Updated weights for policy 1, policy_version 83440 (0.0008) +[2023-10-08 15:05:46,295][102898] Updated weights for policy 1, policy_version 83450 (0.0010) +[2023-10-08 15:05:46,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 170786816. Throughput: 0: 1774.6, 1: 1794.7. Samples: 42704686. Policy #0 lag: (min: 9.0, avg: 27.5, max: 41.0) +[2023-10-08 15:05:46,876][101941] Avg episode reward: [(0, '9.010'), (1, '13.200')] +[2023-10-08 15:05:47,990][102897] Updated weights for policy 0, policy_version 83330 (0.0008) +[2023-10-08 15:05:48,351][102897] Updated weights for policy 0, policy_version 83340 (0.0010) +[2023-10-08 15:05:48,725][102897] Updated weights for policy 0, policy_version 83350 (0.0010) +[2023-10-08 15:05:49,104][102897] Updated weights for policy 0, policy_version 83360 (0.0007) +[2023-10-08 15:05:49,917][102898] Updated weights for policy 1, policy_version 83460 (0.0009) +[2023-10-08 15:05:50,291][102898] Updated weights for policy 1, policy_version 83470 (0.0010) +[2023-10-08 15:05:50,652][102898] Updated weights for policy 1, policy_version 83480 (0.0011) +[2023-10-08 15:05:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 170852352. Throughput: 0: 1777.1, 1: 1801.5. Samples: 42715734. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:05:51,876][101941] Avg episode reward: [(0, '9.500'), (1, '12.620')] +[2023-10-08 15:05:52,991][102897] Updated weights for policy 0, policy_version 83370 (0.0008) +[2023-10-08 15:05:53,363][102897] Updated weights for policy 0, policy_version 83380 (0.0009) +[2023-10-08 15:05:53,744][102897] Updated weights for policy 0, policy_version 83390 (0.0010) +[2023-10-08 15:05:54,400][102898] Updated weights for policy 1, policy_version 83490 (0.0008) +[2023-10-08 15:05:54,763][102898] Updated weights for policy 1, policy_version 83500 (0.0007) +[2023-10-08 15:05:55,136][102898] Updated weights for policy 1, policy_version 83510 (0.0009) +[2023-10-08 15:05:55,499][102898] Updated weights for policy 1, policy_version 83520 (0.0010) +[2023-10-08 15:05:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 170917888. Throughput: 0: 1779.2, 1: 1794.3. Samples: 42737244. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:05:56,876][101941] Avg episode reward: [(0, '9.360'), (1, '12.980')] +[2023-10-08 15:05:57,453][102897] Updated weights for policy 0, policy_version 83400 (0.0010) +[2023-10-08 15:05:57,823][102897] Updated weights for policy 0, policy_version 83410 (0.0011) +[2023-10-08 15:05:58,193][102897] Updated weights for policy 0, policy_version 83420 (0.0010) +[2023-10-08 15:05:59,279][102898] Updated weights for policy 1, policy_version 83530 (0.0009) +[2023-10-08 15:05:59,656][102898] Updated weights for policy 1, policy_version 83540 (0.0009) +[2023-10-08 15:06:00,030][102898] Updated weights for policy 1, policy_version 83550 (0.0007) +[2023-10-08 15:06:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 170983424. Throughput: 0: 1794.5, 1: 1792.6. Samples: 42759570. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:01,876][101941] Avg episode reward: [(0, '9.370'), (1, '13.380')] +[2023-10-08 15:06:01,908][102897] Updated weights for policy 0, policy_version 83430 (0.0008) +[2023-10-08 15:06:02,283][102897] Updated weights for policy 0, policy_version 83440 (0.0008) +[2023-10-08 15:06:02,657][102897] Updated weights for policy 0, policy_version 83450 (0.0009) +[2023-10-08 15:06:03,858][102898] Updated weights for policy 1, policy_version 83560 (0.0008) +[2023-10-08 15:06:04,235][102898] Updated weights for policy 1, policy_version 83570 (0.0008) +[2023-10-08 15:06:04,599][102898] Updated weights for policy 1, policy_version 83580 (0.0008) +[2023-10-08 15:06:06,267][102897] Updated weights for policy 0, policy_version 83460 (0.0008) +[2023-10-08 15:06:06,638][102897] Updated weights for policy 0, policy_version 83470 (0.0007) +[2023-10-08 15:06:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 171048960. Throughput: 0: 1779.3, 1: 1798.0. Samples: 42769662. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:06,876][101941] Avg episode reward: [(0, '9.120'), (1, '14.140')] +[2023-10-08 15:06:06,878][102760] Saving new best policy, reward=14.140! +[2023-10-08 15:06:07,010][102897] Updated weights for policy 0, policy_version 83480 (0.0008) +[2023-10-08 15:06:08,380][102898] Updated weights for policy 1, policy_version 83590 (0.0009) +[2023-10-08 15:06:08,743][102898] Updated weights for policy 1, policy_version 83600 (0.0010) +[2023-10-08 15:06:09,110][102898] Updated weights for policy 1, policy_version 83610 (0.0009) +[2023-10-08 15:06:10,781][102897] Updated weights for policy 0, policy_version 83490 (0.0007) +[2023-10-08 15:06:11,160][102897] Updated weights for policy 0, policy_version 83500 (0.0010) +[2023-10-08 15:06:11,523][102897] Updated weights for policy 0, policy_version 83510 (0.0008) +[2023-10-08 15:06:11,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 171114496. Throughput: 0: 1795.5, 1: 1791.2. Samples: 42791794. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:11,876][101941] Avg episode reward: [(0, '9.060'), (1, '13.370')] +[2023-10-08 15:06:11,882][102897] Updated weights for policy 0, policy_version 83520 (0.0007) +[2023-10-08 15:06:12,870][102898] Updated weights for policy 1, policy_version 83620 (0.0009) +[2023-10-08 15:06:13,237][102898] Updated weights for policy 1, policy_version 83630 (0.0010) +[2023-10-08 15:06:13,602][102898] Updated weights for policy 1, policy_version 83640 (0.0010) +[2023-10-08 15:06:15,993][102897] Updated weights for policy 0, policy_version 83530 (0.0009) +[2023-10-08 15:06:16,366][102897] Updated weights for policy 0, policy_version 83540 (0.0007) +[2023-10-08 15:06:16,732][102897] Updated weights for policy 0, policy_version 83550 (0.0007) +[2023-10-08 15:06:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 171212800. Throughput: 0: 1801.5, 1: 1791.0. Samples: 42813000. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:16,876][101941] Avg episode reward: [(0, '8.440'), (1, '13.420')] +[2023-10-08 15:06:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000083552_85557248.pth... +[2023-10-08 15:06:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000083648_85655552.pth... +[2023-10-08 15:06:16,918][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000081856_83820544.pth +[2023-10-08 15:06:16,922][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000083552_85557248.pth +[2023-10-08 15:06:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000081984_83951616.pth +[2023-10-08 15:06:16,927][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000083648_85655552.pth +[2023-10-08 15:06:17,304][102898] Updated weights for policy 1, policy_version 83650 (0.0010) +[2023-10-08 15:06:17,676][102898] Updated weights for policy 1, policy_version 83660 (0.0007) +[2023-10-08 15:06:18,041][102898] Updated weights for policy 1, policy_version 83670 (0.0008) +[2023-10-08 15:06:18,405][102898] Updated weights for policy 1, policy_version 83680 (0.0009) +[2023-10-08 15:06:20,289][102897] Updated weights for policy 0, policy_version 83560 (0.0008) +[2023-10-08 15:06:20,657][102897] Updated weights for policy 0, policy_version 83570 (0.0010) +[2023-10-08 15:06:21,032][102897] Updated weights for policy 0, policy_version 83580 (0.0010) +[2023-10-08 15:06:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 171278336. Throughput: 0: 1794.8, 1: 1785.6. Samples: 42823716. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:21,876][101941] Avg episode reward: [(0, '8.040'), (1, '13.650')] +[2023-10-08 15:06:22,225][102898] Updated weights for policy 1, policy_version 83690 (0.0008) +[2023-10-08 15:06:22,586][102898] Updated weights for policy 1, policy_version 83700 (0.0009) +[2023-10-08 15:06:22,946][102898] Updated weights for policy 1, policy_version 83710 (0.0007) +[2023-10-08 15:06:24,781][102897] Updated weights for policy 0, policy_version 83590 (0.0009) +[2023-10-08 15:06:25,143][102897] Updated weights for policy 0, policy_version 83600 (0.0008) +[2023-10-08 15:06:25,518][102897] Updated weights for policy 0, policy_version 83610 (0.0008) +[2023-10-08 15:06:26,678][102898] Updated weights for policy 1, policy_version 83720 (0.0007) +[2023-10-08 15:06:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 171343872. Throughput: 0: 1799.9, 1: 1789.7. Samples: 42845118. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:26,875][101941] Avg episode reward: [(0, '8.390'), (1, '14.010')] +[2023-10-08 15:06:27,052][102898] Updated weights for policy 1, policy_version 83730 (0.0008) +[2023-10-08 15:06:27,422][102898] Updated weights for policy 1, policy_version 83740 (0.0009) +[2023-10-08 15:06:29,315][102897] Updated weights for policy 0, policy_version 83620 (0.0007) +[2023-10-08 15:06:29,682][102897] Updated weights for policy 0, policy_version 83630 (0.0007) +[2023-10-08 15:06:30,062][102897] Updated weights for policy 0, policy_version 83640 (0.0009) +[2023-10-08 15:06:31,287][102898] Updated weights for policy 1, policy_version 83750 (0.0008) +[2023-10-08 15:06:31,653][102898] Updated weights for policy 1, policy_version 83760 (0.0008) +[2023-10-08 15:06:32,313][101941] Fps is (10 sec: 12556.8, 60 sec: 14096.5, 300 sec: 14307.8). Total num frames: 171409408. Throughput: 0: 1772.8, 1: 1788.7. Samples: 42866516. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:32,315][101941] Avg episode reward: [(0, '8.300'), (1, '12.720')] +[2023-10-08 15:06:33,024][102898] Updated weights for policy 1, policy_version 83770 (0.0008) +[2023-10-08 15:06:34,768][102897] Updated weights for policy 0, policy_version 83650 (0.0010) +[2023-10-08 15:06:35,141][102897] Updated weights for policy 0, policy_version 83660 (0.0007) +[2023-10-08 15:06:35,519][102897] Updated weights for policy 0, policy_version 83670 (0.0009) +[2023-10-08 15:06:35,897][102897] Updated weights for policy 0, policy_version 83680 (0.0007) +[2023-10-08 15:06:36,825][102898] Updated weights for policy 1, policy_version 83780 (0.0007) +[2023-10-08 15:06:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 171474944. Throughput: 0: 1780.6, 1: 1737.7. Samples: 42874058. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:36,876][101941] Avg episode reward: [(0, '8.420'), (1, '12.400')] +[2023-10-08 15:06:37,245][102898] Updated weights for policy 1, policy_version 83790 (0.0009) +[2023-10-08 15:06:37,612][102898] Updated weights for policy 1, policy_version 83800 (0.0010) +[2023-10-08 15:06:39,828][102897] Updated weights for policy 0, policy_version 83690 (0.0012) +[2023-10-08 15:06:40,201][102897] Updated weights for policy 0, policy_version 83700 (0.0009) +[2023-10-08 15:06:40,562][102897] Updated weights for policy 0, policy_version 83710 (0.0008) +[2023-10-08 15:06:41,283][102898] Updated weights for policy 1, policy_version 83810 (0.0008) +[2023-10-08 15:06:41,648][102898] Updated weights for policy 1, policy_version 83820 (0.0007) +[2023-10-08 15:06:41,875][101941] Fps is (10 sec: 13708.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 171540480. Throughput: 0: 1743.0, 1: 1764.2. Samples: 42895068. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:06:41,876][101941] Avg episode reward: [(0, '8.280'), (1, '11.650')] +[2023-10-08 15:06:42,022][102898] Updated weights for policy 1, policy_version 83830 (0.0008) +[2023-10-08 15:06:42,387][102898] Updated weights for policy 1, policy_version 83840 (0.0009) +[2023-10-08 15:06:44,281][102897] Updated weights for policy 0, policy_version 83720 (0.0008) +[2023-10-08 15:06:44,657][102897] Updated weights for policy 0, policy_version 83730 (0.0010) +[2023-10-08 15:06:45,035][102897] Updated weights for policy 0, policy_version 83740 (0.0010) +[2023-10-08 15:06:46,317][102898] Updated weights for policy 1, policy_version 83850 (0.0007) +[2023-10-08 15:06:46,673][102898] Updated weights for policy 1, policy_version 83860 (0.0009) +[2023-10-08 15:06:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 171606016. Throughput: 0: 1735.1, 1: 1751.5. Samples: 42916470. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:06:46,876][101941] Avg episode reward: [(0, '8.400'), (1, '13.080')] +[2023-10-08 15:06:47,041][102898] Updated weights for policy 1, policy_version 83870 (0.0007) +[2023-10-08 15:06:48,854][102897] Updated weights for policy 0, policy_version 83750 (0.0009) +[2023-10-08 15:06:49,234][102897] Updated weights for policy 0, policy_version 83760 (0.0008) +[2023-10-08 15:06:49,594][102897] Updated weights for policy 0, policy_version 83770 (0.0010) +[2023-10-08 15:06:50,663][102898] Updated weights for policy 1, policy_version 83880 (0.0010) +[2023-10-08 15:06:51,033][102898] Updated weights for policy 1, policy_version 83890 (0.0010) +[2023-10-08 15:06:51,406][102898] Updated weights for policy 1, policy_version 83900 (0.0010) +[2023-10-08 15:06:51,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 171704320. Throughput: 0: 1750.3, 1: 1757.0. Samples: 42927490. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:06:51,876][101941] Avg episode reward: [(0, '8.600'), (1, '13.000')] +[2023-10-08 15:06:53,384][102897] Updated weights for policy 0, policy_version 83780 (0.0008) +[2023-10-08 15:06:53,761][102897] Updated weights for policy 0, policy_version 83790 (0.0008) +[2023-10-08 15:06:54,125][102897] Updated weights for policy 0, policy_version 83800 (0.0008) +[2023-10-08 15:06:55,253][102898] Updated weights for policy 1, policy_version 83910 (0.0008) +[2023-10-08 15:06:55,622][102898] Updated weights for policy 1, policy_version 83920 (0.0010) +[2023-10-08 15:06:55,976][102898] Updated weights for policy 1, policy_version 83930 (0.0009) +[2023-10-08 15:06:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 171769856. Throughput: 0: 1734.3, 1: 1753.2. Samples: 42948734. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:06:56,876][101941] Avg episode reward: [(0, '8.980'), (1, '14.120')] +[2023-10-08 15:06:57,877][102897] Updated weights for policy 0, policy_version 83810 (0.0008) +[2023-10-08 15:06:58,237][102897] Updated weights for policy 0, policy_version 83820 (0.0008) +[2023-10-08 15:06:58,609][102897] Updated weights for policy 0, policy_version 83830 (0.0007) +[2023-10-08 15:06:58,978][102897] Updated weights for policy 0, policy_version 83840 (0.0007) +[2023-10-08 15:06:59,618][102898] Updated weights for policy 1, policy_version 83940 (0.0010) +[2023-10-08 15:06:59,983][102898] Updated weights for policy 1, policy_version 83950 (0.0007) +[2023-10-08 15:07:00,348][102898] Updated weights for policy 1, policy_version 83960 (0.0007) +[2023-10-08 15:07:01,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 171835392. Throughput: 0: 1755.8, 1: 1738.9. Samples: 42970258. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:01,875][101941] Avg episode reward: [(0, '8.920'), (1, '14.270')] +[2023-10-08 15:07:01,883][102760] Saving new best policy, reward=14.270! +[2023-10-08 15:07:02,665][102897] Updated weights for policy 0, policy_version 83850 (0.0008) +[2023-10-08 15:07:03,040][102897] Updated weights for policy 0, policy_version 83860 (0.0007) +[2023-10-08 15:07:03,407][102897] Updated weights for policy 0, policy_version 83870 (0.0008) +[2023-10-08 15:07:04,065][102898] Updated weights for policy 1, policy_version 83970 (0.0008) +[2023-10-08 15:07:04,436][102898] Updated weights for policy 1, policy_version 83980 (0.0008) +[2023-10-08 15:07:04,800][102898] Updated weights for policy 1, policy_version 83990 (0.0009) +[2023-10-08 15:07:05,168][102898] Updated weights for policy 1, policy_version 84000 (0.0008) +[2023-10-08 15:07:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 171900928. Throughput: 0: 1731.3, 1: 1758.3. Samples: 42980746. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:06,875][101941] Avg episode reward: [(0, '8.810'), (1, '13.210')] +[2023-10-08 15:07:07,245][102897] Updated weights for policy 0, policy_version 83880 (0.0010) +[2023-10-08 15:07:07,610][102897] Updated weights for policy 0, policy_version 83890 (0.0011) +[2023-10-08 15:07:07,995][102897] Updated weights for policy 0, policy_version 83900 (0.0011) +[2023-10-08 15:07:08,843][102898] Updated weights for policy 1, policy_version 84010 (0.0008) +[2023-10-08 15:07:09,208][102898] Updated weights for policy 1, policy_version 84020 (0.0007) +[2023-10-08 15:07:09,579][102898] Updated weights for policy 1, policy_version 84030 (0.0010) +[2023-10-08 15:07:11,741][102897] Updated weights for policy 0, policy_version 83910 (0.0009) +[2023-10-08 15:07:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 171966464. Throughput: 0: 1754.5, 1: 1742.1. Samples: 43002468. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:11,876][101941] Avg episode reward: [(0, '8.580'), (1, '13.180')] +[2023-10-08 15:07:12,118][102897] Updated weights for policy 0, policy_version 83920 (0.0007) +[2023-10-08 15:07:12,480][102897] Updated weights for policy 0, policy_version 83930 (0.0008) +[2023-10-08 15:07:13,275][102898] Updated weights for policy 1, policy_version 84040 (0.0008) +[2023-10-08 15:07:13,640][102898] Updated weights for policy 1, policy_version 84050 (0.0008) +[2023-10-08 15:07:14,007][102898] Updated weights for policy 1, policy_version 84060 (0.0008) +[2023-10-08 15:07:16,097][102897] Updated weights for policy 0, policy_version 83940 (0.0007) +[2023-10-08 15:07:16,460][102897] Updated weights for policy 0, policy_version 83950 (0.0009) +[2023-10-08 15:07:16,833][102897] Updated weights for policy 0, policy_version 83960 (0.0010) +[2023-10-08 15:07:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 172032000. Throughput: 0: 1771.7, 1: 1767.6. Samples: 43024232. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:16,876][101941] Avg episode reward: [(0, '9.010'), (1, '12.150')] +[2023-10-08 15:07:17,740][102898] Updated weights for policy 1, policy_version 84070 (0.0008) +[2023-10-08 15:07:18,094][102898] Updated weights for policy 1, policy_version 84080 (0.0007) +[2023-10-08 15:07:18,463][102898] Updated weights for policy 1, policy_version 84090 (0.0009) +[2023-10-08 15:07:20,650][102897] Updated weights for policy 0, policy_version 83970 (0.0008) +[2023-10-08 15:07:21,009][102897] Updated weights for policy 0, policy_version 83980 (0.0009) +[2023-10-08 15:07:21,384][102897] Updated weights for policy 0, policy_version 83990 (0.0007) +[2023-10-08 15:07:21,743][102897] Updated weights for policy 0, policy_version 84000 (0.0007) +[2023-10-08 15:07:21,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 172130304. Throughput: 0: 1780.3, 1: 1791.3. Samples: 43034782. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:21,875][101941] Avg episode reward: [(0, '8.730'), (1, '12.190')] +[2023-10-08 15:07:22,388][102898] Updated weights for policy 1, policy_version 84100 (0.0009) +[2023-10-08 15:07:22,752][102898] Updated weights for policy 1, policy_version 84110 (0.0010) +[2023-10-08 15:07:23,115][102898] Updated weights for policy 1, policy_version 84120 (0.0010) +[2023-10-08 15:07:25,338][102897] Updated weights for policy 0, policy_version 84010 (0.0008) +[2023-10-08 15:07:25,710][102897] Updated weights for policy 0, policy_version 84020 (0.0009) +[2023-10-08 15:07:26,074][102897] Updated weights for policy 0, policy_version 84030 (0.0007) +[2023-10-08 15:07:26,710][102898] Updated weights for policy 1, policy_version 84130 (0.0010) +[2023-10-08 15:07:26,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 172195840. Throughput: 0: 1807.1, 1: 1784.9. Samples: 43056708. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:26,876][101941] Avg episode reward: [(0, '8.830'), (1, '12.860')] +[2023-10-08 15:07:27,071][102898] Updated weights for policy 1, policy_version 84140 (0.0008) +[2023-10-08 15:07:27,449][102898] Updated weights for policy 1, policy_version 84150 (0.0009) +[2023-10-08 15:07:27,816][102898] Updated weights for policy 1, policy_version 84160 (0.0008) +[2023-10-08 15:07:29,755][102897] Updated weights for policy 0, policy_version 84040 (0.0007) +[2023-10-08 15:07:30,119][102897] Updated weights for policy 0, policy_version 84050 (0.0007) +[2023-10-08 15:07:30,484][102897] Updated weights for policy 0, policy_version 84060 (0.0008) +[2023-10-08 15:07:31,531][102898] Updated weights for policy 1, policy_version 84170 (0.0008) +[2023-10-08 15:07:31,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14304.0, 300 sec: 14218.0). Total num frames: 172261376. Throughput: 0: 1795.5, 1: 1794.7. Samples: 43078030. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:31,876][101941] Avg episode reward: [(0, '9.120'), (1, '12.840')] +[2023-10-08 15:07:31,890][102898] Updated weights for policy 1, policy_version 84180 (0.0007) +[2023-10-08 15:07:32,257][102898] Updated weights for policy 1, policy_version 84190 (0.0007) +[2023-10-08 15:07:34,001][102897] Updated weights for policy 0, policy_version 84070 (0.0008) +[2023-10-08 15:07:34,367][102897] Updated weights for policy 0, policy_version 84080 (0.0008) +[2023-10-08 15:07:34,743][102897] Updated weights for policy 0, policy_version 84090 (0.0009) +[2023-10-08 15:07:36,197][102898] Updated weights for policy 1, policy_version 84200 (0.0007) +[2023-10-08 15:07:36,563][102898] Updated weights for policy 1, policy_version 84210 (0.0008) +[2023-10-08 15:07:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 172326912. Throughput: 0: 1803.6, 1: 1787.0. Samples: 43089068. Policy #0 lag: (min: 25.0, avg: 45.6, max: 57.0) +[2023-10-08 15:07:36,876][101941] Avg episode reward: [(0, '9.060'), (1, '13.170')] +[2023-10-08 15:07:36,931][102898] Updated weights for policy 1, policy_version 84220 (0.0007) +[2023-10-08 15:07:38,577][102897] Updated weights for policy 0, policy_version 84100 (0.0007) +[2023-10-08 15:07:38,948][102897] Updated weights for policy 0, policy_version 84110 (0.0007) +[2023-10-08 15:07:39,315][102897] Updated weights for policy 0, policy_version 84120 (0.0008) +[2023-10-08 15:07:40,663][102898] Updated weights for policy 1, policy_version 84230 (0.0008) +[2023-10-08 15:07:41,019][102898] Updated weights for policy 1, policy_version 84240 (0.0008) +[2023-10-08 15:07:41,386][102898] Updated weights for policy 1, policy_version 84250 (0.0010) +[2023-10-08 15:07:41,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 172425216. Throughput: 0: 1798.0, 1: 1802.1. Samples: 43110738. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:07:41,876][101941] Avg episode reward: [(0, '9.230'), (1, '12.210')] +[2023-10-08 15:07:43,129][102897] Updated weights for policy 0, policy_version 84130 (0.0007) +[2023-10-08 15:07:43,503][102897] Updated weights for policy 0, policy_version 84140 (0.0008) +[2023-10-08 15:07:43,872][102897] Updated weights for policy 0, policy_version 84150 (0.0008) +[2023-10-08 15:07:44,245][102897] Updated weights for policy 0, policy_version 84160 (0.0009) +[2023-10-08 15:07:45,069][102898] Updated weights for policy 1, policy_version 84260 (0.0010) +[2023-10-08 15:07:45,434][102898] Updated weights for policy 1, policy_version 84270 (0.0010) +[2023-10-08 15:07:45,798][102898] Updated weights for policy 1, policy_version 84280 (0.0009) +[2023-10-08 15:07:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 172490752. Throughput: 0: 1805.8, 1: 1788.3. Samples: 43131994. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:07:46,876][101941] Avg episode reward: [(0, '8.830'), (1, '12.320')] +[2023-10-08 15:07:47,893][102897] Updated weights for policy 0, policy_version 84170 (0.0007) +[2023-10-08 15:07:48,265][102897] Updated weights for policy 0, policy_version 84180 (0.0008) +[2023-10-08 15:07:48,631][102897] Updated weights for policy 0, policy_version 84190 (0.0009) +[2023-10-08 15:07:49,657][102898] Updated weights for policy 1, policy_version 84290 (0.0010) +[2023-10-08 15:07:50,014][102898] Updated weights for policy 1, policy_version 84300 (0.0008) +[2023-10-08 15:07:50,380][102898] Updated weights for policy 1, policy_version 84310 (0.0008) +[2023-10-08 15:07:50,746][102898] Updated weights for policy 1, policy_version 84320 (0.0008) +[2023-10-08 15:07:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 172556288. Throughput: 0: 1807.5, 1: 1803.6. Samples: 43143246. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:07:51,876][101941] Avg episode reward: [(0, '8.490'), (1, '12.060')] +[2023-10-08 15:07:52,319][102897] Updated weights for policy 0, policy_version 84200 (0.0007) +[2023-10-08 15:07:52,684][102897] Updated weights for policy 0, policy_version 84210 (0.0007) +[2023-10-08 15:07:53,048][102897] Updated weights for policy 0, policy_version 84220 (0.0007) +[2023-10-08 15:07:54,552][102898] Updated weights for policy 1, policy_version 84330 (0.0008) +[2023-10-08 15:07:54,928][102898] Updated weights for policy 1, policy_version 84340 (0.0007) +[2023-10-08 15:07:55,298][102898] Updated weights for policy 1, policy_version 84350 (0.0007) +[2023-10-08 15:07:56,706][102897] Updated weights for policy 0, policy_version 84230 (0.0008) +[2023-10-08 15:07:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 172621824. Throughput: 0: 1811.9, 1: 1781.4. Samples: 43164166. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:07:56,876][101941] Avg episode reward: [(0, '8.330'), (1, '12.840')] +[2023-10-08 15:07:57,077][102897] Updated weights for policy 0, policy_version 84240 (0.0008) +[2023-10-08 15:07:57,442][102897] Updated weights for policy 0, policy_version 84250 (0.0007) +[2023-10-08 15:07:59,124][102898] Updated weights for policy 1, policy_version 84360 (0.0010) +[2023-10-08 15:07:59,498][102898] Updated weights for policy 1, policy_version 84370 (0.0009) +[2023-10-08 15:07:59,873][102898] Updated weights for policy 1, policy_version 84380 (0.0008) +[2023-10-08 15:08:01,374][102897] Updated weights for policy 0, policy_version 84260 (0.0008) +[2023-10-08 15:08:01,738][102897] Updated weights for policy 0, policy_version 84270 (0.0007) +[2023-10-08 15:08:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 172687360. Throughput: 0: 1814.9, 1: 1784.3. Samples: 43186194. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:01,875][101941] Avg episode reward: [(0, '8.160'), (1, '13.120')] +[2023-10-08 15:08:02,115][102897] Updated weights for policy 0, policy_version 84280 (0.0009) +[2023-10-08 15:08:03,724][102898] Updated weights for policy 1, policy_version 84390 (0.0010) +[2023-10-08 15:08:04,079][102898] Updated weights for policy 1, policy_version 84400 (0.0010) +[2023-10-08 15:08:04,444][102898] Updated weights for policy 1, policy_version 84410 (0.0009) +[2023-10-08 15:08:05,932][102897] Updated weights for policy 0, policy_version 84290 (0.0009) +[2023-10-08 15:08:06,306][102897] Updated weights for policy 0, policy_version 84300 (0.0009) +[2023-10-08 15:08:06,676][102897] Updated weights for policy 0, policy_version 84310 (0.0007) +[2023-10-08 15:08:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 172752896. Throughput: 0: 1802.0, 1: 1790.5. Samples: 43196448. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:06,876][101941] Avg episode reward: [(0, '8.450'), (1, '12.490')] +[2023-10-08 15:08:07,051][102897] Updated weights for policy 0, policy_version 84320 (0.0008) +[2023-10-08 15:08:08,262][102898] Updated weights for policy 1, policy_version 84420 (0.0009) +[2023-10-08 15:08:08,634][102898] Updated weights for policy 1, policy_version 84430 (0.0009) +[2023-10-08 15:08:08,993][102898] Updated weights for policy 1, policy_version 84440 (0.0010) +[2023-10-08 15:08:10,773][102897] Updated weights for policy 0, policy_version 84330 (0.0008) +[2023-10-08 15:08:11,144][102897] Updated weights for policy 0, policy_version 84340 (0.0009) +[2023-10-08 15:08:11,511][102897] Updated weights for policy 0, policy_version 84350 (0.0008) +[2023-10-08 15:08:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 172851200. Throughput: 0: 1808.8, 1: 1785.7. Samples: 43218464. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:11,876][101941] Avg episode reward: [(0, '8.480'), (1, '12.850')] +[2023-10-08 15:08:12,809][102898] Updated weights for policy 1, policy_version 84450 (0.0009) +[2023-10-08 15:08:13,187][102898] Updated weights for policy 1, policy_version 84460 (0.0007) +[2023-10-08 15:08:13,557][102898] Updated weights for policy 1, policy_version 84470 (0.0007) +[2023-10-08 15:08:13,922][102898] Updated weights for policy 1, policy_version 84480 (0.0007) +[2023-10-08 15:08:15,311][102897] Updated weights for policy 0, policy_version 84360 (0.0009) +[2023-10-08 15:08:15,673][102897] Updated weights for policy 0, policy_version 84370 (0.0008) +[2023-10-08 15:08:16,039][102897] Updated weights for policy 0, policy_version 84380 (0.0009) +[2023-10-08 15:08:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 172916736. Throughput: 0: 1793.1, 1: 1791.1. Samples: 43239316. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:16,876][101941] Avg episode reward: [(0, '9.090'), (1, '12.800')] +[2023-10-08 15:08:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000084384_86409216.pth... +[2023-10-08 15:08:16,887][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000084480_86507520.pth... +[2023-10-08 15:08:16,926][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000082816_84803584.pth +[2023-10-08 15:08:16,927][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000082720_84705280.pth +[2023-10-08 15:08:17,597][102898] Updated weights for policy 1, policy_version 84490 (0.0007) +[2023-10-08 15:08:17,970][102898] Updated weights for policy 1, policy_version 84500 (0.0009) +[2023-10-08 15:08:18,341][102898] Updated weights for policy 1, policy_version 84510 (0.0009) +[2023-10-08 15:08:19,800][102897] Updated weights for policy 0, policy_version 84390 (0.0008) +[2023-10-08 15:08:20,172][102897] Updated weights for policy 0, policy_version 84400 (0.0007) +[2023-10-08 15:08:20,547][102897] Updated weights for policy 0, policy_version 84410 (0.0007) +[2023-10-08 15:08:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 172982272. Throughput: 0: 1803.2, 1: 1780.4. Samples: 43250332. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:21,876][101941] Avg episode reward: [(0, '9.490'), (1, '13.830')] +[2023-10-08 15:08:22,113][102898] Updated weights for policy 1, policy_version 84520 (0.0009) +[2023-10-08 15:08:22,477][102898] Updated weights for policy 1, policy_version 84530 (0.0007) +[2023-10-08 15:08:22,843][102898] Updated weights for policy 1, policy_version 84540 (0.0007) +[2023-10-08 15:08:24,218][102897] Updated weights for policy 0, policy_version 84420 (0.0008) +[2023-10-08 15:08:24,583][102897] Updated weights for policy 0, policy_version 84430 (0.0010) +[2023-10-08 15:08:24,953][102897] Updated weights for policy 0, policy_version 84440 (0.0009) +[2023-10-08 15:08:26,620][102898] Updated weights for policy 1, policy_version 84550 (0.0009) +[2023-10-08 15:08:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 173047808. Throughput: 0: 1790.9, 1: 1777.8. Samples: 43271328. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:26,876][101941] Avg episode reward: [(0, '8.870'), (1, '13.120')] +[2023-10-08 15:08:26,991][102898] Updated weights for policy 1, policy_version 84560 (0.0008) +[2023-10-08 15:08:27,357][102898] Updated weights for policy 1, policy_version 84570 (0.0007) +[2023-10-08 15:08:28,669][102897] Updated weights for policy 0, policy_version 84450 (0.0010) +[2023-10-08 15:08:29,041][102897] Updated weights for policy 0, policy_version 84460 (0.0008) +[2023-10-08 15:08:29,408][102897] Updated weights for policy 0, policy_version 84470 (0.0007) +[2023-10-08 15:08:29,770][102897] Updated weights for policy 0, policy_version 84480 (0.0009) +[2023-10-08 15:08:31,157][102898] Updated weights for policy 1, policy_version 84580 (0.0010) +[2023-10-08 15:08:31,515][102898] Updated weights for policy 1, policy_version 84590 (0.0008) +[2023-10-08 15:08:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173113344. Throughput: 0: 1785.7, 1: 1798.7. Samples: 43293292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:08:31,876][102898] Updated weights for policy 1, policy_version 84600 (0.0010) +[2023-10-08 15:08:31,876][101941] Avg episode reward: [(0, '8.850'), (1, '13.130')] +[2023-10-08 15:08:33,670][102897] Updated weights for policy 0, policy_version 84490 (0.0008) +[2023-10-08 15:08:34,044][102897] Updated weights for policy 0, policy_version 84500 (0.0007) +[2023-10-08 15:08:34,415][102897] Updated weights for policy 0, policy_version 84510 (0.0008) +[2023-10-08 15:08:35,429][102898] Updated weights for policy 1, policy_version 84610 (0.0007) +[2023-10-08 15:08:35,793][102898] Updated weights for policy 1, policy_version 84620 (0.0007) +[2023-10-08 15:08:36,162][102898] Updated weights for policy 1, policy_version 84630 (0.0009) +[2023-10-08 15:08:36,530][102898] Updated weights for policy 1, policy_version 84640 (0.0009) +[2023-10-08 15:08:36,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 173211648. Throughput: 0: 1789.9, 1: 1783.5. Samples: 43304048. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:08:36,876][101941] Avg episode reward: [(0, '9.070'), (1, '14.140')] +[2023-10-08 15:08:38,105][102897] Updated weights for policy 0, policy_version 84520 (0.0009) +[2023-10-08 15:08:38,466][102897] Updated weights for policy 0, policy_version 84530 (0.0008) +[2023-10-08 15:08:38,844][102897] Updated weights for policy 0, policy_version 84540 (0.0008) +[2023-10-08 15:08:40,198][102898] Updated weights for policy 1, policy_version 84650 (0.0008) +[2023-10-08 15:08:40,566][102898] Updated weights for policy 1, policy_version 84660 (0.0008) +[2023-10-08 15:08:40,936][102898] Updated weights for policy 1, policy_version 84670 (0.0010) +[2023-10-08 15:08:41,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 173277184. Throughput: 0: 1782.7, 1: 1805.3. Samples: 43325624. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:08:41,876][101941] Avg episode reward: [(0, '8.070'), (1, '13.200')] +[2023-10-08 15:08:42,622][102897] Updated weights for policy 0, policy_version 84550 (0.0008) +[2023-10-08 15:08:42,985][102897] Updated weights for policy 0, policy_version 84560 (0.0009) +[2023-10-08 15:08:43,353][102897] Updated weights for policy 0, policy_version 84570 (0.0007) +[2023-10-08 15:08:44,552][102898] Updated weights for policy 1, policy_version 84680 (0.0009) +[2023-10-08 15:08:44,922][102898] Updated weights for policy 1, policy_version 84690 (0.0009) +[2023-10-08 15:08:45,289][102898] Updated weights for policy 1, policy_version 84700 (0.0008) +[2023-10-08 15:08:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 173342720. Throughput: 0: 1793.7, 1: 1794.4. Samples: 43347658. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:08:46,875][101941] Avg episode reward: [(0, '8.600'), (1, '13.650')] +[2023-10-08 15:08:47,043][102897] Updated weights for policy 0, policy_version 84580 (0.0007) +[2023-10-08 15:08:47,407][102897] Updated weights for policy 0, policy_version 84590 (0.0007) +[2023-10-08 15:08:47,780][102897] Updated weights for policy 0, policy_version 84600 (0.0009) +[2023-10-08 15:08:49,149][102898] Updated weights for policy 1, policy_version 84710 (0.0008) +[2023-10-08 15:08:49,513][102898] Updated weights for policy 1, policy_version 84720 (0.0007) +[2023-10-08 15:08:49,883][102898] Updated weights for policy 1, policy_version 84730 (0.0008) +[2023-10-08 15:08:51,692][102897] Updated weights for policy 0, policy_version 84610 (0.0008) +[2023-10-08 15:08:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173408256. Throughput: 0: 1788.6, 1: 1803.0. Samples: 43358068. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:08:51,876][101941] Avg episode reward: [(0, '8.860'), (1, '13.130')] +[2023-10-08 15:08:52,065][102897] Updated weights for policy 0, policy_version 84620 (0.0008) +[2023-10-08 15:08:52,448][102897] Updated weights for policy 0, policy_version 84630 (0.0008) +[2023-10-08 15:08:52,815][102897] Updated weights for policy 0, policy_version 84640 (0.0007) +[2023-10-08 15:08:53,621][102898] Updated weights for policy 1, policy_version 84740 (0.0008) +[2023-10-08 15:08:53,997][102898] Updated weights for policy 1, policy_version 84750 (0.0009) +[2023-10-08 15:08:54,361][102898] Updated weights for policy 1, policy_version 84760 (0.0009) +[2023-10-08 15:08:56,574][102897] Updated weights for policy 0, policy_version 84650 (0.0008) +[2023-10-08 15:08:56,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173473792. Throughput: 0: 1781.7, 1: 1797.0. Samples: 43379504. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:08:56,876][101941] Avg episode reward: [(0, '8.740'), (1, '13.460')] +[2023-10-08 15:08:56,949][102897] Updated weights for policy 0, policy_version 84660 (0.0007) +[2023-10-08 15:08:57,321][102897] Updated weights for policy 0, policy_version 84670 (0.0008) +[2023-10-08 15:08:57,911][102898] Updated weights for policy 1, policy_version 84770 (0.0008) +[2023-10-08 15:08:58,278][102898] Updated weights for policy 1, policy_version 84780 (0.0007) +[2023-10-08 15:08:58,645][102898] Updated weights for policy 1, policy_version 84790 (0.0007) +[2023-10-08 15:08:59,011][102898] Updated weights for policy 1, policy_version 84800 (0.0008) +[2023-10-08 15:09:01,037][102897] Updated weights for policy 0, policy_version 84680 (0.0009) +[2023-10-08 15:09:01,406][102897] Updated weights for policy 0, policy_version 84690 (0.0008) +[2023-10-08 15:09:01,773][102897] Updated weights for policy 0, policy_version 84700 (0.0009) +[2023-10-08 15:09:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173539328. Throughput: 0: 1795.6, 1: 1804.5. Samples: 43401320. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:09:01,876][101941] Avg episode reward: [(0, '8.890'), (1, '12.220')] +[2023-10-08 15:09:02,809][102898] Updated weights for policy 1, policy_version 84810 (0.0010) +[2023-10-08 15:09:03,184][102898] Updated weights for policy 1, policy_version 84820 (0.0010) +[2023-10-08 15:09:03,556][102898] Updated weights for policy 1, policy_version 84830 (0.0011) +[2023-10-08 15:09:05,554][102897] Updated weights for policy 0, policy_version 84710 (0.0008) +[2023-10-08 15:09:05,940][102897] Updated weights for policy 0, policy_version 84720 (0.0007) +[2023-10-08 15:09:06,311][102897] Updated weights for policy 0, policy_version 84730 (0.0007) +[2023-10-08 15:09:06,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 173637632. Throughput: 0: 1779.6, 1: 1803.2. Samples: 43411554. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:09:06,875][101941] Avg episode reward: [(0, '8.820'), (1, '12.230')] +[2023-10-08 15:09:07,421][102898] Updated weights for policy 1, policy_version 84840 (0.0007) +[2023-10-08 15:09:07,780][102898] Updated weights for policy 1, policy_version 84850 (0.0008) +[2023-10-08 15:09:08,152][102898] Updated weights for policy 1, policy_version 84860 (0.0008) +[2023-10-08 15:09:09,999][102897] Updated weights for policy 0, policy_version 84740 (0.0007) +[2023-10-08 15:09:10,380][102897] Updated weights for policy 0, policy_version 84750 (0.0008) +[2023-10-08 15:09:10,748][102897] Updated weights for policy 0, policy_version 84760 (0.0008) +[2023-10-08 15:09:11,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 173703168. Throughput: 0: 1803.1, 1: 1801.6. Samples: 43433540. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:09:11,875][101941] Avg episode reward: [(0, '9.570'), (1, '14.070')] +[2023-10-08 15:09:11,970][102898] Updated weights for policy 1, policy_version 84870 (0.0009) +[2023-10-08 15:09:12,338][102898] Updated weights for policy 1, policy_version 84880 (0.0007) +[2023-10-08 15:09:12,706][102898] Updated weights for policy 1, policy_version 84890 (0.0007) +[2023-10-08 15:09:14,632][102897] Updated weights for policy 0, policy_version 84770 (0.0008) +[2023-10-08 15:09:15,002][102897] Updated weights for policy 0, policy_version 84780 (0.0009) +[2023-10-08 15:09:15,373][102897] Updated weights for policy 0, policy_version 84790 (0.0008) +[2023-10-08 15:09:15,739][102897] Updated weights for policy 0, policy_version 84800 (0.0007) +[2023-10-08 15:09:16,463][102898] Updated weights for policy 1, policy_version 84900 (0.0008) +[2023-10-08 15:09:16,837][102898] Updated weights for policy 1, policy_version 84910 (0.0010) +[2023-10-08 15:09:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173768704. Throughput: 0: 1785.0, 1: 1805.6. Samples: 43454868. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:09:16,876][101941] Avg episode reward: [(0, '9.650'), (1, '13.300')] +[2023-10-08 15:09:17,208][102898] Updated weights for policy 1, policy_version 84920 (0.0007) +[2023-10-08 15:09:19,542][102897] Updated weights for policy 0, policy_version 84810 (0.0007) +[2023-10-08 15:09:19,906][102897] Updated weights for policy 0, policy_version 84820 (0.0007) +[2023-10-08 15:09:20,278][102897] Updated weights for policy 0, policy_version 84830 (0.0008) +[2023-10-08 15:09:20,983][102898] Updated weights for policy 1, policy_version 84930 (0.0007) +[2023-10-08 15:09:21,347][102898] Updated weights for policy 1, policy_version 84940 (0.0011) +[2023-10-08 15:09:21,709][102898] Updated weights for policy 1, policy_version 84950 (0.0010) +[2023-10-08 15:09:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173834240. Throughput: 0: 1807.2, 1: 1791.5. Samples: 43465992. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:09:21,876][101941] Avg episode reward: [(0, '8.610'), (1, '14.330')] +[2023-10-08 15:09:22,070][102760] Saving new best policy, reward=14.330! +[2023-10-08 15:09:22,072][102898] Updated weights for policy 1, policy_version 84960 (0.0010) +[2023-10-08 15:09:23,863][102897] Updated weights for policy 0, policy_version 84840 (0.0008) +[2023-10-08 15:09:24,221][102897] Updated weights for policy 0, policy_version 84850 (0.0007) +[2023-10-08 15:09:24,598][102897] Updated weights for policy 0, policy_version 84860 (0.0007) +[2023-10-08 15:09:26,127][102898] Updated weights for policy 1, policy_version 84970 (0.0009) +[2023-10-08 15:09:26,489][102898] Updated weights for policy 1, policy_version 84980 (0.0008) +[2023-10-08 15:09:26,862][102898] Updated weights for policy 1, policy_version 84990 (0.0007) +[2023-10-08 15:09:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 173899776. Throughput: 0: 1787.0, 1: 1802.4. Samples: 43487146. Policy #0 lag: (min: 30.0, avg: 30.0, max: 30.0) +[2023-10-08 15:09:26,876][101941] Avg episode reward: [(0, '8.920'), (1, '13.440')] +[2023-10-08 15:09:28,401][102897] Updated weights for policy 0, policy_version 84870 (0.0008) +[2023-10-08 15:09:28,772][102897] Updated weights for policy 0, policy_version 84880 (0.0008) +[2023-10-08 15:09:29,141][102897] Updated weights for policy 0, policy_version 84890 (0.0008) +[2023-10-08 15:09:30,473][102898] Updated weights for policy 1, policy_version 85000 (0.0008) +[2023-10-08 15:09:30,848][102898] Updated weights for policy 1, policy_version 85010 (0.0011) +[2023-10-08 15:09:31,210][102898] Updated weights for policy 1, policy_version 85020 (0.0009) +[2023-10-08 15:09:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 173998080. Throughput: 0: 1782.8, 1: 1781.8. Samples: 43508062. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:09:31,876][101941] Avg episode reward: [(0, '9.480'), (1, '13.180')] +[2023-10-08 15:09:32,837][102897] Updated weights for policy 0, policy_version 84900 (0.0007) +[2023-10-08 15:09:33,213][102897] Updated weights for policy 0, policy_version 84910 (0.0008) +[2023-10-08 15:09:33,590][102897] Updated weights for policy 0, policy_version 84920 (0.0010) +[2023-10-08 15:09:35,071][102898] Updated weights for policy 1, policy_version 85030 (0.0008) +[2023-10-08 15:09:35,440][102898] Updated weights for policy 1, policy_version 85040 (0.0011) +[2023-10-08 15:09:35,794][102898] Updated weights for policy 1, policy_version 85050 (0.0007) +[2023-10-08 15:09:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 174063616. Throughput: 0: 1785.3, 1: 1796.1. Samples: 43519234. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:09:36,876][101941] Avg episode reward: [(0, '9.850'), (1, '13.270')] +[2023-10-08 15:09:37,480][102897] Updated weights for policy 0, policy_version 84930 (0.0007) +[2023-10-08 15:09:37,838][102897] Updated weights for policy 0, policy_version 84940 (0.0009) +[2023-10-08 15:09:38,215][102897] Updated weights for policy 0, policy_version 84950 (0.0007) +[2023-10-08 15:09:38,583][102897] Updated weights for policy 0, policy_version 84960 (0.0008) +[2023-10-08 15:09:39,629][102898] Updated weights for policy 1, policy_version 85060 (0.0007) +[2023-10-08 15:09:39,985][102898] Updated weights for policy 1, policy_version 85070 (0.0008) +[2023-10-08 15:09:40,352][102898] Updated weights for policy 1, policy_version 85080 (0.0008) +[2023-10-08 15:09:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 174129152. Throughput: 0: 1787.1, 1: 1785.3. Samples: 43540264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:09:41,876][101941] Avg episode reward: [(0, '8.690'), (1, '12.190')] +[2023-10-08 15:09:42,504][102897] Updated weights for policy 0, policy_version 84970 (0.0008) +[2023-10-08 15:09:42,885][102897] Updated weights for policy 0, policy_version 84980 (0.0009) +[2023-10-08 15:09:43,265][102897] Updated weights for policy 0, policy_version 84990 (0.0008) +[2023-10-08 15:09:43,957][102898] Updated weights for policy 1, policy_version 85090 (0.0007) +[2023-10-08 15:09:44,328][102898] Updated weights for policy 1, policy_version 85100 (0.0007) +[2023-10-08 15:09:44,690][102898] Updated weights for policy 1, policy_version 85110 (0.0009) +[2023-10-08 15:09:45,054][102898] Updated weights for policy 1, policy_version 85120 (0.0009) +[2023-10-08 15:09:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 174194688. Throughput: 0: 1803.5, 1: 1773.9. Samples: 43562304. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:09:46,876][101941] Avg episode reward: [(0, '9.070'), (1, '11.790')] +[2023-10-08 15:09:47,035][102897] Updated weights for policy 0, policy_version 85000 (0.0009) +[2023-10-08 15:09:47,406][102897] Updated weights for policy 0, policy_version 85010 (0.0007) +[2023-10-08 15:09:47,777][102897] Updated weights for policy 0, policy_version 85020 (0.0009) +[2023-10-08 15:09:48,976][102898] Updated weights for policy 1, policy_version 85130 (0.0009) +[2023-10-08 15:09:49,335][102898] Updated weights for policy 1, policy_version 85140 (0.0007) +[2023-10-08 15:09:49,708][102898] Updated weights for policy 1, policy_version 85150 (0.0007) +[2023-10-08 15:09:51,598][102897] Updated weights for policy 0, policy_version 85030 (0.0008) +[2023-10-08 15:09:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 174260224. Throughput: 0: 1786.6, 1: 1785.2. Samples: 43572284. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:09:51,876][101941] Avg episode reward: [(0, '9.350'), (1, '12.730')] +[2023-10-08 15:09:51,965][102897] Updated weights for policy 0, policy_version 85040 (0.0009) +[2023-10-08 15:09:52,342][102897] Updated weights for policy 0, policy_version 85050 (0.0007) +[2023-10-08 15:09:53,517][102898] Updated weights for policy 1, policy_version 85160 (0.0008) +[2023-10-08 15:09:53,880][102898] Updated weights for policy 1, policy_version 85170 (0.0007) +[2023-10-08 15:09:54,243][102898] Updated weights for policy 1, policy_version 85180 (0.0008) +[2023-10-08 15:09:56,067][102897] Updated weights for policy 0, policy_version 85060 (0.0010) +[2023-10-08 15:09:56,435][102897] Updated weights for policy 0, policy_version 85070 (0.0010) +[2023-10-08 15:09:56,808][102897] Updated weights for policy 0, policy_version 85080 (0.0009) +[2023-10-08 15:09:56,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 174325760. Throughput: 0: 1792.3, 1: 1776.4. Samples: 43594128. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:09:56,875][101941] Avg episode reward: [(0, '9.150'), (1, '13.240')] +[2023-10-08 15:09:58,022][102898] Updated weights for policy 1, policy_version 85190 (0.0010) +[2023-10-08 15:09:58,382][102898] Updated weights for policy 1, policy_version 85200 (0.0008) +[2023-10-08 15:09:58,756][102898] Updated weights for policy 1, policy_version 85210 (0.0007) +[2023-10-08 15:10:00,661][102897] Updated weights for policy 0, policy_version 85090 (0.0007) +[2023-10-08 15:10:01,027][102897] Updated weights for policy 0, policy_version 85100 (0.0009) +[2023-10-08 15:10:01,398][102897] Updated weights for policy 0, policy_version 85110 (0.0008) +[2023-10-08 15:10:01,774][102897] Updated weights for policy 0, policy_version 85120 (0.0007) +[2023-10-08 15:10:01,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 174424064. Throughput: 0: 1786.3, 1: 1784.3. Samples: 43615546. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:01,876][101941] Avg episode reward: [(0, '8.880'), (1, '14.600')] +[2023-10-08 15:10:01,889][102760] Saving new best policy, reward=14.600! +[2023-10-08 15:10:02,564][102898] Updated weights for policy 1, policy_version 85220 (0.0007) +[2023-10-08 15:10:02,933][102898] Updated weights for policy 1, policy_version 85230 (0.0007) +[2023-10-08 15:10:03,300][102898] Updated weights for policy 1, policy_version 85240 (0.0007) +[2023-10-08 15:10:05,508][102897] Updated weights for policy 0, policy_version 85130 (0.0008) +[2023-10-08 15:10:05,880][102897] Updated weights for policy 0, policy_version 85140 (0.0007) +[2023-10-08 15:10:06,253][102897] Updated weights for policy 0, policy_version 85150 (0.0009) +[2023-10-08 15:10:06,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 174489600. Throughput: 0: 1783.0, 1: 1778.1. Samples: 43626242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:06,876][101941] Avg episode reward: [(0, '9.260'), (1, '13.210')] +[2023-10-08 15:10:06,883][102898] Updated weights for policy 1, policy_version 85250 (0.0007) +[2023-10-08 15:10:07,244][102898] Updated weights for policy 1, policy_version 85260 (0.0009) +[2023-10-08 15:10:07,616][102898] Updated weights for policy 1, policy_version 85270 (0.0007) +[2023-10-08 15:10:07,978][102898] Updated weights for policy 1, policy_version 85280 (0.0008) +[2023-10-08 15:10:09,939][102897] Updated weights for policy 0, policy_version 85160 (0.0008) +[2023-10-08 15:10:10,309][102897] Updated weights for policy 0, policy_version 85170 (0.0008) +[2023-10-08 15:10:10,676][102897] Updated weights for policy 0, policy_version 85180 (0.0008) +[2023-10-08 15:10:11,684][102898] Updated weights for policy 1, policy_version 85290 (0.0008) +[2023-10-08 15:10:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 174555136. Throughput: 0: 1783.5, 1: 1785.0. Samples: 43647728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:11,876][101941] Avg episode reward: [(0, '8.950'), (1, '13.240')] +[2023-10-08 15:10:12,055][102898] Updated weights for policy 1, policy_version 85300 (0.0009) +[2023-10-08 15:10:12,427][102898] Updated weights for policy 1, policy_version 85310 (0.0008) +[2023-10-08 15:10:14,385][102897] Updated weights for policy 0, policy_version 85190 (0.0008) +[2023-10-08 15:10:14,761][102897] Updated weights for policy 0, policy_version 85200 (0.0007) +[2023-10-08 15:10:15,132][102897] Updated weights for policy 0, policy_version 85210 (0.0008) +[2023-10-08 15:10:16,179][102898] Updated weights for policy 1, policy_version 85320 (0.0009) +[2023-10-08 15:10:16,546][102898] Updated weights for policy 1, policy_version 85330 (0.0009) +[2023-10-08 15:10:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 174620672. Throughput: 0: 1770.0, 1: 1800.5. Samples: 43668736. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:16,876][101941] Avg episode reward: [(0, '8.210'), (1, '13.860')] +[2023-10-08 15:10:16,887][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000085216_87261184.pth... +[2023-10-08 15:10:16,920][102898] Updated weights for policy 1, policy_version 85340 (0.0007) +[2023-10-08 15:10:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000083552_85557248.pth +[2023-10-08 15:10:17,058][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000085344_87392256.pth... +[2023-10-08 15:10:17,086][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000083648_85655552.pth +[2023-10-08 15:10:18,981][102897] Updated weights for policy 0, policy_version 85220 (0.0008) +[2023-10-08 15:10:19,350][102897] Updated weights for policy 0, policy_version 85230 (0.0007) +[2023-10-08 15:10:19,720][102897] Updated weights for policy 0, policy_version 85240 (0.0008) +[2023-10-08 15:10:20,599][102898] Updated weights for policy 1, policy_version 85350 (0.0008) +[2023-10-08 15:10:20,970][102898] Updated weights for policy 1, policy_version 85360 (0.0008) +[2023-10-08 15:10:21,327][102898] Updated weights for policy 1, policy_version 85370 (0.0007) +[2023-10-08 15:10:21,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 174718976. Throughput: 0: 1786.1, 1: 1783.8. Samples: 43679882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:21,876][101941] Avg episode reward: [(0, '8.870'), (1, '14.110')] +[2023-10-08 15:10:23,605][102897] Updated weights for policy 0, policy_version 85250 (0.0010) +[2023-10-08 15:10:23,973][102897] Updated weights for policy 0, policy_version 85260 (0.0008) +[2023-10-08 15:10:24,350][102897] Updated weights for policy 0, policy_version 85270 (0.0007) +[2023-10-08 15:10:24,718][102897] Updated weights for policy 0, policy_version 85280 (0.0008) +[2023-10-08 15:10:25,038][102898] Updated weights for policy 1, policy_version 85380 (0.0007) +[2023-10-08 15:10:25,409][102898] Updated weights for policy 1, policy_version 85390 (0.0008) +[2023-10-08 15:10:25,774][102898] Updated weights for policy 1, policy_version 85400 (0.0010) +[2023-10-08 15:10:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 174784512. Throughput: 0: 1765.2, 1: 1801.0. Samples: 43700744. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:26,876][101941] Avg episode reward: [(0, '9.110'), (1, '14.340')] +[2023-10-08 15:10:28,532][102897] Updated weights for policy 0, policy_version 85290 (0.0007) +[2023-10-08 15:10:28,901][102897] Updated weights for policy 0, policy_version 85300 (0.0007) +[2023-10-08 15:10:29,264][102897] Updated weights for policy 0, policy_version 85310 (0.0007) +[2023-10-08 15:10:29,630][102898] Updated weights for policy 1, policy_version 85410 (0.0007) +[2023-10-08 15:10:29,999][102898] Updated weights for policy 1, policy_version 85420 (0.0008) +[2023-10-08 15:10:30,368][102898] Updated weights for policy 1, policy_version 85430 (0.0009) +[2023-10-08 15:10:30,738][102898] Updated weights for policy 1, policy_version 85440 (0.0011) +[2023-10-08 15:10:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 174850048. Throughput: 0: 1770.5, 1: 1786.9. Samples: 43722382. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:31,875][101941] Avg episode reward: [(0, '9.570'), (1, '14.630')] +[2023-10-08 15:10:31,883][102760] Saving new best policy, reward=14.630! +[2023-10-08 15:10:32,951][102897] Updated weights for policy 0, policy_version 85320 (0.0009) +[2023-10-08 15:10:33,327][102897] Updated weights for policy 0, policy_version 85330 (0.0009) +[2023-10-08 15:10:33,692][102897] Updated weights for policy 0, policy_version 85340 (0.0007) +[2023-10-08 15:10:34,551][102898] Updated weights for policy 1, policy_version 85450 (0.0008) +[2023-10-08 15:10:34,929][102898] Updated weights for policy 1, policy_version 85460 (0.0007) +[2023-10-08 15:10:35,281][102898] Updated weights for policy 1, policy_version 85470 (0.0009) +[2023-10-08 15:10:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 174915584. Throughput: 0: 1768.9, 1: 1805.6. Samples: 43733136. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:36,875][101941] Avg episode reward: [(0, '9.850'), (1, '14.590')] +[2023-10-08 15:10:37,460][102897] Updated weights for policy 0, policy_version 85350 (0.0008) +[2023-10-08 15:10:37,839][102897] Updated weights for policy 0, policy_version 85360 (0.0007) +[2023-10-08 15:10:38,204][102897] Updated weights for policy 0, policy_version 85370 (0.0010) +[2023-10-08 15:10:39,081][102898] Updated weights for policy 1, policy_version 85480 (0.0009) +[2023-10-08 15:10:39,450][102898] Updated weights for policy 1, policy_version 85490 (0.0007) +[2023-10-08 15:10:39,820][102898] Updated weights for policy 1, policy_version 85500 (0.0009) +[2023-10-08 15:10:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 174981120. Throughput: 0: 1772.3, 1: 1788.5. Samples: 43754364. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:41,876][101941] Avg episode reward: [(0, '8.970'), (1, '13.640')] +[2023-10-08 15:10:42,149][102897] Updated weights for policy 0, policy_version 85380 (0.0009) +[2023-10-08 15:10:42,517][102897] Updated weights for policy 0, policy_version 85390 (0.0010) +[2023-10-08 15:10:42,891][102897] Updated weights for policy 0, policy_version 85400 (0.0007) +[2023-10-08 15:10:43,680][102898] Updated weights for policy 1, policy_version 85510 (0.0007) +[2023-10-08 15:10:44,050][102898] Updated weights for policy 1, policy_version 85520 (0.0011) +[2023-10-08 15:10:44,411][102898] Updated weights for policy 1, policy_version 85530 (0.0008) +[2023-10-08 15:10:46,559][102897] Updated weights for policy 0, policy_version 85410 (0.0007) +[2023-10-08 15:10:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 175046656. Throughput: 0: 1799.0, 1: 1786.2. Samples: 43776882. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:46,876][101941] Avg episode reward: [(0, '9.340'), (1, '12.160')] +[2023-10-08 15:10:46,934][102897] Updated weights for policy 0, policy_version 85420 (0.0007) +[2023-10-08 15:10:47,303][102897] Updated weights for policy 0, policy_version 85430 (0.0007) +[2023-10-08 15:10:47,674][102897] Updated weights for policy 0, policy_version 85440 (0.0009) +[2023-10-08 15:10:48,172][102898] Updated weights for policy 1, policy_version 85540 (0.0009) +[2023-10-08 15:10:48,534][102898] Updated weights for policy 1, policy_version 85550 (0.0008) +[2023-10-08 15:10:48,904][102898] Updated weights for policy 1, policy_version 85560 (0.0008) +[2023-10-08 15:10:51,378][102897] Updated weights for policy 0, policy_version 85450 (0.0010) +[2023-10-08 15:10:51,754][102897] Updated weights for policy 0, policy_version 85460 (0.0011) +[2023-10-08 15:10:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 175112192. Throughput: 0: 1777.5, 1: 1787.0. Samples: 43786642. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:51,876][101941] Avg episode reward: [(0, '9.430'), (1, '12.470')] +[2023-10-08 15:10:52,133][102897] Updated weights for policy 0, policy_version 85470 (0.0010) +[2023-10-08 15:10:52,614][102898] Updated weights for policy 1, policy_version 85570 (0.0007) +[2023-10-08 15:10:52,985][102898] Updated weights for policy 1, policy_version 85580 (0.0008) +[2023-10-08 15:10:53,348][102898] Updated weights for policy 1, policy_version 85590 (0.0007) +[2023-10-08 15:10:53,717][102898] Updated weights for policy 1, policy_version 85600 (0.0008) +[2023-10-08 15:10:55,769][102897] Updated weights for policy 0, policy_version 85480 (0.0008) +[2023-10-08 15:10:56,137][102897] Updated weights for policy 0, policy_version 85490 (0.0007) +[2023-10-08 15:10:56,508][102897] Updated weights for policy 0, policy_version 85500 (0.0009) +[2023-10-08 15:10:56,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 175210496. Throughput: 0: 1802.2, 1: 1786.6. Samples: 43809226. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:10:56,876][101941] Avg episode reward: [(0, '8.100'), (1, '13.100')] +[2023-10-08 15:10:57,453][102898] Updated weights for policy 1, policy_version 85610 (0.0010) +[2023-10-08 15:10:57,829][102898] Updated weights for policy 1, policy_version 85620 (0.0008) +[2023-10-08 15:10:58,184][102898] Updated weights for policy 1, policy_version 85630 (0.0008) +[2023-10-08 15:11:00,135][102897] Updated weights for policy 0, policy_version 85510 (0.0009) +[2023-10-08 15:11:00,501][102897] Updated weights for policy 0, policy_version 85520 (0.0010) +[2023-10-08 15:11:00,872][102897] Updated weights for policy 0, policy_version 85530 (0.0011) +[2023-10-08 15:11:01,835][102898] Updated weights for policy 1, policy_version 85640 (0.0008) +[2023-10-08 15:11:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 175276032. Throughput: 0: 1783.3, 1: 1813.1. Samples: 43830574. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:11:01,876][101941] Avg episode reward: [(0, '8.320'), (1, '11.740')] +[2023-10-08 15:11:02,201][102898] Updated weights for policy 1, policy_version 85650 (0.0010) +[2023-10-08 15:11:02,576][102898] Updated weights for policy 1, policy_version 85660 (0.0008) +[2023-10-08 15:11:04,557][102897] Updated weights for policy 0, policy_version 85540 (0.0009) +[2023-10-08 15:11:04,930][102897] Updated weights for policy 0, policy_version 85550 (0.0008) +[2023-10-08 15:11:05,293][102897] Updated weights for policy 0, policy_version 85560 (0.0009) +[2023-10-08 15:11:06,362][102898] Updated weights for policy 1, policy_version 85670 (0.0008) +[2023-10-08 15:11:06,720][102898] Updated weights for policy 1, policy_version 85680 (0.0008) +[2023-10-08 15:11:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 175341568. Throughput: 0: 1803.8, 1: 1793.1. Samples: 43841740. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:11:06,876][101941] Avg episode reward: [(0, '8.690'), (1, '11.780')] +[2023-10-08 15:11:07,092][102898] Updated weights for policy 1, policy_version 85690 (0.0008) +[2023-10-08 15:11:08,952][102897] Updated weights for policy 0, policy_version 85570 (0.0010) +[2023-10-08 15:11:09,319][102897] Updated weights for policy 0, policy_version 85580 (0.0007) +[2023-10-08 15:11:09,699][102897] Updated weights for policy 0, policy_version 85590 (0.0008) +[2023-10-08 15:11:10,067][102897] Updated weights for policy 0, policy_version 85600 (0.0008) +[2023-10-08 15:11:10,779][102898] Updated weights for policy 1, policy_version 85700 (0.0009) +[2023-10-08 15:11:11,152][102898] Updated weights for policy 1, policy_version 85710 (0.0008) +[2023-10-08 15:11:11,529][102898] Updated weights for policy 1, policy_version 85720 (0.0008) +[2023-10-08 15:11:11,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 175439872. Throughput: 0: 1798.0, 1: 1804.2. Samples: 43862844. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:11:11,875][101941] Avg episode reward: [(0, '8.010'), (1, '12.220')] +[2023-10-08 15:11:13,750][102897] Updated weights for policy 0, policy_version 85610 (0.0008) +[2023-10-08 15:11:14,106][102897] Updated weights for policy 0, policy_version 85620 (0.0010) +[2023-10-08 15:11:14,474][102897] Updated weights for policy 0, policy_version 85630 (0.0009) +[2023-10-08 15:11:15,361][102898] Updated weights for policy 1, policy_version 85730 (0.0007) +[2023-10-08 15:11:15,723][102898] Updated weights for policy 1, policy_version 85740 (0.0008) +[2023-10-08 15:11:16,087][102898] Updated weights for policy 1, policy_version 85750 (0.0008) +[2023-10-08 15:11:16,459][102898] Updated weights for policy 1, policy_version 85760 (0.0007) +[2023-10-08 15:11:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 175505408. Throughput: 0: 1799.1, 1: 1791.2. Samples: 43883948. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:11:16,876][101941] Avg episode reward: [(0, '8.270'), (1, '13.260')] +[2023-10-08 15:11:18,137][102897] Updated weights for policy 0, policy_version 85640 (0.0008) +[2023-10-08 15:11:18,506][102897] Updated weights for policy 0, policy_version 85650 (0.0007) +[2023-10-08 15:11:18,873][102897] Updated weights for policy 0, policy_version 85660 (0.0007) +[2023-10-08 15:11:20,408][102898] Updated weights for policy 1, policy_version 85770 (0.0009) +[2023-10-08 15:11:20,774][102898] Updated weights for policy 1, policy_version 85780 (0.0012) +[2023-10-08 15:11:21,140][102898] Updated weights for policy 1, policy_version 85790 (0.0007) +[2023-10-08 15:11:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 175570944. Throughput: 0: 1802.1, 1: 1800.7. Samples: 43895260. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:21,876][101941] Avg episode reward: [(0, '8.450'), (1, '14.630')] +[2023-10-08 15:11:22,803][102897] Updated weights for policy 0, policy_version 85670 (0.0007) +[2023-10-08 15:11:23,176][102897] Updated weights for policy 0, policy_version 85680 (0.0008) +[2023-10-08 15:11:23,551][102897] Updated weights for policy 0, policy_version 85690 (0.0010) +[2023-10-08 15:11:24,855][102898] Updated weights for policy 1, policy_version 85800 (0.0009) +[2023-10-08 15:11:25,224][102898] Updated weights for policy 1, policy_version 85810 (0.0009) +[2023-10-08 15:11:25,586][102898] Updated weights for policy 1, policy_version 85820 (0.0010) +[2023-10-08 15:11:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14350.4). Total num frames: 175636480. Throughput: 0: 1801.6, 1: 1799.2. Samples: 43916398. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:26,876][101941] Avg episode reward: [(0, '8.570'), (1, '14.410')] +[2023-10-08 15:11:27,236][102897] Updated weights for policy 0, policy_version 85700 (0.0008) +[2023-10-08 15:11:27,600][102897] Updated weights for policy 0, policy_version 85710 (0.0008) +[2023-10-08 15:11:27,975][102897] Updated weights for policy 0, policy_version 85720 (0.0009) +[2023-10-08 15:11:29,459][102898] Updated weights for policy 1, policy_version 85830 (0.0009) +[2023-10-08 15:11:29,827][102898] Updated weights for policy 1, policy_version 85840 (0.0008) +[2023-10-08 15:11:30,198][102898] Updated weights for policy 1, policy_version 85850 (0.0007) +[2023-10-08 15:11:31,774][102897] Updated weights for policy 0, policy_version 85730 (0.0010) +[2023-10-08 15:11:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 175702016. Throughput: 0: 1803.4, 1: 1785.5. Samples: 43938380. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:31,876][101941] Avg episode reward: [(0, '8.220'), (1, '14.750')] +[2023-10-08 15:11:31,886][102760] Saving new best policy, reward=14.750! +[2023-10-08 15:11:32,138][102897] Updated weights for policy 0, policy_version 85740 (0.0008) +[2023-10-08 15:11:32,514][102897] Updated weights for policy 0, policy_version 85750 (0.0008) +[2023-10-08 15:11:32,879][102897] Updated weights for policy 0, policy_version 85760 (0.0009) +[2023-10-08 15:11:33,915][102898] Updated weights for policy 1, policy_version 85860 (0.0009) +[2023-10-08 15:11:34,292][102898] Updated weights for policy 1, policy_version 85870 (0.0010) +[2023-10-08 15:11:34,652][102898] Updated weights for policy 1, policy_version 85880 (0.0009) +[2023-10-08 15:11:36,612][102897] Updated weights for policy 0, policy_version 85770 (0.0009) +[2023-10-08 15:11:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 175767552. Throughput: 0: 1802.0, 1: 1805.4. Samples: 43948974. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:36,875][101941] Avg episode reward: [(0, '8.300'), (1, '14.310')] +[2023-10-08 15:11:36,982][102897] Updated weights for policy 0, policy_version 85780 (0.0007) +[2023-10-08 15:11:37,336][102897] Updated weights for policy 0, policy_version 85790 (0.0008) +[2023-10-08 15:11:38,382][102898] Updated weights for policy 1, policy_version 85890 (0.0008) +[2023-10-08 15:11:38,749][102898] Updated weights for policy 1, policy_version 85900 (0.0007) +[2023-10-08 15:11:39,103][102898] Updated weights for policy 1, policy_version 85910 (0.0007) +[2023-10-08 15:11:39,469][102898] Updated weights for policy 1, policy_version 85920 (0.0008) +[2023-10-08 15:11:40,985][102897] Updated weights for policy 0, policy_version 85800 (0.0009) +[2023-10-08 15:11:41,368][102897] Updated weights for policy 0, policy_version 85810 (0.0008) +[2023-10-08 15:11:41,729][102897] Updated weights for policy 0, policy_version 85820 (0.0008) +[2023-10-08 15:11:41,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 175833088. Throughput: 0: 1811.2, 1: 1797.0. Samples: 43971594. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:41,876][101941] Avg episode reward: [(0, '9.140'), (1, '14.270')] +[2023-10-08 15:11:43,197][102898] Updated weights for policy 1, policy_version 85930 (0.0009) +[2023-10-08 15:11:43,572][102898] Updated weights for policy 1, policy_version 85940 (0.0009) +[2023-10-08 15:11:43,937][102898] Updated weights for policy 1, policy_version 85950 (0.0010) +[2023-10-08 15:11:45,365][102897] Updated weights for policy 0, policy_version 85830 (0.0008) +[2023-10-08 15:11:45,741][102897] Updated weights for policy 0, policy_version 85840 (0.0010) +[2023-10-08 15:11:46,108][102897] Updated weights for policy 0, policy_version 85850 (0.0010) +[2023-10-08 15:11:46,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 175931392. Throughput: 0: 1815.3, 1: 1784.9. Samples: 43992584. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:46,876][101941] Avg episode reward: [(0, '9.130'), (1, '13.280')] +[2023-10-08 15:11:47,736][102898] Updated weights for policy 1, policy_version 85960 (0.0008) +[2023-10-08 15:11:48,110][102898] Updated weights for policy 1, policy_version 85970 (0.0008) +[2023-10-08 15:11:48,481][102898] Updated weights for policy 1, policy_version 85980 (0.0008) +[2023-10-08 15:11:49,900][102897] Updated weights for policy 0, policy_version 85860 (0.0008) +[2023-10-08 15:11:50,268][102897] Updated weights for policy 0, policy_version 85870 (0.0008) +[2023-10-08 15:11:50,637][102897] Updated weights for policy 0, policy_version 85880 (0.0008) +[2023-10-08 15:11:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 175996928. Throughput: 0: 1812.3, 1: 1786.7. Samples: 44003692. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:51,876][101941] Avg episode reward: [(0, '8.760'), (1, '13.260')] +[2023-10-08 15:11:52,073][102898] Updated weights for policy 1, policy_version 85990 (0.0009) +[2023-10-08 15:11:52,441][102898] Updated weights for policy 1, policy_version 86000 (0.0009) +[2023-10-08 15:11:52,813][102898] Updated weights for policy 1, policy_version 86010 (0.0008) +[2023-10-08 15:11:54,392][102897] Updated weights for policy 0, policy_version 85890 (0.0009) +[2023-10-08 15:11:54,763][102897] Updated weights for policy 0, policy_version 85900 (0.0008) +[2023-10-08 15:11:55,135][102897] Updated weights for policy 0, policy_version 85910 (0.0009) +[2023-10-08 15:11:55,497][102897] Updated weights for policy 0, policy_version 85920 (0.0008) +[2023-10-08 15:11:56,566][102898] Updated weights for policy 1, policy_version 86020 (0.0009) +[2023-10-08 15:11:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176062464. Throughput: 0: 1815.7, 1: 1786.7. Samples: 44024954. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:11:56,876][101941] Avg episode reward: [(0, '9.130'), (1, '13.400')] +[2023-10-08 15:11:56,942][102898] Updated weights for policy 1, policy_version 86030 (0.0008) +[2023-10-08 15:11:57,304][102898] Updated weights for policy 1, policy_version 86040 (0.0007) +[2023-10-08 15:11:59,156][102897] Updated weights for policy 0, policy_version 85930 (0.0010) +[2023-10-08 15:11:59,533][102897] Updated weights for policy 0, policy_version 85940 (0.0008) +[2023-10-08 15:11:59,911][102897] Updated weights for policy 0, policy_version 85950 (0.0010) +[2023-10-08 15:12:01,140][102898] Updated weights for policy 1, policy_version 86050 (0.0008) +[2023-10-08 15:12:01,502][102898] Updated weights for policy 1, policy_version 86060 (0.0010) +[2023-10-08 15:12:01,867][102898] Updated weights for policy 1, policy_version 86070 (0.0007) +[2023-10-08 15:12:01,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 176128000. Throughput: 0: 1811.1, 1: 1806.8. Samples: 44046752. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:12:01,876][101941] Avg episode reward: [(0, '9.020'), (1, '13.640')] +[2023-10-08 15:12:02,234][102898] Updated weights for policy 1, policy_version 86080 (0.0009) +[2023-10-08 15:12:03,633][102897] Updated weights for policy 0, policy_version 85960 (0.0011) +[2023-10-08 15:12:04,007][102897] Updated weights for policy 0, policy_version 85970 (0.0007) +[2023-10-08 15:12:04,379][102897] Updated weights for policy 0, policy_version 85980 (0.0009) +[2023-10-08 15:12:06,100][102898] Updated weights for policy 1, policy_version 86090 (0.0009) +[2023-10-08 15:12:06,470][102898] Updated weights for policy 1, policy_version 86100 (0.0008) +[2023-10-08 15:12:06,852][102898] Updated weights for policy 1, policy_version 86110 (0.0009) +[2023-10-08 15:12:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176193536. Throughput: 0: 1815.5, 1: 1785.6. Samples: 44057306. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:12:06,875][101941] Avg episode reward: [(0, '8.170'), (1, '14.720')] +[2023-10-08 15:12:08,123][102897] Updated weights for policy 0, policy_version 85990 (0.0008) +[2023-10-08 15:12:08,492][102897] Updated weights for policy 0, policy_version 86000 (0.0008) +[2023-10-08 15:12:08,862][102897] Updated weights for policy 0, policy_version 86010 (0.0008) +[2023-10-08 15:12:10,496][102898] Updated weights for policy 1, policy_version 86120 (0.0010) +[2023-10-08 15:12:10,869][102898] Updated weights for policy 1, policy_version 86130 (0.0011) +[2023-10-08 15:12:11,236][102898] Updated weights for policy 1, policy_version 86140 (0.0007) +[2023-10-08 15:12:11,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 176291840. Throughput: 0: 1810.0, 1: 1809.4. Samples: 44079272. Policy #0 lag: (min: 31.0, avg: 34.8, max: 63.0) +[2023-10-08 15:12:11,876][101941] Avg episode reward: [(0, '8.020'), (1, '14.870')] +[2023-10-08 15:12:11,877][102760] Saving new best policy, reward=14.870! +[2023-10-08 15:12:12,717][102897] Updated weights for policy 0, policy_version 86020 (0.0008) +[2023-10-08 15:12:13,080][102897] Updated weights for policy 0, policy_version 86030 (0.0009) +[2023-10-08 15:12:13,453][102897] Updated weights for policy 0, policy_version 86040 (0.0010) +[2023-10-08 15:12:14,839][102898] Updated weights for policy 1, policy_version 86150 (0.0007) +[2023-10-08 15:12:15,202][102898] Updated weights for policy 1, policy_version 86160 (0.0008) +[2023-10-08 15:12:15,575][102898] Updated weights for policy 1, policy_version 86170 (0.0008) +[2023-10-08 15:12:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176357376. Throughput: 0: 1803.0, 1: 1803.9. Samples: 44100692. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:16,876][101941] Avg episode reward: [(0, '8.180'), (1, '15.310')] +[2023-10-08 15:12:16,888][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000086048_88113152.pth... +[2023-10-08 15:12:16,889][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000086176_88244224.pth... +[2023-10-08 15:12:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000084480_86507520.pth +[2023-10-08 15:12:16,926][102760] Saving new best policy, reward=15.310! +[2023-10-08 15:12:16,928][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000084384_86409216.pth +[2023-10-08 15:12:17,202][102897] Updated weights for policy 0, policy_version 86050 (0.0008) +[2023-10-08 15:12:17,572][102897] Updated weights for policy 0, policy_version 86060 (0.0010) +[2023-10-08 15:12:17,939][102897] Updated weights for policy 0, policy_version 86070 (0.0008) +[2023-10-08 15:12:18,307][102897] Updated weights for policy 0, policy_version 86080 (0.0008) +[2023-10-08 15:12:19,337][102898] Updated weights for policy 1, policy_version 86180 (0.0007) +[2023-10-08 15:12:19,710][102898] Updated weights for policy 1, policy_version 86190 (0.0010) +[2023-10-08 15:12:20,079][102898] Updated weights for policy 1, policy_version 86200 (0.0009) +[2023-10-08 15:12:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176422912. Throughput: 0: 1802.5, 1: 1809.7. Samples: 44111524. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:21,876][101941] Avg episode reward: [(0, '8.740'), (1, '14.140')] +[2023-10-08 15:12:22,018][102897] Updated weights for policy 0, policy_version 86090 (0.0007) +[2023-10-08 15:12:22,381][102897] Updated weights for policy 0, policy_version 86100 (0.0009) +[2023-10-08 15:12:22,757][102897] Updated weights for policy 0, policy_version 86110 (0.0007) +[2023-10-08 15:12:23,757][102898] Updated weights for policy 1, policy_version 86210 (0.0009) +[2023-10-08 15:12:24,125][102898] Updated weights for policy 1, policy_version 86220 (0.0009) +[2023-10-08 15:12:24,494][102898] Updated weights for policy 1, policy_version 86230 (0.0009) +[2023-10-08 15:12:24,862][102898] Updated weights for policy 1, policy_version 86240 (0.0008) +[2023-10-08 15:12:26,523][102897] Updated weights for policy 0, policy_version 86120 (0.0007) +[2023-10-08 15:12:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176488448. Throughput: 0: 1793.8, 1: 1792.9. Samples: 44132996. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:26,875][101941] Avg episode reward: [(0, '8.930'), (1, '13.880')] +[2023-10-08 15:12:26,896][102897] Updated weights for policy 0, policy_version 86130 (0.0008) +[2023-10-08 15:12:27,264][102897] Updated weights for policy 0, policy_version 86140 (0.0007) +[2023-10-08 15:12:28,650][102898] Updated weights for policy 1, policy_version 86250 (0.0008) +[2023-10-08 15:12:29,024][102898] Updated weights for policy 1, policy_version 86260 (0.0009) +[2023-10-08 15:12:29,388][102898] Updated weights for policy 1, policy_version 86270 (0.0007) +[2023-10-08 15:12:30,978][102897] Updated weights for policy 0, policy_version 86150 (0.0008) +[2023-10-08 15:12:31,345][102897] Updated weights for policy 0, policy_version 86160 (0.0009) +[2023-10-08 15:12:31,707][102897] Updated weights for policy 0, policy_version 86170 (0.0011) +[2023-10-08 15:12:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176553984. Throughput: 0: 1809.7, 1: 1790.1. Samples: 44154570. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:31,875][101941] Avg episode reward: [(0, '9.500'), (1, '12.170')] +[2023-10-08 15:12:33,325][102898] Updated weights for policy 1, policy_version 86280 (0.0007) +[2023-10-08 15:12:33,697][102898] Updated weights for policy 1, policy_version 86290 (0.0010) +[2023-10-08 15:12:34,047][102898] Updated weights for policy 1, policy_version 86300 (0.0009) +[2023-10-08 15:12:35,302][102897] Updated weights for policy 0, policy_version 86180 (0.0009) +[2023-10-08 15:12:35,665][102897] Updated weights for policy 0, policy_version 86190 (0.0009) +[2023-10-08 15:12:36,040][102897] Updated weights for policy 0, policy_version 86200 (0.0007) +[2023-10-08 15:12:36,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 176652288. Throughput: 0: 1797.5, 1: 1791.1. Samples: 44165182. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:36,876][101941] Avg episode reward: [(0, '8.300'), (1, '14.030')] +[2023-10-08 15:12:37,794][102898] Updated weights for policy 1, policy_version 86310 (0.0009) +[2023-10-08 15:12:38,164][102898] Updated weights for policy 1, policy_version 86320 (0.0009) +[2023-10-08 15:12:38,526][102898] Updated weights for policy 1, policy_version 86330 (0.0007) +[2023-10-08 15:12:39,679][102897] Updated weights for policy 0, policy_version 86210 (0.0009) +[2023-10-08 15:12:40,041][102897] Updated weights for policy 0, policy_version 86220 (0.0009) +[2023-10-08 15:12:40,405][102897] Updated weights for policy 0, policy_version 86230 (0.0008) +[2023-10-08 15:12:40,774][102897] Updated weights for policy 0, policy_version 86240 (0.0011) +[2023-10-08 15:12:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 176717824. Throughput: 0: 1806.2, 1: 1791.9. Samples: 44186868. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:41,876][101941] Avg episode reward: [(0, '8.150'), (1, '14.330')] +[2023-10-08 15:12:42,365][102898] Updated weights for policy 1, policy_version 86340 (0.0008) +[2023-10-08 15:12:42,739][102898] Updated weights for policy 1, policy_version 86350 (0.0009) +[2023-10-08 15:12:43,107][102898] Updated weights for policy 1, policy_version 86360 (0.0008) +[2023-10-08 15:12:44,569][102897] Updated weights for policy 0, policy_version 86250 (0.0009) +[2023-10-08 15:12:44,943][102897] Updated weights for policy 0, policy_version 86260 (0.0008) +[2023-10-08 15:12:45,305][102897] Updated weights for policy 0, policy_version 86270 (0.0007) +[2023-10-08 15:12:46,765][102898] Updated weights for policy 1, policy_version 86370 (0.0008) +[2023-10-08 15:12:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 176783360. Throughput: 0: 1795.7, 1: 1803.2. Samples: 44208704. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:46,876][101941] Avg episode reward: [(0, '8.940'), (1, '15.460')] +[2023-10-08 15:12:47,137][102898] Updated weights for policy 1, policy_version 86380 (0.0008) +[2023-10-08 15:12:47,510][102898] Updated weights for policy 1, policy_version 86390 (0.0008) +[2023-10-08 15:12:47,874][102760] Saving new best policy, reward=15.460! +[2023-10-08 15:12:47,876][102898] Updated weights for policy 1, policy_version 86400 (0.0009) +[2023-10-08 15:12:49,036][102897] Updated weights for policy 0, policy_version 86280 (0.0010) +[2023-10-08 15:12:49,413][102897] Updated weights for policy 0, policy_version 86290 (0.0008) +[2023-10-08 15:12:49,778][102897] Updated weights for policy 0, policy_version 86300 (0.0008) +[2023-10-08 15:12:51,820][102898] Updated weights for policy 1, policy_version 86410 (0.0009) +[2023-10-08 15:12:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 176848896. Throughput: 0: 1806.0, 1: 1790.2. Samples: 44219138. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:51,876][101941] Avg episode reward: [(0, '9.070'), (1, '14.860')] +[2023-10-08 15:12:52,188][102898] Updated weights for policy 1, policy_version 86420 (0.0007) +[2023-10-08 15:12:52,554][102898] Updated weights for policy 1, policy_version 86430 (0.0008) +[2023-10-08 15:12:53,603][102897] Updated weights for policy 0, policy_version 86310 (0.0007) +[2023-10-08 15:12:53,971][102897] Updated weights for policy 0, policy_version 86320 (0.0007) +[2023-10-08 15:12:54,344][102897] Updated weights for policy 0, policy_version 86330 (0.0011) +[2023-10-08 15:12:56,060][102898] Updated weights for policy 1, policy_version 86440 (0.0008) +[2023-10-08 15:12:56,429][102898] Updated weights for policy 1, policy_version 86450 (0.0009) +[2023-10-08 15:12:56,792][102898] Updated weights for policy 1, policy_version 86460 (0.0011) +[2023-10-08 15:12:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 176914432. Throughput: 0: 1797.1, 1: 1796.5. Samples: 44240986. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:12:56,876][101941] Avg episode reward: [(0, '9.360'), (1, '13.830')] +[2023-10-08 15:12:58,012][102897] Updated weights for policy 0, policy_version 86340 (0.0009) +[2023-10-08 15:12:58,380][102897] Updated weights for policy 0, policy_version 86350 (0.0009) +[2023-10-08 15:12:58,761][102897] Updated weights for policy 0, policy_version 86360 (0.0009) +[2023-10-08 15:13:00,513][102898] Updated weights for policy 1, policy_version 86470 (0.0009) +[2023-10-08 15:13:00,885][102898] Updated weights for policy 1, policy_version 86480 (0.0007) +[2023-10-08 15:13:01,247][102898] Updated weights for policy 1, policy_version 86490 (0.0007) +[2023-10-08 15:13:01,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 177012736. Throughput: 0: 1800.3, 1: 1784.5. Samples: 44262010. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:13:01,876][101941] Avg episode reward: [(0, '8.820'), (1, '14.480')] +[2023-10-08 15:13:02,461][102897] Updated weights for policy 0, policy_version 86370 (0.0010) +[2023-10-08 15:13:02,835][102897] Updated weights for policy 0, policy_version 86380 (0.0009) +[2023-10-08 15:13:03,198][102897] Updated weights for policy 0, policy_version 86390 (0.0009) +[2023-10-08 15:13:03,568][102897] Updated weights for policy 0, policy_version 86400 (0.0009) +[2023-10-08 15:13:05,105][102898] Updated weights for policy 1, policy_version 86500 (0.0008) +[2023-10-08 15:13:05,481][102898] Updated weights for policy 1, policy_version 86510 (0.0010) +[2023-10-08 15:13:05,845][102898] Updated weights for policy 1, policy_version 86520 (0.0007) +[2023-10-08 15:13:06,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 177078272. Throughput: 0: 1799.0, 1: 1791.4. Samples: 44273094. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:13:06,876][101941] Avg episode reward: [(0, '8.120'), (1, '13.290')] +[2023-10-08 15:13:07,384][102897] Updated weights for policy 0, policy_version 86410 (0.0011) +[2023-10-08 15:13:07,752][102897] Updated weights for policy 0, policy_version 86420 (0.0010) +[2023-10-08 15:13:08,128][102897] Updated weights for policy 0, policy_version 86430 (0.0011) +[2023-10-08 15:13:09,560][102898] Updated weights for policy 1, policy_version 86530 (0.0007) +[2023-10-08 15:13:09,937][102898] Updated weights for policy 1, policy_version 86540 (0.0008) +[2023-10-08 15:13:10,292][102898] Updated weights for policy 1, policy_version 86550 (0.0007) +[2023-10-08 15:13:10,660][102898] Updated weights for policy 1, policy_version 86560 (0.0008) +[2023-10-08 15:13:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177143808. Throughput: 0: 1797.5, 1: 1789.6. Samples: 44294414. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:11,876][101941] Avg episode reward: [(0, '8.250'), (1, '14.070')] +[2023-10-08 15:13:11,905][102897] Updated weights for policy 0, policy_version 86440 (0.0011) +[2023-10-08 15:13:12,267][102897] Updated weights for policy 0, policy_version 86450 (0.0009) +[2023-10-08 15:13:12,639][102897] Updated weights for policy 0, policy_version 86460 (0.0009) +[2023-10-08 15:13:14,298][102898] Updated weights for policy 1, policy_version 86570 (0.0009) +[2023-10-08 15:13:14,667][102898] Updated weights for policy 1, policy_version 86580 (0.0007) +[2023-10-08 15:13:15,027][102898] Updated weights for policy 1, policy_version 86590 (0.0008) +[2023-10-08 15:13:16,366][102897] Updated weights for policy 0, policy_version 86470 (0.0008) +[2023-10-08 15:13:16,747][102897] Updated weights for policy 0, policy_version 86480 (0.0008) +[2023-10-08 15:13:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177209344. Throughput: 0: 1805.5, 1: 1791.6. Samples: 44316440. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:16,876][101941] Avg episode reward: [(0, '8.260'), (1, '14.430')] +[2023-10-08 15:13:17,109][102897] Updated weights for policy 0, policy_version 86490 (0.0008) +[2023-10-08 15:13:18,903][102898] Updated weights for policy 1, policy_version 86600 (0.0007) +[2023-10-08 15:13:19,268][102898] Updated weights for policy 1, policy_version 86610 (0.0007) +[2023-10-08 15:13:19,632][102898] Updated weights for policy 1, policy_version 86620 (0.0007) +[2023-10-08 15:13:20,963][102897] Updated weights for policy 0, policy_version 86500 (0.0008) +[2023-10-08 15:13:21,329][102897] Updated weights for policy 0, policy_version 86510 (0.0008) +[2023-10-08 15:13:21,694][102897] Updated weights for policy 0, policy_version 86520 (0.0008) +[2023-10-08 15:13:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177274880. Throughput: 0: 1786.4, 1: 1803.5. Samples: 44326726. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:21,876][101941] Avg episode reward: [(0, '9.050'), (1, '15.380')] +[2023-10-08 15:13:23,413][102898] Updated weights for policy 1, policy_version 86630 (0.0008) +[2023-10-08 15:13:23,774][102898] Updated weights for policy 1, policy_version 86640 (0.0008) +[2023-10-08 15:13:24,145][102898] Updated weights for policy 1, policy_version 86650 (0.0007) +[2023-10-08 15:13:25,462][102897] Updated weights for policy 0, policy_version 86530 (0.0007) +[2023-10-08 15:13:25,834][102897] Updated weights for policy 0, policy_version 86540 (0.0008) +[2023-10-08 15:13:26,200][102897] Updated weights for policy 0, policy_version 86550 (0.0007) +[2023-10-08 15:13:26,570][102897] Updated weights for policy 0, policy_version 86560 (0.0009) +[2023-10-08 15:13:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 177373184. Throughput: 0: 1800.9, 1: 1791.8. Samples: 44348540. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:26,875][101941] Avg episode reward: [(0, '8.400'), (1, '15.040')] +[2023-10-08 15:13:27,749][102898] Updated weights for policy 1, policy_version 86660 (0.0009) +[2023-10-08 15:13:28,122][102898] Updated weights for policy 1, policy_version 86670 (0.0008) +[2023-10-08 15:13:28,483][102898] Updated weights for policy 1, policy_version 86680 (0.0009) +[2023-10-08 15:13:30,325][102897] Updated weights for policy 0, policy_version 86570 (0.0010) +[2023-10-08 15:13:30,694][102897] Updated weights for policy 0, policy_version 86580 (0.0011) +[2023-10-08 15:13:31,067][102897] Updated weights for policy 0, policy_version 86590 (0.0009) +[2023-10-08 15:13:31,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 177438720. Throughput: 0: 1782.4, 1: 1796.8. Samples: 44369766. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:31,876][101941] Avg episode reward: [(0, '8.260'), (1, '14.250')] +[2023-10-08 15:13:32,279][102898] Updated weights for policy 1, policy_version 86690 (0.0009) +[2023-10-08 15:13:32,635][102898] Updated weights for policy 1, policy_version 86700 (0.0009) +[2023-10-08 15:13:33,006][102898] Updated weights for policy 1, policy_version 86710 (0.0008) +[2023-10-08 15:13:33,363][102898] Updated weights for policy 1, policy_version 86720 (0.0009) +[2023-10-08 15:13:34,736][102897] Updated weights for policy 0, policy_version 86600 (0.0007) +[2023-10-08 15:13:35,111][102897] Updated weights for policy 0, policy_version 86610 (0.0008) +[2023-10-08 15:13:35,473][102897] Updated weights for policy 0, policy_version 86620 (0.0008) +[2023-10-08 15:13:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177504256. Throughput: 0: 1804.9, 1: 1795.6. Samples: 44381158. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:36,876][101941] Avg episode reward: [(0, '8.950'), (1, '14.650')] +[2023-10-08 15:13:37,154][102898] Updated weights for policy 1, policy_version 86730 (0.0008) +[2023-10-08 15:13:37,530][102898] Updated weights for policy 1, policy_version 86740 (0.0009) +[2023-10-08 15:13:37,885][102898] Updated weights for policy 1, policy_version 86750 (0.0008) +[2023-10-08 15:13:39,146][102897] Updated weights for policy 0, policy_version 86630 (0.0007) +[2023-10-08 15:13:39,510][102897] Updated weights for policy 0, policy_version 86640 (0.0007) +[2023-10-08 15:13:39,882][102897] Updated weights for policy 0, policy_version 86650 (0.0007) +[2023-10-08 15:13:41,624][102898] Updated weights for policy 1, policy_version 86760 (0.0009) +[2023-10-08 15:13:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177569792. Throughput: 0: 1790.7, 1: 1793.5. Samples: 44402272. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:41,876][101941] Avg episode reward: [(0, '9.210'), (1, '14.840')] +[2023-10-08 15:13:41,982][102898] Updated weights for policy 1, policy_version 86770 (0.0010) +[2023-10-08 15:13:42,352][102898] Updated weights for policy 1, policy_version 86780 (0.0010) +[2023-10-08 15:13:43,704][102897] Updated weights for policy 0, policy_version 86660 (0.0010) +[2023-10-08 15:13:44,077][102897] Updated weights for policy 0, policy_version 86670 (0.0007) +[2023-10-08 15:13:44,441][102897] Updated weights for policy 0, policy_version 86680 (0.0007) +[2023-10-08 15:13:46,202][102898] Updated weights for policy 1, policy_version 86790 (0.0009) +[2023-10-08 15:13:46,568][102898] Updated weights for policy 1, policy_version 86800 (0.0009) +[2023-10-08 15:13:46,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177635328. Throughput: 0: 1797.1, 1: 1810.5. Samples: 44424350. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:46,875][101941] Avg episode reward: [(0, '9.320'), (1, '13.400')] +[2023-10-08 15:13:46,938][102898] Updated weights for policy 1, policy_version 86810 (0.0008) +[2023-10-08 15:13:48,242][102897] Updated weights for policy 0, policy_version 86690 (0.0008) +[2023-10-08 15:13:48,616][102897] Updated weights for policy 0, policy_version 86700 (0.0008) +[2023-10-08 15:13:48,987][102897] Updated weights for policy 0, policy_version 86710 (0.0007) +[2023-10-08 15:13:49,353][102897] Updated weights for policy 0, policy_version 86720 (0.0010) +[2023-10-08 15:13:50,845][102898] Updated weights for policy 1, policy_version 86820 (0.0007) +[2023-10-08 15:13:51,207][102898] Updated weights for policy 1, policy_version 86830 (0.0007) +[2023-10-08 15:13:51,571][102898] Updated weights for policy 1, policy_version 86840 (0.0007) +[2023-10-08 15:13:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 177733632. Throughput: 0: 1799.9, 1: 1789.7. Samples: 44434628. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:51,876][101941] Avg episode reward: [(0, '9.370'), (1, '13.200')] +[2023-10-08 15:13:53,028][102897] Updated weights for policy 0, policy_version 86730 (0.0008) +[2023-10-08 15:13:53,396][102897] Updated weights for policy 0, policy_version 86740 (0.0008) +[2023-10-08 15:13:53,769][102897] Updated weights for policy 0, policy_version 86750 (0.0008) +[2023-10-08 15:13:55,335][102898] Updated weights for policy 1, policy_version 86850 (0.0008) +[2023-10-08 15:13:55,695][102898] Updated weights for policy 1, policy_version 86860 (0.0010) +[2023-10-08 15:13:56,067][102898] Updated weights for policy 1, policy_version 86870 (0.0010) +[2023-10-08 15:13:56,431][102898] Updated weights for policy 1, policy_version 86880 (0.0010) +[2023-10-08 15:13:56,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 177799168. Throughput: 0: 1795.8, 1: 1804.6. Samples: 44456430. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:13:56,876][101941] Avg episode reward: [(0, '9.030'), (1, '13.100')] +[2023-10-08 15:13:57,393][102897] Updated weights for policy 0, policy_version 86760 (0.0007) +[2023-10-08 15:13:57,757][102897] Updated weights for policy 0, policy_version 86770 (0.0007) +[2023-10-08 15:13:58,124][102897] Updated weights for policy 0, policy_version 86780 (0.0007) +[2023-10-08 15:14:00,075][102898] Updated weights for policy 1, policy_version 86890 (0.0009) +[2023-10-08 15:14:00,440][102898] Updated weights for policy 1, policy_version 86900 (0.0008) +[2023-10-08 15:14:00,803][102898] Updated weights for policy 1, policy_version 86910 (0.0008) +[2023-10-08 15:14:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177864704. Throughput: 0: 1796.0, 1: 1782.6. Samples: 44477474. Policy #0 lag: (min: 29.0, avg: 31.5, max: 61.0) +[2023-10-08 15:14:01,876][101941] Avg episode reward: [(0, '8.460'), (1, '14.090')] +[2023-10-08 15:14:02,000][102897] Updated weights for policy 0, policy_version 86790 (0.0009) +[2023-10-08 15:14:02,365][102897] Updated weights for policy 0, policy_version 86800 (0.0008) +[2023-10-08 15:14:02,736][102897] Updated weights for policy 0, policy_version 86810 (0.0009) +[2023-10-08 15:14:04,726][102898] Updated weights for policy 1, policy_version 86920 (0.0008) +[2023-10-08 15:14:05,097][102898] Updated weights for policy 1, policy_version 86930 (0.0008) +[2023-10-08 15:14:05,469][102898] Updated weights for policy 1, policy_version 86940 (0.0009) +[2023-10-08 15:14:06,434][102897] Updated weights for policy 0, policy_version 86820 (0.0007) +[2023-10-08 15:14:06,807][102897] Updated weights for policy 0, policy_version 86830 (0.0007) +[2023-10-08 15:14:06,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177930240. Throughput: 0: 1795.8, 1: 1803.8. Samples: 44488706. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:06,876][101941] Avg episode reward: [(0, '8.780'), (1, '13.950')] +[2023-10-08 15:14:07,186][102897] Updated weights for policy 0, policy_version 86840 (0.0007) +[2023-10-08 15:14:09,030][102898] Updated weights for policy 1, policy_version 86950 (0.0010) +[2023-10-08 15:14:09,394][102898] Updated weights for policy 1, policy_version 86960 (0.0009) +[2023-10-08 15:14:09,763][102898] Updated weights for policy 1, policy_version 86970 (0.0007) +[2023-10-08 15:14:11,010][102897] Updated weights for policy 0, policy_version 86850 (0.0007) +[2023-10-08 15:14:11,381][102897] Updated weights for policy 0, policy_version 86860 (0.0008) +[2023-10-08 15:14:11,747][102897] Updated weights for policy 0, policy_version 86870 (0.0008) +[2023-10-08 15:14:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 177995776. Throughput: 0: 1803.4, 1: 1784.8. Samples: 44510012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:11,876][101941] Avg episode reward: [(0, '9.070'), (1, '13.900')] +[2023-10-08 15:14:12,114][102897] Updated weights for policy 0, policy_version 86880 (0.0007) +[2023-10-08 15:14:13,507][102898] Updated weights for policy 1, policy_version 86980 (0.0007) +[2023-10-08 15:14:13,869][102898] Updated weights for policy 1, policy_version 86990 (0.0010) +[2023-10-08 15:14:14,233][102898] Updated weights for policy 1, policy_version 87000 (0.0010) +[2023-10-08 15:14:15,887][102897] Updated weights for policy 0, policy_version 86890 (0.0007) +[2023-10-08 15:14:16,269][102897] Updated weights for policy 0, policy_version 86900 (0.0008) +[2023-10-08 15:14:16,643][102897] Updated weights for policy 0, policy_version 86910 (0.0009) +[2023-10-08 15:14:16,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 178094080. Throughput: 0: 1815.3, 1: 1785.1. Samples: 44531780. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:16,876][101941] Avg episode reward: [(0, '8.930'), (1, '14.460')] +[2023-10-08 15:14:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000086912_88997888.pth... +[2023-10-08 15:14:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000087008_89096192.pth... +[2023-10-08 15:14:16,915][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000085344_87392256.pth +[2023-10-08 15:14:16,923][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000085216_87261184.pth +[2023-10-08 15:14:17,923][102898] Updated weights for policy 1, policy_version 87010 (0.0009) +[2023-10-08 15:14:18,296][102898] Updated weights for policy 1, policy_version 87020 (0.0007) +[2023-10-08 15:14:18,654][102898] Updated weights for policy 1, policy_version 87030 (0.0007) +[2023-10-08 15:14:19,028][102898] Updated weights for policy 1, policy_version 87040 (0.0011) +[2023-10-08 15:14:20,240][102897] Updated weights for policy 0, policy_version 86920 (0.0008) +[2023-10-08 15:14:20,612][102897] Updated weights for policy 0, policy_version 86930 (0.0007) +[2023-10-08 15:14:20,981][102897] Updated weights for policy 0, policy_version 86940 (0.0007) +[2023-10-08 15:14:21,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 178159616. Throughput: 0: 1802.9, 1: 1785.8. Samples: 44542650. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:21,876][101941] Avg episode reward: [(0, '9.380'), (1, '12.960')] +[2023-10-08 15:14:22,859][102898] Updated weights for policy 1, policy_version 87050 (0.0009) +[2023-10-08 15:14:23,230][102898] Updated weights for policy 1, policy_version 87060 (0.0007) +[2023-10-08 15:14:23,602][102898] Updated weights for policy 1, policy_version 87070 (0.0007) +[2023-10-08 15:14:24,802][102897] Updated weights for policy 0, policy_version 86950 (0.0009) +[2023-10-08 15:14:25,172][102897] Updated weights for policy 0, policy_version 86960 (0.0008) +[2023-10-08 15:14:25,547][102897] Updated weights for policy 0, policy_version 86970 (0.0007) +[2023-10-08 15:14:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 178225152. Throughput: 0: 1808.3, 1: 1785.8. Samples: 44564004. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:26,876][101941] Avg episode reward: [(0, '9.180'), (1, '14.270')] +[2023-10-08 15:14:27,445][102898] Updated weights for policy 1, policy_version 87080 (0.0008) +[2023-10-08 15:14:27,816][102898] Updated weights for policy 1, policy_version 87090 (0.0007) +[2023-10-08 15:14:28,188][102898] Updated weights for policy 1, policy_version 87100 (0.0009) +[2023-10-08 15:14:29,291][102897] Updated weights for policy 0, policy_version 86980 (0.0010) +[2023-10-08 15:14:29,665][102897] Updated weights for policy 0, policy_version 86990 (0.0007) +[2023-10-08 15:14:30,049][102897] Updated weights for policy 0, policy_version 87000 (0.0008) +[2023-10-08 15:14:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 178290688. Throughput: 0: 1787.9, 1: 1799.4. Samples: 44585778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:31,876][101941] Avg episode reward: [(0, '8.970'), (1, '14.050')] +[2023-10-08 15:14:31,892][102898] Updated weights for policy 1, policy_version 87110 (0.0010) +[2023-10-08 15:14:32,254][102898] Updated weights for policy 1, policy_version 87120 (0.0009) +[2023-10-08 15:14:32,620][102898] Updated weights for policy 1, policy_version 87130 (0.0008) +[2023-10-08 15:14:33,775][102897] Updated weights for policy 0, policy_version 87010 (0.0008) +[2023-10-08 15:14:34,146][102897] Updated weights for policy 0, policy_version 87020 (0.0008) +[2023-10-08 15:14:34,522][102897] Updated weights for policy 0, policy_version 87030 (0.0007) +[2023-10-08 15:14:34,887][102897] Updated weights for policy 0, policy_version 87040 (0.0009) +[2023-10-08 15:14:36,394][102898] Updated weights for policy 1, policy_version 87140 (0.0007) +[2023-10-08 15:14:36,766][102898] Updated weights for policy 1, policy_version 87150 (0.0008) +[2023-10-08 15:14:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 178356224. Throughput: 0: 1801.5, 1: 1788.6. Samples: 44596184. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:36,876][101941] Avg episode reward: [(0, '8.880'), (1, '13.740')] +[2023-10-08 15:14:37,120][102898] Updated weights for policy 1, policy_version 87160 (0.0008) +[2023-10-08 15:14:38,669][102897] Updated weights for policy 0, policy_version 87050 (0.0007) +[2023-10-08 15:14:39,034][102897] Updated weights for policy 0, policy_version 87060 (0.0009) +[2023-10-08 15:14:39,409][102897] Updated weights for policy 0, policy_version 87070 (0.0008) +[2023-10-08 15:14:40,822][102898] Updated weights for policy 1, policy_version 87170 (0.0009) +[2023-10-08 15:14:41,185][102898] Updated weights for policy 1, policy_version 87180 (0.0010) +[2023-10-08 15:14:41,555][102898] Updated weights for policy 1, policy_version 87190 (0.0008) +[2023-10-08 15:14:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 178421760. Throughput: 0: 1788.1, 1: 1798.9. Samples: 44617848. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:41,876][101941] Avg episode reward: [(0, '8.470'), (1, '13.450')] +[2023-10-08 15:14:41,920][102898] Updated weights for policy 1, policy_version 87200 (0.0008) +[2023-10-08 15:14:43,271][102897] Updated weights for policy 0, policy_version 87080 (0.0008) +[2023-10-08 15:14:43,635][102897] Updated weights for policy 0, policy_version 87090 (0.0011) +[2023-10-08 15:14:44,011][102897] Updated weights for policy 0, policy_version 87100 (0.0009) +[2023-10-08 15:14:45,679][102898] Updated weights for policy 1, policy_version 87210 (0.0009) +[2023-10-08 15:14:46,048][102898] Updated weights for policy 1, policy_version 87220 (0.0007) +[2023-10-08 15:14:46,411][102898] Updated weights for policy 1, policy_version 87230 (0.0007) +[2023-10-08 15:14:46,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 178520064. Throughput: 0: 1793.1, 1: 1794.5. Samples: 44638916. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:46,876][101941] Avg episode reward: [(0, '9.180'), (1, '14.170')] +[2023-10-08 15:14:47,637][102897] Updated weights for policy 0, policy_version 87110 (0.0010) +[2023-10-08 15:14:48,006][102897] Updated weights for policy 0, policy_version 87120 (0.0008) +[2023-10-08 15:14:48,373][102897] Updated weights for policy 0, policy_version 87130 (0.0007) +[2023-10-08 15:14:50,227][102898] Updated weights for policy 1, policy_version 87240 (0.0010) +[2023-10-08 15:14:50,593][102898] Updated weights for policy 1, policy_version 87250 (0.0007) +[2023-10-08 15:14:50,956][102898] Updated weights for policy 1, policy_version 87260 (0.0009) +[2023-10-08 15:14:51,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 178585600. Throughput: 0: 1789.3, 1: 1794.1. Samples: 44649960. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:51,875][101941] Avg episode reward: [(0, '8.900'), (1, '13.360')] +[2023-10-08 15:14:52,160][102897] Updated weights for policy 0, policy_version 87140 (0.0009) +[2023-10-08 15:14:52,533][102897] Updated weights for policy 0, policy_version 87150 (0.0008) +[2023-10-08 15:14:52,902][102897] Updated weights for policy 0, policy_version 87160 (0.0008) +[2023-10-08 15:14:54,694][102898] Updated weights for policy 1, policy_version 87270 (0.0008) +[2023-10-08 15:14:55,057][102898] Updated weights for policy 1, policy_version 87280 (0.0007) +[2023-10-08 15:14:55,429][102898] Updated weights for policy 1, policy_version 87290 (0.0007) +[2023-10-08 15:14:56,757][102897] Updated weights for policy 0, policy_version 87170 (0.0008) +[2023-10-08 15:14:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 178651136. Throughput: 0: 1785.2, 1: 1796.6. Samples: 44671194. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:14:56,876][101941] Avg episode reward: [(0, '8.530'), (1, '14.130')] +[2023-10-08 15:14:57,120][102897] Updated weights for policy 0, policy_version 87180 (0.0009) +[2023-10-08 15:14:57,497][102897] Updated weights for policy 0, policy_version 87190 (0.0010) +[2023-10-08 15:14:57,868][102897] Updated weights for policy 0, policy_version 87200 (0.0009) +[2023-10-08 15:14:59,241][102898] Updated weights for policy 1, policy_version 87300 (0.0009) +[2023-10-08 15:14:59,607][102898] Updated weights for policy 1, policy_version 87310 (0.0010) +[2023-10-08 15:14:59,967][102898] Updated weights for policy 1, policy_version 87320 (0.0007) +[2023-10-08 15:15:01,543][102897] Updated weights for policy 0, policy_version 87210 (0.0009) +[2023-10-08 15:15:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 178716672. Throughput: 0: 1800.6, 1: 1787.4. Samples: 44693242. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:01,876][101941] Avg episode reward: [(0, '7.890'), (1, '15.150')] +[2023-10-08 15:15:01,922][102897] Updated weights for policy 0, policy_version 87220 (0.0011) +[2023-10-08 15:15:02,287][102897] Updated weights for policy 0, policy_version 87230 (0.0009) +[2023-10-08 15:15:03,760][102898] Updated weights for policy 1, policy_version 87330 (0.0010) +[2023-10-08 15:15:04,125][102898] Updated weights for policy 1, policy_version 87340 (0.0011) +[2023-10-08 15:15:04,483][102898] Updated weights for policy 1, policy_version 87350 (0.0010) +[2023-10-08 15:15:04,852][102898] Updated weights for policy 1, policy_version 87360 (0.0009) +[2023-10-08 15:15:06,064][102897] Updated weights for policy 0, policy_version 87240 (0.0011) +[2023-10-08 15:15:06,425][102897] Updated weights for policy 0, policy_version 87250 (0.0008) +[2023-10-08 15:15:06,791][102897] Updated weights for policy 0, policy_version 87260 (0.0007) +[2023-10-08 15:15:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 178782208. Throughput: 0: 1780.6, 1: 1798.5. Samples: 44703710. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:06,875][101941] Avg episode reward: [(0, '8.410'), (1, '14.540')] +[2023-10-08 15:15:08,481][102898] Updated weights for policy 1, policy_version 87370 (0.0008) +[2023-10-08 15:15:08,853][102898] Updated weights for policy 1, policy_version 87380 (0.0008) +[2023-10-08 15:15:09,211][102898] Updated weights for policy 1, policy_version 87390 (0.0009) +[2023-10-08 15:15:10,275][102897] Updated weights for policy 0, policy_version 87270 (0.0008) +[2023-10-08 15:15:10,643][102897] Updated weights for policy 0, policy_version 87280 (0.0008) +[2023-10-08 15:15:11,022][102897] Updated weights for policy 0, policy_version 87290 (0.0008) +[2023-10-08 15:15:11,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 178880512. Throughput: 0: 1800.7, 1: 1787.9. Samples: 44725488. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:11,876][101941] Avg episode reward: [(0, '9.080'), (1, '15.680')] +[2023-10-08 15:15:11,877][102760] Saving new best policy, reward=15.680! +[2023-10-08 15:15:13,181][102898] Updated weights for policy 1, policy_version 87400 (0.0007) +[2023-10-08 15:15:13,568][102898] Updated weights for policy 1, policy_version 87410 (0.0009) +[2023-10-08 15:15:13,927][102898] Updated weights for policy 1, policy_version 87420 (0.0009) +[2023-10-08 15:15:14,903][102897] Updated weights for policy 0, policy_version 87300 (0.0007) +[2023-10-08 15:15:15,279][102897] Updated weights for policy 0, policy_version 87310 (0.0008) +[2023-10-08 15:15:15,650][102897] Updated weights for policy 0, policy_version 87320 (0.0010) +[2023-10-08 15:15:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 178946048. Throughput: 0: 1786.5, 1: 1785.6. Samples: 44746526. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:16,876][101941] Avg episode reward: [(0, '9.440'), (1, '14.410')] +[2023-10-08 15:15:17,746][102898] Updated weights for policy 1, policy_version 87430 (0.0009) +[2023-10-08 15:15:18,114][102898] Updated weights for policy 1, policy_version 87440 (0.0008) +[2023-10-08 15:15:18,475][102898] Updated weights for policy 1, policy_version 87450 (0.0009) +[2023-10-08 15:15:19,306][102897] Updated weights for policy 0, policy_version 87330 (0.0007) +[2023-10-08 15:15:19,677][102897] Updated weights for policy 0, policy_version 87340 (0.0008) +[2023-10-08 15:15:20,053][102897] Updated weights for policy 0, policy_version 87350 (0.0009) +[2023-10-08 15:15:20,422][102897] Updated weights for policy 0, policy_version 87360 (0.0009) +[2023-10-08 15:15:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179011584. Throughput: 0: 1803.0, 1: 1784.0. Samples: 44757602. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:21,876][101941] Avg episode reward: [(0, '9.630'), (1, '15.140')] +[2023-10-08 15:15:22,302][102898] Updated weights for policy 1, policy_version 87460 (0.0009) +[2023-10-08 15:15:22,660][102898] Updated weights for policy 1, policy_version 87470 (0.0009) +[2023-10-08 15:15:23,032][102898] Updated weights for policy 1, policy_version 87480 (0.0009) +[2023-10-08 15:15:24,261][102897] Updated weights for policy 0, policy_version 87370 (0.0010) +[2023-10-08 15:15:24,629][102897] Updated weights for policy 0, policy_version 87380 (0.0009) +[2023-10-08 15:15:24,987][102897] Updated weights for policy 0, policy_version 87390 (0.0008) +[2023-10-08 15:15:26,775][102898] Updated weights for policy 1, policy_version 87490 (0.0009) +[2023-10-08 15:15:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179077120. Throughput: 0: 1788.0, 1: 1782.1. Samples: 44778500. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:26,875][101941] Avg episode reward: [(0, '10.010'), (1, '14.330')] +[2023-10-08 15:15:27,140][102898] Updated weights for policy 1, policy_version 87500 (0.0008) +[2023-10-08 15:15:27,512][102898] Updated weights for policy 1, policy_version 87510 (0.0008) +[2023-10-08 15:15:27,871][102898] Updated weights for policy 1, policy_version 87520 (0.0008) +[2023-10-08 15:15:28,762][102897] Updated weights for policy 0, policy_version 87400 (0.0008) +[2023-10-08 15:15:29,136][102897] Updated weights for policy 0, policy_version 87410 (0.0008) +[2023-10-08 15:15:29,509][102897] Updated weights for policy 0, policy_version 87420 (0.0007) +[2023-10-08 15:15:31,550][102898] Updated weights for policy 1, policy_version 87530 (0.0007) +[2023-10-08 15:15:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179142656. Throughput: 0: 1791.2, 1: 1807.6. Samples: 44800860. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:31,876][101941] Avg episode reward: [(0, '9.690'), (1, '13.660')] +[2023-10-08 15:15:31,916][102898] Updated weights for policy 1, policy_version 87540 (0.0007) +[2023-10-08 15:15:32,281][102898] Updated weights for policy 1, policy_version 87550 (0.0007) +[2023-10-08 15:15:33,228][102897] Updated weights for policy 0, policy_version 87430 (0.0008) +[2023-10-08 15:15:33,594][102897] Updated weights for policy 0, policy_version 87440 (0.0007) +[2023-10-08 15:15:33,969][102897] Updated weights for policy 0, policy_version 87450 (0.0007) +[2023-10-08 15:15:35,985][102898] Updated weights for policy 1, policy_version 87560 (0.0008) +[2023-10-08 15:15:36,358][102898] Updated weights for policy 1, policy_version 87570 (0.0010) +[2023-10-08 15:15:36,730][102898] Updated weights for policy 1, policy_version 87580 (0.0008) +[2023-10-08 15:15:36,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 179240960. Throughput: 0: 1797.9, 1: 1785.2. Samples: 44811198. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:36,876][101941] Avg episode reward: [(0, '8.930'), (1, '13.590')] +[2023-10-08 15:15:37,607][102897] Updated weights for policy 0, policy_version 87460 (0.0009) +[2023-10-08 15:15:37,984][102897] Updated weights for policy 0, policy_version 87470 (0.0009) +[2023-10-08 15:15:38,343][102897] Updated weights for policy 0, policy_version 87480 (0.0010) +[2023-10-08 15:15:40,387][102898] Updated weights for policy 1, policy_version 87590 (0.0007) +[2023-10-08 15:15:40,746][102898] Updated weights for policy 1, policy_version 87600 (0.0008) +[2023-10-08 15:15:41,112][102898] Updated weights for policy 1, policy_version 87610 (0.0010) +[2023-10-08 15:15:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 179306496. Throughput: 0: 1800.8, 1: 1806.3. Samples: 44833516. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:41,876][101941] Avg episode reward: [(0, '9.330'), (1, '14.570')] +[2023-10-08 15:15:42,211][102897] Updated weights for policy 0, policy_version 87490 (0.0008) +[2023-10-08 15:15:42,587][102897] Updated weights for policy 0, policy_version 87500 (0.0010) +[2023-10-08 15:15:42,959][102897] Updated weights for policy 0, policy_version 87510 (0.0007) +[2023-10-08 15:15:43,326][102897] Updated weights for policy 0, policy_version 87520 (0.0009) +[2023-10-08 15:15:44,652][102898] Updated weights for policy 1, policy_version 87620 (0.0010) +[2023-10-08 15:15:45,017][102898] Updated weights for policy 1, policy_version 87630 (0.0008) +[2023-10-08 15:15:45,385][102898] Updated weights for policy 1, policy_version 87640 (0.0008) +[2023-10-08 15:15:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 179372032. Throughput: 0: 1802.5, 1: 1793.1. Samples: 44855044. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:46,875][101941] Avg episode reward: [(0, '8.770'), (1, '14.760')] +[2023-10-08 15:15:47,029][102897] Updated weights for policy 0, policy_version 87530 (0.0008) +[2023-10-08 15:15:47,399][102897] Updated weights for policy 0, policy_version 87540 (0.0007) +[2023-10-08 15:15:47,767][102897] Updated weights for policy 0, policy_version 87550 (0.0008) +[2023-10-08 15:15:49,113][102898] Updated weights for policy 1, policy_version 87650 (0.0009) +[2023-10-08 15:15:49,488][102898] Updated weights for policy 1, policy_version 87660 (0.0009) +[2023-10-08 15:15:49,848][102898] Updated weights for policy 1, policy_version 87670 (0.0010) +[2023-10-08 15:15:50,219][102898] Updated weights for policy 1, policy_version 87680 (0.0011) +[2023-10-08 15:15:51,374][102897] Updated weights for policy 0, policy_version 87560 (0.0007) +[2023-10-08 15:15:51,734][102897] Updated weights for policy 0, policy_version 87570 (0.0010) +[2023-10-08 15:15:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 179437568. Throughput: 0: 1795.3, 1: 1806.2. Samples: 44865778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:15:51,876][101941] Avg episode reward: [(0, '8.330'), (1, '13.890')] +[2023-10-08 15:15:52,110][102897] Updated weights for policy 0, policy_version 87580 (0.0007) +[2023-10-08 15:15:54,069][102898] Updated weights for policy 1, policy_version 87690 (0.0008) +[2023-10-08 15:15:54,446][102898] Updated weights for policy 1, policy_version 87700 (0.0009) +[2023-10-08 15:15:54,807][102898] Updated weights for policy 1, policy_version 87710 (0.0010) +[2023-10-08 15:15:55,872][102897] Updated weights for policy 0, policy_version 87590 (0.0009) +[2023-10-08 15:15:56,244][102897] Updated weights for policy 0, policy_version 87600 (0.0007) +[2023-10-08 15:15:56,625][102897] Updated weights for policy 0, policy_version 87610 (0.0007) +[2023-10-08 15:15:56,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 179535872. Throughput: 0: 1805.6, 1: 1791.7. Samples: 44887368. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:15:56,876][101941] Avg episode reward: [(0, '8.320'), (1, '14.300')] +[2023-10-08 15:15:58,724][102898] Updated weights for policy 1, policy_version 87720 (0.0010) +[2023-10-08 15:15:59,109][102898] Updated weights for policy 1, policy_version 87730 (0.0010) +[2023-10-08 15:15:59,471][102898] Updated weights for policy 1, policy_version 87740 (0.0010) +[2023-10-08 15:16:00,364][102897] Updated weights for policy 0, policy_version 87620 (0.0008) +[2023-10-08 15:16:00,730][102897] Updated weights for policy 0, policy_version 87630 (0.0008) +[2023-10-08 15:16:01,100][102897] Updated weights for policy 0, policy_version 87640 (0.0009) +[2023-10-08 15:16:01,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 179601408. Throughput: 0: 1802.6, 1: 1792.8. Samples: 44908318. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:01,875][101941] Avg episode reward: [(0, '9.120'), (1, '15.560')] +[2023-10-08 15:16:03,150][102898] Updated weights for policy 1, policy_version 87750 (0.0009) +[2023-10-08 15:16:03,524][102898] Updated weights for policy 1, policy_version 87760 (0.0009) +[2023-10-08 15:16:03,880][102898] Updated weights for policy 1, policy_version 87770 (0.0007) +[2023-10-08 15:16:04,890][102897] Updated weights for policy 0, policy_version 87650 (0.0007) +[2023-10-08 15:16:05,258][102897] Updated weights for policy 0, policy_version 87660 (0.0008) +[2023-10-08 15:16:05,629][102897] Updated weights for policy 0, policy_version 87670 (0.0008) +[2023-10-08 15:16:05,997][102897] Updated weights for policy 0, policy_version 87680 (0.0007) +[2023-10-08 15:16:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 179666944. Throughput: 0: 1802.2, 1: 1795.8. Samples: 44919514. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:06,876][101941] Avg episode reward: [(0, '9.450'), (1, '16.050')] +[2023-10-08 15:16:06,878][102760] Saving new best policy, reward=16.050! +[2023-10-08 15:16:07,605][102898] Updated weights for policy 1, policy_version 87780 (0.0007) +[2023-10-08 15:16:07,974][102898] Updated weights for policy 1, policy_version 87790 (0.0007) +[2023-10-08 15:16:08,337][102898] Updated weights for policy 1, policy_version 87800 (0.0008) +[2023-10-08 15:16:09,837][102897] Updated weights for policy 0, policy_version 87690 (0.0007) +[2023-10-08 15:16:10,201][102897] Updated weights for policy 0, policy_version 87700 (0.0009) +[2023-10-08 15:16:10,566][102897] Updated weights for policy 0, policy_version 87710 (0.0010) +[2023-10-08 15:16:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179732480. Throughput: 0: 1809.9, 1: 1796.8. Samples: 44940802. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:11,875][101941] Avg episode reward: [(0, '9.400'), (1, '18.430')] +[2023-10-08 15:16:11,876][102760] Saving new best policy, reward=18.430! +[2023-10-08 15:16:12,289][102898] Updated weights for policy 1, policy_version 87810 (0.0010) +[2023-10-08 15:16:12,655][102898] Updated weights for policy 1, policy_version 87820 (0.0007) +[2023-10-08 15:16:13,016][102898] Updated weights for policy 1, policy_version 87830 (0.0009) +[2023-10-08 15:16:13,392][102898] Updated weights for policy 1, policy_version 87840 (0.0009) +[2023-10-08 15:16:14,322][102897] Updated weights for policy 0, policy_version 87720 (0.0009) +[2023-10-08 15:16:14,700][102897] Updated weights for policy 0, policy_version 87730 (0.0009) +[2023-10-08 15:16:15,070][102897] Updated weights for policy 0, policy_version 87740 (0.0007) +[2023-10-08 15:16:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179798016. Throughput: 0: 1797.5, 1: 1802.5. Samples: 44962860. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:16,876][101941] Avg episode reward: [(0, '9.270'), (1, '16.840')] +[2023-10-08 15:16:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000087744_89849856.pth... +[2023-10-08 15:16:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000086048_88113152.pth +[2023-10-08 15:16:17,169][102898] Updated weights for policy 1, policy_version 87850 (0.0008) +[2023-10-08 15:16:17,543][102898] Updated weights for policy 1, policy_version 87860 (0.0011) +[2023-10-08 15:16:17,914][102898] Updated weights for policy 1, policy_version 87870 (0.0008) +[2023-10-08 15:16:17,982][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000087872_89980928.pth... +[2023-10-08 15:16:18,022][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000086176_88244224.pth +[2023-10-08 15:16:19,024][102897] Updated weights for policy 0, policy_version 87750 (0.0007) +[2023-10-08 15:16:19,388][102897] Updated weights for policy 0, policy_version 87760 (0.0009) +[2023-10-08 15:16:19,756][102897] Updated weights for policy 0, policy_version 87770 (0.0007) +[2023-10-08 15:16:21,649][102898] Updated weights for policy 1, policy_version 87880 (0.0008) +[2023-10-08 15:16:21,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179863552. Throughput: 0: 1807.9, 1: 1795.1. Samples: 44973332. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:21,876][101941] Avg episode reward: [(0, '8.680'), (1, '15.500')] +[2023-10-08 15:16:22,023][102898] Updated weights for policy 1, policy_version 87890 (0.0008) +[2023-10-08 15:16:22,390][102898] Updated weights for policy 1, policy_version 87900 (0.0008) +[2023-10-08 15:16:23,430][102897] Updated weights for policy 0, policy_version 87780 (0.0007) +[2023-10-08 15:16:23,790][102897] Updated weights for policy 0, policy_version 87790 (0.0009) +[2023-10-08 15:16:24,168][102897] Updated weights for policy 0, policy_version 87800 (0.0008) +[2023-10-08 15:16:26,191][102898] Updated weights for policy 1, policy_version 87910 (0.0008) +[2023-10-08 15:16:26,563][102898] Updated weights for policy 1, policy_version 87920 (0.0007) +[2023-10-08 15:16:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 179929088. Throughput: 0: 1783.3, 1: 1798.1. Samples: 44994674. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:26,875][101941] Avg episode reward: [(0, '8.560'), (1, '15.870')] +[2023-10-08 15:16:26,928][102898] Updated weights for policy 1, policy_version 87930 (0.0007) +[2023-10-08 15:16:27,945][102897] Updated weights for policy 0, policy_version 87810 (0.0009) +[2023-10-08 15:16:28,317][102897] Updated weights for policy 0, policy_version 87820 (0.0010) +[2023-10-08 15:16:28,681][102897] Updated weights for policy 0, policy_version 87830 (0.0009) +[2023-10-08 15:16:29,047][102897] Updated weights for policy 0, policy_version 87840 (0.0009) +[2023-10-08 15:16:30,595][102898] Updated weights for policy 1, policy_version 87940 (0.0008) +[2023-10-08 15:16:30,955][102898] Updated weights for policy 1, policy_version 87950 (0.0008) +[2023-10-08 15:16:31,312][102898] Updated weights for policy 1, policy_version 87960 (0.0007) +[2023-10-08 15:16:31,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 180027392. Throughput: 0: 1787.8, 1: 1793.2. Samples: 45016188. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:31,876][101941] Avg episode reward: [(0, '8.970'), (1, '16.280')] +[2023-10-08 15:16:32,764][102897] Updated weights for policy 0, policy_version 87850 (0.0008) +[2023-10-08 15:16:33,134][102897] Updated weights for policy 0, policy_version 87860 (0.0007) +[2023-10-08 15:16:33,508][102897] Updated weights for policy 0, policy_version 87870 (0.0008) +[2023-10-08 15:16:35,068][102898] Updated weights for policy 1, policy_version 87970 (0.0008) +[2023-10-08 15:16:35,430][102898] Updated weights for policy 1, policy_version 87980 (0.0009) +[2023-10-08 15:16:35,803][102898] Updated weights for policy 1, policy_version 87990 (0.0010) +[2023-10-08 15:16:36,169][102898] Updated weights for policy 1, policy_version 88000 (0.0009) +[2023-10-08 15:16:36,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 180092928. Throughput: 0: 1789.4, 1: 1797.1. Samples: 45027172. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:36,875][101941] Avg episode reward: [(0, '9.400'), (1, '16.710')] +[2023-10-08 15:16:37,239][102897] Updated weights for policy 0, policy_version 87880 (0.0008) +[2023-10-08 15:16:37,615][102897] Updated weights for policy 0, policy_version 87890 (0.0008) +[2023-10-08 15:16:37,981][102897] Updated weights for policy 0, policy_version 87900 (0.0007) +[2023-10-08 15:16:39,940][102898] Updated weights for policy 1, policy_version 88010 (0.0007) +[2023-10-08 15:16:40,307][102898] Updated weights for policy 1, policy_version 88020 (0.0007) +[2023-10-08 15:16:40,664][102898] Updated weights for policy 1, policy_version 88030 (0.0007) +[2023-10-08 15:16:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 180158464. Throughput: 0: 1783.0, 1: 1797.7. Samples: 45048502. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:41,876][101941] Avg episode reward: [(0, '9.620'), (1, '18.860')] +[2023-10-08 15:16:41,878][102760] Saving new best policy, reward=18.860! +[2023-10-08 15:16:41,891][102897] Updated weights for policy 0, policy_version 87910 (0.0008) +[2023-10-08 15:16:42,254][102897] Updated weights for policy 0, policy_version 87920 (0.0009) +[2023-10-08 15:16:42,621][102897] Updated weights for policy 0, policy_version 87930 (0.0007) +[2023-10-08 15:16:44,308][102898] Updated weights for policy 1, policy_version 88040 (0.0008) +[2023-10-08 15:16:44,677][102898] Updated weights for policy 1, policy_version 88050 (0.0010) +[2023-10-08 15:16:45,046][102898] Updated weights for policy 1, policy_version 88060 (0.0010) +[2023-10-08 15:16:46,372][102897] Updated weights for policy 0, policy_version 87940 (0.0008) +[2023-10-08 15:16:46,743][102897] Updated weights for policy 0, policy_version 87950 (0.0008) +[2023-10-08 15:16:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 180224000. Throughput: 0: 1805.2, 1: 1789.1. Samples: 45070064. Policy #0 lag: (min: 31.0, avg: 38.6, max: 63.0) +[2023-10-08 15:16:46,875][101941] Avg episode reward: [(0, '9.040'), (1, '15.470')] +[2023-10-08 15:16:47,112][102897] Updated weights for policy 0, policy_version 87960 (0.0007) +[2023-10-08 15:16:48,782][102898] Updated weights for policy 1, policy_version 88070 (0.0009) +[2023-10-08 15:16:49,143][102898] Updated weights for policy 1, policy_version 88080 (0.0007) +[2023-10-08 15:16:49,511][102898] Updated weights for policy 1, policy_version 88090 (0.0008) +[2023-10-08 15:16:50,830][102897] Updated weights for policy 0, policy_version 87970 (0.0009) +[2023-10-08 15:16:51,206][102897] Updated weights for policy 0, policy_version 87980 (0.0010) +[2023-10-08 15:16:51,568][102897] Updated weights for policy 0, policy_version 87990 (0.0007) +[2023-10-08 15:16:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 180289536. Throughput: 0: 1779.4, 1: 1800.8. Samples: 45080620. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:16:51,875][101941] Avg episode reward: [(0, '9.170'), (1, '14.270')] +[2023-10-08 15:16:51,936][102897] Updated weights for policy 0, policy_version 88000 (0.0009) +[2023-10-08 15:16:53,135][102898] Updated weights for policy 1, policy_version 88100 (0.0010) +[2023-10-08 15:16:53,514][102898] Updated weights for policy 1, policy_version 88110 (0.0008) +[2023-10-08 15:16:53,880][102898] Updated weights for policy 1, policy_version 88120 (0.0008) +[2023-10-08 15:16:55,794][102897] Updated weights for policy 0, policy_version 88010 (0.0008) +[2023-10-08 15:16:56,155][102897] Updated weights for policy 0, policy_version 88020 (0.0008) +[2023-10-08 15:16:56,522][102897] Updated weights for policy 0, policy_version 88030 (0.0008) +[2023-10-08 15:16:56,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 180387840. Throughput: 0: 1799.7, 1: 1794.2. Samples: 45102528. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:16:56,876][101941] Avg episode reward: [(0, '8.850'), (1, '13.740')] +[2023-10-08 15:16:57,582][102898] Updated weights for policy 1, policy_version 88130 (0.0009) +[2023-10-08 15:16:57,950][102898] Updated weights for policy 1, policy_version 88140 (0.0007) +[2023-10-08 15:16:58,329][102898] Updated weights for policy 1, policy_version 88150 (0.0007) +[2023-10-08 15:16:58,697][102898] Updated weights for policy 1, policy_version 88160 (0.0007) +[2023-10-08 15:17:00,391][102897] Updated weights for policy 0, policy_version 88040 (0.0010) +[2023-10-08 15:17:00,761][102897] Updated weights for policy 0, policy_version 88050 (0.0009) +[2023-10-08 15:17:01,123][102897] Updated weights for policy 0, policy_version 88060 (0.0007) +[2023-10-08 15:17:01,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 180453376. Throughput: 0: 1772.1, 1: 1802.5. Samples: 45123718. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:01,876][101941] Avg episode reward: [(0, '8.700'), (1, '14.210')] +[2023-10-08 15:17:02,479][102898] Updated weights for policy 1, policy_version 88170 (0.0008) +[2023-10-08 15:17:02,851][102898] Updated weights for policy 1, policy_version 88180 (0.0007) +[2023-10-08 15:17:03,220][102898] Updated weights for policy 1, policy_version 88190 (0.0007) +[2023-10-08 15:17:04,828][102897] Updated weights for policy 0, policy_version 88070 (0.0009) +[2023-10-08 15:17:05,195][102897] Updated weights for policy 0, policy_version 88080 (0.0011) +[2023-10-08 15:17:05,558][102897] Updated weights for policy 0, policy_version 88090 (0.0009) +[2023-10-08 15:17:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 180518912. Throughput: 0: 1792.1, 1: 1803.0. Samples: 45135110. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:06,876][101941] Avg episode reward: [(0, '9.230'), (1, '15.500')] +[2023-10-08 15:17:06,982][102898] Updated weights for policy 1, policy_version 88200 (0.0009) +[2023-10-08 15:17:07,338][102898] Updated weights for policy 1, policy_version 88210 (0.0007) +[2023-10-08 15:17:07,712][102898] Updated weights for policy 1, policy_version 88220 (0.0009) +[2023-10-08 15:17:09,179][102897] Updated weights for policy 0, policy_version 88100 (0.0010) +[2023-10-08 15:17:09,547][102897] Updated weights for policy 0, policy_version 88110 (0.0010) +[2023-10-08 15:17:09,920][102897] Updated weights for policy 0, policy_version 88120 (0.0010) +[2023-10-08 15:17:11,458][102898] Updated weights for policy 1, policy_version 88230 (0.0010) +[2023-10-08 15:17:11,817][102898] Updated weights for policy 1, policy_version 88240 (0.0011) +[2023-10-08 15:17:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 180584448. Throughput: 0: 1777.6, 1: 1809.6. Samples: 45156098. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:11,876][101941] Avg episode reward: [(0, '8.970'), (1, '15.680')] +[2023-10-08 15:17:12,191][102898] Updated weights for policy 1, policy_version 88250 (0.0010) +[2023-10-08 15:17:13,773][102897] Updated weights for policy 0, policy_version 88130 (0.0008) +[2023-10-08 15:17:14,148][102897] Updated weights for policy 0, policy_version 88140 (0.0007) +[2023-10-08 15:17:14,518][102897] Updated weights for policy 0, policy_version 88150 (0.0008) +[2023-10-08 15:17:14,888][102897] Updated weights for policy 0, policy_version 88160 (0.0008) +[2023-10-08 15:17:15,949][102898] Updated weights for policy 1, policy_version 88260 (0.0008) +[2023-10-08 15:17:16,312][102898] Updated weights for policy 1, policy_version 88270 (0.0008) +[2023-10-08 15:17:16,685][102898] Updated weights for policy 1, policy_version 88280 (0.0008) +[2023-10-08 15:17:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 180649984. Throughput: 0: 1773.2, 1: 1814.2. Samples: 45177622. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:16,876][101941] Avg episode reward: [(0, '8.560'), (1, '15.010')] +[2023-10-08 15:17:18,610][102897] Updated weights for policy 0, policy_version 88170 (0.0008) +[2023-10-08 15:17:18,975][102897] Updated weights for policy 0, policy_version 88180 (0.0010) +[2023-10-08 15:17:19,337][102897] Updated weights for policy 0, policy_version 88190 (0.0010) +[2023-10-08 15:17:20,376][102898] Updated weights for policy 1, policy_version 88290 (0.0008) +[2023-10-08 15:17:20,744][102898] Updated weights for policy 1, policy_version 88300 (0.0010) +[2023-10-08 15:17:21,109][102898] Updated weights for policy 1, policy_version 88310 (0.0009) +[2023-10-08 15:17:21,473][102898] Updated weights for policy 1, policy_version 88320 (0.0008) +[2023-10-08 15:17:21,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 180748288. Throughput: 0: 1777.4, 1: 1801.3. Samples: 45188214. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:21,876][101941] Avg episode reward: [(0, '8.950'), (1, '15.720')] +[2023-10-08 15:17:23,079][102897] Updated weights for policy 0, policy_version 88200 (0.0009) +[2023-10-08 15:17:23,451][102897] Updated weights for policy 0, policy_version 88210 (0.0007) +[2023-10-08 15:17:23,828][102897] Updated weights for policy 0, policy_version 88220 (0.0011) +[2023-10-08 15:17:25,088][102898] Updated weights for policy 1, policy_version 88330 (0.0010) +[2023-10-08 15:17:25,456][102898] Updated weights for policy 1, policy_version 88340 (0.0010) +[2023-10-08 15:17:25,821][102898] Updated weights for policy 1, policy_version 88350 (0.0007) +[2023-10-08 15:17:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 180813824. Throughput: 0: 1773.0, 1: 1812.1. Samples: 45209834. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:26,876][101941] Avg episode reward: [(0, '9.280'), (1, '15.380')] +[2023-10-08 15:17:27,659][102897] Updated weights for policy 0, policy_version 88230 (0.0010) +[2023-10-08 15:17:28,033][102897] Updated weights for policy 0, policy_version 88240 (0.0009) +[2023-10-08 15:17:28,404][102897] Updated weights for policy 0, policy_version 88250 (0.0010) +[2023-10-08 15:17:29,870][102898] Updated weights for policy 1, policy_version 88360 (0.0007) +[2023-10-08 15:17:30,243][102898] Updated weights for policy 1, policy_version 88370 (0.0008) +[2023-10-08 15:17:30,606][102898] Updated weights for policy 1, policy_version 88380 (0.0007) +[2023-10-08 15:17:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 180879360. Throughput: 0: 1780.7, 1: 1801.8. Samples: 45231276. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:31,876][101941] Avg episode reward: [(0, '9.720'), (1, '15.950')] +[2023-10-08 15:17:32,184][102897] Updated weights for policy 0, policy_version 88260 (0.0010) +[2023-10-08 15:17:32,545][102897] Updated weights for policy 0, policy_version 88270 (0.0009) +[2023-10-08 15:17:32,919][102897] Updated weights for policy 0, policy_version 88280 (0.0009) +[2023-10-08 15:17:34,406][102898] Updated weights for policy 1, policy_version 88390 (0.0008) +[2023-10-08 15:17:34,770][102898] Updated weights for policy 1, policy_version 88400 (0.0008) +[2023-10-08 15:17:35,148][102898] Updated weights for policy 1, policy_version 88410 (0.0008) +[2023-10-08 15:17:36,781][102897] Updated weights for policy 0, policy_version 88290 (0.0007) +[2023-10-08 15:17:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 180944896. Throughput: 0: 1771.6, 1: 1817.0. Samples: 45242108. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:36,875][101941] Avg episode reward: [(0, '9.110'), (1, '15.310')] +[2023-10-08 15:17:37,149][102897] Updated weights for policy 0, policy_version 88300 (0.0007) +[2023-10-08 15:17:37,522][102897] Updated weights for policy 0, policy_version 88310 (0.0010) +[2023-10-08 15:17:37,891][102897] Updated weights for policy 0, policy_version 88320 (0.0010) +[2023-10-08 15:17:38,891][102898] Updated weights for policy 1, policy_version 88420 (0.0009) +[2023-10-08 15:17:39,262][102898] Updated weights for policy 1, policy_version 88430 (0.0009) +[2023-10-08 15:17:39,628][102898] Updated weights for policy 1, policy_version 88440 (0.0008) +[2023-10-08 15:17:41,728][102897] Updated weights for policy 0, policy_version 88330 (0.0008) +[2023-10-08 15:17:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181010432. Throughput: 0: 1773.0, 1: 1794.8. Samples: 45263080. Policy #0 lag: (min: 31.0, avg: 40.9, max: 63.0) +[2023-10-08 15:17:41,876][101941] Avg episode reward: [(0, '9.110'), (1, '14.670')] +[2023-10-08 15:17:42,093][102897] Updated weights for policy 0, policy_version 88340 (0.0009) +[2023-10-08 15:17:42,461][102897] Updated weights for policy 0, policy_version 88350 (0.0007) +[2023-10-08 15:17:43,346][102898] Updated weights for policy 1, policy_version 88450 (0.0009) +[2023-10-08 15:17:43,707][102898] Updated weights for policy 1, policy_version 88460 (0.0008) +[2023-10-08 15:17:44,079][102898] Updated weights for policy 1, policy_version 88470 (0.0009) +[2023-10-08 15:17:44,451][102898] Updated weights for policy 1, policy_version 88480 (0.0009) +[2023-10-08 15:17:46,221][102897] Updated weights for policy 0, policy_version 88360 (0.0007) +[2023-10-08 15:17:46,608][102897] Updated weights for policy 0, policy_version 88370 (0.0009) +[2023-10-08 15:17:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 181075968. Throughput: 0: 1792.9, 1: 1786.9. Samples: 45284806. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:17:46,876][101941] Avg episode reward: [(0, '9.060'), (1, '13.680')] +[2023-10-08 15:17:46,985][102897] Updated weights for policy 0, policy_version 88380 (0.0008) +[2023-10-08 15:17:48,192][102898] Updated weights for policy 1, policy_version 88490 (0.0008) +[2023-10-08 15:17:48,564][102898] Updated weights for policy 1, policy_version 88500 (0.0009) +[2023-10-08 15:17:48,931][102898] Updated weights for policy 1, policy_version 88510 (0.0008) +[2023-10-08 15:17:50,850][102897] Updated weights for policy 0, policy_version 88390 (0.0009) +[2023-10-08 15:17:51,222][102897] Updated weights for policy 0, policy_version 88400 (0.0012) +[2023-10-08 15:17:51,593][102897] Updated weights for policy 0, policy_version 88410 (0.0008) +[2023-10-08 15:17:51,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 181174272. Throughput: 0: 1767.8, 1: 1786.9. Samples: 45295072. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:17:51,876][101941] Avg episode reward: [(0, '9.170'), (1, '14.880')] +[2023-10-08 15:17:52,651][102898] Updated weights for policy 1, policy_version 88520 (0.0007) +[2023-10-08 15:17:53,014][102898] Updated weights for policy 1, policy_version 88530 (0.0007) +[2023-10-08 15:17:53,385][102898] Updated weights for policy 1, policy_version 88540 (0.0009) +[2023-10-08 15:17:55,391][102897] Updated weights for policy 0, policy_version 88420 (0.0009) +[2023-10-08 15:17:55,760][102897] Updated weights for policy 0, policy_version 88430 (0.0008) +[2023-10-08 15:17:56,143][102897] Updated weights for policy 0, policy_version 88440 (0.0009) +[2023-10-08 15:17:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181239808. Throughput: 0: 1796.4, 1: 1782.3. Samples: 45317138. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:17:56,876][101941] Avg episode reward: [(0, '9.140'), (1, '16.150')] +[2023-10-08 15:17:57,002][102898] Updated weights for policy 1, policy_version 88550 (0.0007) +[2023-10-08 15:17:57,377][102898] Updated weights for policy 1, policy_version 88560 (0.0009) +[2023-10-08 15:17:57,736][102898] Updated weights for policy 1, policy_version 88570 (0.0007) +[2023-10-08 15:17:59,934][102897] Updated weights for policy 0, policy_version 88450 (0.0009) +[2023-10-08 15:18:00,301][102897] Updated weights for policy 0, policy_version 88460 (0.0008) +[2023-10-08 15:18:00,667][102897] Updated weights for policy 0, policy_version 88470 (0.0007) +[2023-10-08 15:18:01,043][102897] Updated weights for policy 0, policy_version 88480 (0.0007) +[2023-10-08 15:18:01,601][102898] Updated weights for policy 1, policy_version 88580 (0.0007) +[2023-10-08 15:18:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181305344. Throughput: 0: 1766.5, 1: 1802.1. Samples: 45338212. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:01,875][101941] Avg episode reward: [(0, '8.620'), (1, '15.690')] +[2023-10-08 15:18:01,967][102898] Updated weights for policy 1, policy_version 88590 (0.0007) +[2023-10-08 15:18:02,330][102898] Updated weights for policy 1, policy_version 88600 (0.0007) +[2023-10-08 15:18:04,719][102897] Updated weights for policy 0, policy_version 88490 (0.0008) +[2023-10-08 15:18:05,091][102897] Updated weights for policy 0, policy_version 88500 (0.0010) +[2023-10-08 15:18:05,462][102897] Updated weights for policy 0, policy_version 88510 (0.0008) +[2023-10-08 15:18:06,138][102898] Updated weights for policy 1, policy_version 88610 (0.0007) +[2023-10-08 15:18:06,518][102898] Updated weights for policy 1, policy_version 88620 (0.0009) +[2023-10-08 15:18:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181370880. Throughput: 0: 1799.7, 1: 1788.4. Samples: 45349678. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:06,876][101941] Avg episode reward: [(0, '9.090'), (1, '15.960')] +[2023-10-08 15:18:06,883][102898] Updated weights for policy 1, policy_version 88630 (0.0010) +[2023-10-08 15:18:07,241][102898] Updated weights for policy 1, policy_version 88640 (0.0010) +[2023-10-08 15:18:09,213][102897] Updated weights for policy 0, policy_version 88520 (0.0009) +[2023-10-08 15:18:09,577][102897] Updated weights for policy 0, policy_version 88530 (0.0008) +[2023-10-08 15:18:09,949][102897] Updated weights for policy 0, policy_version 88540 (0.0008) +[2023-10-08 15:18:11,101][102898] Updated weights for policy 1, policy_version 88650 (0.0008) +[2023-10-08 15:18:11,469][102898] Updated weights for policy 1, policy_version 88660 (0.0008) +[2023-10-08 15:18:11,831][102898] Updated weights for policy 1, policy_version 88670 (0.0008) +[2023-10-08 15:18:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181436416. Throughput: 0: 1770.4, 1: 1800.5. Samples: 45370520. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:11,876][101941] Avg episode reward: [(0, '9.000'), (1, '13.840')] +[2023-10-08 15:18:13,971][102897] Updated weights for policy 0, policy_version 88550 (0.0009) +[2023-10-08 15:18:14,348][102897] Updated weights for policy 0, policy_version 88560 (0.0007) +[2023-10-08 15:18:14,711][102897] Updated weights for policy 0, policy_version 88570 (0.0008) +[2023-10-08 15:18:15,547][102898] Updated weights for policy 1, policy_version 88680 (0.0008) +[2023-10-08 15:18:15,917][102898] Updated weights for policy 1, policy_version 88690 (0.0008) +[2023-10-08 15:18:16,273][102898] Updated weights for policy 1, policy_version 88700 (0.0007) +[2023-10-08 15:18:16,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 181534720. Throughput: 0: 1772.4, 1: 1790.3. Samples: 45391598. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:16,875][101941] Avg episode reward: [(0, '8.570'), (1, '13.780')] +[2023-10-08 15:18:16,886][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000088704_90832896.pth... +[2023-10-08 15:18:16,886][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000088576_90701824.pth... +[2023-10-08 15:18:16,921][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000086912_88997888.pth +[2023-10-08 15:18:16,927][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000087008_89096192.pth +[2023-10-08 15:18:18,340][102897] Updated weights for policy 0, policy_version 88580 (0.0008) +[2023-10-08 15:18:18,695][102897] Updated weights for policy 0, policy_version 88590 (0.0007) +[2023-10-08 15:18:19,064][102897] Updated weights for policy 0, policy_version 88600 (0.0007) +[2023-10-08 15:18:19,863][102898] Updated weights for policy 1, policy_version 88710 (0.0007) +[2023-10-08 15:18:20,232][102898] Updated weights for policy 1, policy_version 88720 (0.0010) +[2023-10-08 15:18:20,592][102898] Updated weights for policy 1, policy_version 88730 (0.0008) +[2023-10-08 15:18:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181600256. Throughput: 0: 1779.3, 1: 1798.6. Samples: 45403116. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:21,875][101941] Avg episode reward: [(0, '9.240'), (1, '13.740')] +[2023-10-08 15:18:22,771][102897] Updated weights for policy 0, policy_version 88610 (0.0007) +[2023-10-08 15:18:23,139][102897] Updated weights for policy 0, policy_version 88620 (0.0008) +[2023-10-08 15:18:23,509][102897] Updated weights for policy 0, policy_version 88630 (0.0008) +[2023-10-08 15:18:23,872][102897] Updated weights for policy 0, policy_version 88640 (0.0008) +[2023-10-08 15:18:24,321][102898] Updated weights for policy 1, policy_version 88740 (0.0009) +[2023-10-08 15:18:24,692][102898] Updated weights for policy 1, policy_version 88750 (0.0007) +[2023-10-08 15:18:25,050][102898] Updated weights for policy 1, policy_version 88760 (0.0007) +[2023-10-08 15:18:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181665792. Throughput: 0: 1780.6, 1: 1794.9. Samples: 45423980. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:26,876][101941] Avg episode reward: [(0, '9.960'), (1, '14.070')] +[2023-10-08 15:18:27,580][102897] Updated weights for policy 0, policy_version 88650 (0.0009) +[2023-10-08 15:18:27,952][102897] Updated weights for policy 0, policy_version 88660 (0.0009) +[2023-10-08 15:18:28,327][102897] Updated weights for policy 0, policy_version 88670 (0.0010) +[2023-10-08 15:18:28,896][102898] Updated weights for policy 1, policy_version 88770 (0.0009) +[2023-10-08 15:18:29,266][102898] Updated weights for policy 1, policy_version 88780 (0.0009) +[2023-10-08 15:18:29,640][102898] Updated weights for policy 1, policy_version 88790 (0.0009) +[2023-10-08 15:18:30,016][102898] Updated weights for policy 1, policy_version 88800 (0.0009) +[2023-10-08 15:18:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181731328. Throughput: 0: 1795.6, 1: 1790.5. Samples: 45446180. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:31,876][101941] Avg episode reward: [(0, '9.860'), (1, '13.800')] +[2023-10-08 15:18:32,222][102897] Updated weights for policy 0, policy_version 88680 (0.0007) +[2023-10-08 15:18:32,603][102897] Updated weights for policy 0, policy_version 88690 (0.0008) +[2023-10-08 15:18:32,967][102897] Updated weights for policy 0, policy_version 88700 (0.0007) +[2023-10-08 15:18:33,732][102898] Updated weights for policy 1, policy_version 88810 (0.0008) +[2023-10-08 15:18:34,106][102898] Updated weights for policy 1, policy_version 88820 (0.0009) +[2023-10-08 15:18:34,471][102898] Updated weights for policy 1, policy_version 88830 (0.0008) +[2023-10-08 15:18:36,632][102897] Updated weights for policy 0, policy_version 88710 (0.0008) +[2023-10-08 15:18:36,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 181796864. Throughput: 0: 1782.9, 1: 1794.0. Samples: 45456028. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:36,876][101941] Avg episode reward: [(0, '8.500'), (1, '14.910')] +[2023-10-08 15:18:37,005][102897] Updated weights for policy 0, policy_version 88720 (0.0007) +[2023-10-08 15:18:37,384][102897] Updated weights for policy 0, policy_version 88730 (0.0011) +[2023-10-08 15:18:38,420][102898] Updated weights for policy 1, policy_version 88840 (0.0008) +[2023-10-08 15:18:38,784][102898] Updated weights for policy 1, policy_version 88850 (0.0007) +[2023-10-08 15:18:39,147][102898] Updated weights for policy 1, policy_version 88860 (0.0008) +[2023-10-08 15:18:41,174][102897] Updated weights for policy 0, policy_version 88740 (0.0009) +[2023-10-08 15:18:41,552][102897] Updated weights for policy 0, policy_version 88750 (0.0009) +[2023-10-08 15:18:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 181862400. Throughput: 0: 1784.3, 1: 1788.2. Samples: 45477900. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:41,876][101941] Avg episode reward: [(0, '8.660'), (1, '15.100')] +[2023-10-08 15:18:41,913][102897] Updated weights for policy 0, policy_version 88760 (0.0007) +[2023-10-08 15:18:42,808][102898] Updated weights for policy 1, policy_version 88870 (0.0007) +[2023-10-08 15:18:43,178][102898] Updated weights for policy 1, policy_version 88880 (0.0008) +[2023-10-08 15:18:43,533][102898] Updated weights for policy 1, policy_version 88890 (0.0009) +[2023-10-08 15:18:45,642][102897] Updated weights for policy 0, policy_version 88770 (0.0009) +[2023-10-08 15:18:46,017][102897] Updated weights for policy 0, policy_version 88780 (0.0007) +[2023-10-08 15:18:46,391][102897] Updated weights for policy 0, policy_version 88790 (0.0010) +[2023-10-08 15:18:46,754][102897] Updated weights for policy 0, policy_version 88800 (0.0007) +[2023-10-08 15:18:46,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 181960704. Throughput: 0: 1795.7, 1: 1788.0. Samples: 45499482. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:46,876][101941] Avg episode reward: [(0, '9.420'), (1, '15.600')] +[2023-10-08 15:18:47,147][102898] Updated weights for policy 1, policy_version 88900 (0.0008) +[2023-10-08 15:18:47,516][102898] Updated weights for policy 1, policy_version 88910 (0.0008) +[2023-10-08 15:18:47,882][102898] Updated weights for policy 1, policy_version 88920 (0.0008) +[2023-10-08 15:18:50,492][102897] Updated weights for policy 0, policy_version 88810 (0.0007) +[2023-10-08 15:18:50,864][102897] Updated weights for policy 0, policy_version 88820 (0.0009) +[2023-10-08 15:18:51,239][102897] Updated weights for policy 0, policy_version 88830 (0.0010) +[2023-10-08 15:18:51,678][102898] Updated weights for policy 1, policy_version 88930 (0.0008) +[2023-10-08 15:18:51,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 182026240. Throughput: 0: 1782.0, 1: 1790.4. Samples: 45510436. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:51,875][101941] Avg episode reward: [(0, '9.740'), (1, '15.120')] +[2023-10-08 15:18:52,046][102898] Updated weights for policy 1, policy_version 88940 (0.0008) +[2023-10-08 15:18:52,416][102898] Updated weights for policy 1, policy_version 88950 (0.0009) +[2023-10-08 15:18:52,782][102898] Updated weights for policy 1, policy_version 88960 (0.0008) +[2023-10-08 15:18:55,035][102897] Updated weights for policy 0, policy_version 88840 (0.0007) +[2023-10-08 15:18:55,398][102897] Updated weights for policy 0, policy_version 88850 (0.0007) +[2023-10-08 15:18:55,764][102897] Updated weights for policy 0, policy_version 88860 (0.0009) +[2023-10-08 15:18:56,601][102898] Updated weights for policy 1, policy_version 88970 (0.0008) +[2023-10-08 15:18:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 182091776. Throughput: 0: 1799.5, 1: 1796.2. Samples: 45532330. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:18:56,877][101941] Avg episode reward: [(0, '9.220'), (1, '15.580')] +[2023-10-08 15:18:56,978][102898] Updated weights for policy 1, policy_version 88980 (0.0008) +[2023-10-08 15:18:57,342][102898] Updated weights for policy 1, policy_version 88990 (0.0009) +[2023-10-08 15:18:59,522][102897] Updated weights for policy 0, policy_version 88870 (0.0008) +[2023-10-08 15:18:59,888][102897] Updated weights for policy 0, policy_version 88880 (0.0007) +[2023-10-08 15:19:00,258][102897] Updated weights for policy 0, policy_version 88890 (0.0008) +[2023-10-08 15:19:01,267][102898] Updated weights for policy 1, policy_version 89000 (0.0009) +[2023-10-08 15:19:01,638][102898] Updated weights for policy 1, policy_version 89010 (0.0009) +[2023-10-08 15:19:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 182157312. Throughput: 0: 1786.0, 1: 1810.3. Samples: 45553430. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:01,876][101941] Avg episode reward: [(0, '8.460'), (1, '15.760')] +[2023-10-08 15:19:02,005][102898] Updated weights for policy 1, policy_version 89020 (0.0008) +[2023-10-08 15:19:03,902][102897] Updated weights for policy 0, policy_version 88900 (0.0008) +[2023-10-08 15:19:04,265][102897] Updated weights for policy 0, policy_version 88910 (0.0011) +[2023-10-08 15:19:04,633][102897] Updated weights for policy 0, policy_version 88920 (0.0010) +[2023-10-08 15:19:05,540][102898] Updated weights for policy 1, policy_version 89030 (0.0008) +[2023-10-08 15:19:05,907][102898] Updated weights for policy 1, policy_version 89040 (0.0008) +[2023-10-08 15:19:06,272][102898] Updated weights for policy 1, policy_version 89050 (0.0008) +[2023-10-08 15:19:06,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 182255616. Throughput: 0: 1802.0, 1: 1789.4. Samples: 45564728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:06,876][101941] Avg episode reward: [(0, '8.340'), (1, '14.710')] +[2023-10-08 15:19:08,432][102897] Updated weights for policy 0, policy_version 88930 (0.0010) +[2023-10-08 15:19:08,796][102897] Updated weights for policy 0, policy_version 88940 (0.0008) +[2023-10-08 15:19:09,175][102897] Updated weights for policy 0, policy_version 88950 (0.0007) +[2023-10-08 15:19:09,540][102897] Updated weights for policy 0, policy_version 88960 (0.0007) +[2023-10-08 15:19:10,142][102898] Updated weights for policy 1, policy_version 89060 (0.0009) +[2023-10-08 15:19:10,510][102898] Updated weights for policy 1, policy_version 89070 (0.0010) +[2023-10-08 15:19:10,870][102898] Updated weights for policy 1, policy_version 89080 (0.0011) +[2023-10-08 15:19:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 182321152. Throughput: 0: 1789.4, 1: 1808.0. Samples: 45585864. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:11,875][101941] Avg episode reward: [(0, '8.380'), (1, '15.200')] +[2023-10-08 15:19:13,251][102897] Updated weights for policy 0, policy_version 88970 (0.0010) +[2023-10-08 15:19:13,632][102897] Updated weights for policy 0, policy_version 88980 (0.0007) +[2023-10-08 15:19:14,000][102897] Updated weights for policy 0, policy_version 88990 (0.0008) +[2023-10-08 15:19:14,448][102898] Updated weights for policy 1, policy_version 89090 (0.0009) +[2023-10-08 15:19:14,823][102898] Updated weights for policy 1, policy_version 89100 (0.0009) +[2023-10-08 15:19:15,198][102898] Updated weights for policy 1, policy_version 89110 (0.0008) +[2023-10-08 15:19:15,564][102898] Updated weights for policy 1, policy_version 89120 (0.0009) +[2023-10-08 15:19:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 182386688. Throughput: 0: 1792.4, 1: 1795.9. Samples: 45607656. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:16,876][101941] Avg episode reward: [(0, '9.660'), (1, '17.940')] +[2023-10-08 15:19:17,788][102897] Updated weights for policy 0, policy_version 89000 (0.0008) +[2023-10-08 15:19:18,165][102897] Updated weights for policy 0, policy_version 89010 (0.0007) +[2023-10-08 15:19:18,540][102897] Updated weights for policy 0, policy_version 89020 (0.0009) +[2023-10-08 15:19:19,396][102898] Updated weights for policy 1, policy_version 89130 (0.0007) +[2023-10-08 15:19:19,764][102898] Updated weights for policy 1, policy_version 89140 (0.0007) +[2023-10-08 15:19:20,127][102898] Updated weights for policy 1, policy_version 89150 (0.0008) +[2023-10-08 15:19:21,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 182452224. Throughput: 0: 1789.9, 1: 1812.4. Samples: 45618132. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:21,876][101941] Avg episode reward: [(0, '9.530'), (1, '17.690')] +[2023-10-08 15:19:22,227][102897] Updated weights for policy 0, policy_version 89030 (0.0008) +[2023-10-08 15:19:22,599][102897] Updated weights for policy 0, policy_version 89040 (0.0007) +[2023-10-08 15:19:22,958][102897] Updated weights for policy 0, policy_version 89050 (0.0009) +[2023-10-08 15:19:23,815][102898] Updated weights for policy 1, policy_version 89160 (0.0010) +[2023-10-08 15:19:24,196][102898] Updated weights for policy 1, policy_version 89170 (0.0010) +[2023-10-08 15:19:24,566][102898] Updated weights for policy 1, policy_version 89180 (0.0008) +[2023-10-08 15:19:26,632][102897] Updated weights for policy 0, policy_version 89060 (0.0007) +[2023-10-08 15:19:26,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 182517760. Throughput: 0: 1802.1, 1: 1796.4. Samples: 45639830. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:26,875][101941] Avg episode reward: [(0, '10.090'), (1, '19.860')] +[2023-10-08 15:19:26,876][102760] Saving new best policy, reward=19.860! +[2023-10-08 15:19:27,007][102897] Updated weights for policy 0, policy_version 89070 (0.0009) +[2023-10-08 15:19:27,373][102897] Updated weights for policy 0, policy_version 89080 (0.0008) +[2023-10-08 15:19:28,252][102898] Updated weights for policy 1, policy_version 89190 (0.0007) +[2023-10-08 15:19:28,614][102898] Updated weights for policy 1, policy_version 89200 (0.0009) +[2023-10-08 15:19:28,981][102898] Updated weights for policy 1, policy_version 89210 (0.0007) +[2023-10-08 15:19:31,232][102897] Updated weights for policy 0, policy_version 89090 (0.0007) +[2023-10-08 15:19:31,596][102897] Updated weights for policy 0, policy_version 89100 (0.0008) +[2023-10-08 15:19:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 182583296. Throughput: 0: 1813.0, 1: 1795.7. Samples: 45661872. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:31,876][101941] Avg episode reward: [(0, '8.870'), (1, '20.760')] +[2023-10-08 15:19:31,885][102760] Saving new best policy, reward=20.760! +[2023-10-08 15:19:31,967][102897] Updated weights for policy 0, policy_version 89110 (0.0008) +[2023-10-08 15:19:32,345][102897] Updated weights for policy 0, policy_version 89120 (0.0008) +[2023-10-08 15:19:32,720][102898] Updated weights for policy 1, policy_version 89220 (0.0007) +[2023-10-08 15:19:33,086][102898] Updated weights for policy 1, policy_version 89230 (0.0007) +[2023-10-08 15:19:33,452][102898] Updated weights for policy 1, policy_version 89240 (0.0009) +[2023-10-08 15:19:36,147][102897] Updated weights for policy 0, policy_version 89130 (0.0009) +[2023-10-08 15:19:36,514][102897] Updated weights for policy 0, policy_version 89140 (0.0007) +[2023-10-08 15:19:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 182648832. Throughput: 0: 1797.3, 1: 1793.9. Samples: 45672042. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:19:36,876][101941] Avg episode reward: [(0, '8.830'), (1, '19.990')] +[2023-10-08 15:19:36,877][102897] Updated weights for policy 0, policy_version 89150 (0.0008) +[2023-10-08 15:19:37,174][102898] Updated weights for policy 1, policy_version 89250 (0.0009) +[2023-10-08 15:19:37,553][102898] Updated weights for policy 1, policy_version 89260 (0.0009) +[2023-10-08 15:19:37,922][102898] Updated weights for policy 1, policy_version 89270 (0.0010) +[2023-10-08 15:19:38,290][102898] Updated weights for policy 1, policy_version 89280 (0.0008) +[2023-10-08 15:19:40,590][102897] Updated weights for policy 0, policy_version 89160 (0.0008) +[2023-10-08 15:19:40,963][102897] Updated weights for policy 0, policy_version 89170 (0.0009) +[2023-10-08 15:19:41,335][102897] Updated weights for policy 0, policy_version 89180 (0.0009) +[2023-10-08 15:19:41,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 182747136. Throughput: 0: 1807.3, 1: 1793.3. Samples: 45694356. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:19:41,875][101941] Avg episode reward: [(0, '9.540'), (1, '20.340')] +[2023-10-08 15:19:41,960][102898] Updated weights for policy 1, policy_version 89290 (0.0011) +[2023-10-08 15:19:42,318][102898] Updated weights for policy 1, policy_version 89300 (0.0010) +[2023-10-08 15:19:42,690][102898] Updated weights for policy 1, policy_version 89310 (0.0010) +[2023-10-08 15:19:45,118][102897] Updated weights for policy 0, policy_version 89190 (0.0007) +[2023-10-08 15:19:45,482][102897] Updated weights for policy 0, policy_version 89200 (0.0008) +[2023-10-08 15:19:45,858][102897] Updated weights for policy 0, policy_version 89210 (0.0009) +[2023-10-08 15:19:46,472][102898] Updated weights for policy 1, policy_version 89320 (0.0009) +[2023-10-08 15:19:46,840][102898] Updated weights for policy 1, policy_version 89330 (0.0007) +[2023-10-08 15:19:46,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 182812672. Throughput: 0: 1792.0, 1: 1803.9. Samples: 45715244. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:19:46,875][101941] Avg episode reward: [(0, '9.760'), (1, '18.840')] +[2023-10-08 15:19:47,211][102898] Updated weights for policy 1, policy_version 89340 (0.0008) +[2023-10-08 15:19:49,540][102897] Updated weights for policy 0, policy_version 89220 (0.0008) +[2023-10-08 15:19:49,914][102897] Updated weights for policy 0, policy_version 89230 (0.0011) +[2023-10-08 15:19:50,281][102897] Updated weights for policy 0, policy_version 89240 (0.0011) +[2023-10-08 15:19:51,032][102898] Updated weights for policy 1, policy_version 89350 (0.0010) +[2023-10-08 15:19:51,403][102898] Updated weights for policy 1, policy_version 89360 (0.0009) +[2023-10-08 15:19:51,766][102898] Updated weights for policy 1, policy_version 89370 (0.0007) +[2023-10-08 15:19:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 182878208. Throughput: 0: 1806.2, 1: 1795.0. Samples: 45726784. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:19:51,876][101941] Avg episode reward: [(0, '9.440'), (1, '18.170')] +[2023-10-08 15:19:54,018][102897] Updated weights for policy 0, policy_version 89250 (0.0009) +[2023-10-08 15:19:54,387][102897] Updated weights for policy 0, policy_version 89260 (0.0008) +[2023-10-08 15:19:54,756][102897] Updated weights for policy 0, policy_version 89270 (0.0009) +[2023-10-08 15:19:55,125][102897] Updated weights for policy 0, policy_version 89280 (0.0008) +[2023-10-08 15:19:55,532][102898] Updated weights for policy 1, policy_version 89380 (0.0009) +[2023-10-08 15:19:55,905][102898] Updated weights for policy 1, policy_version 89390 (0.0011) +[2023-10-08 15:19:56,262][102898] Updated weights for policy 1, policy_version 89400 (0.0008) +[2023-10-08 15:19:56,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 182976512. Throughput: 0: 1791.0, 1: 1806.6. Samples: 45747758. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:19:56,876][101941] Avg episode reward: [(0, '9.100'), (1, '18.270')] +[2023-10-08 15:19:58,908][102897] Updated weights for policy 0, policy_version 89290 (0.0009) +[2023-10-08 15:19:59,282][102897] Updated weights for policy 0, policy_version 89300 (0.0007) +[2023-10-08 15:19:59,651][102897] Updated weights for policy 0, policy_version 89310 (0.0007) +[2023-10-08 15:19:59,982][102898] Updated weights for policy 1, policy_version 89410 (0.0008) +[2023-10-08 15:20:00,351][102898] Updated weights for policy 1, policy_version 89420 (0.0010) +[2023-10-08 15:20:00,717][102898] Updated weights for policy 1, policy_version 89430 (0.0009) +[2023-10-08 15:20:01,091][102898] Updated weights for policy 1, policy_version 89440 (0.0009) +[2023-10-08 15:20:01,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 183042048. Throughput: 0: 1795.2, 1: 1790.5. Samples: 45769012. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:01,875][101941] Avg episode reward: [(0, '9.300'), (1, '18.090')] +[2023-10-08 15:20:03,226][102897] Updated weights for policy 0, policy_version 89320 (0.0007) +[2023-10-08 15:20:03,590][102897] Updated weights for policy 0, policy_version 89330 (0.0007) +[2023-10-08 15:20:03,967][102897] Updated weights for policy 0, policy_version 89340 (0.0010) +[2023-10-08 15:20:04,911][102898] Updated weights for policy 1, policy_version 89450 (0.0009) +[2023-10-08 15:20:05,283][102898] Updated weights for policy 1, policy_version 89460 (0.0009) +[2023-10-08 15:20:05,645][102898] Updated weights for policy 1, policy_version 89470 (0.0009) +[2023-10-08 15:20:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 183107584. Throughput: 0: 1802.8, 1: 1799.5. Samples: 45780238. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:06,876][101941] Avg episode reward: [(0, '9.440'), (1, '18.000')] +[2023-10-08 15:20:07,708][102897] Updated weights for policy 0, policy_version 89350 (0.0008) +[2023-10-08 15:20:08,072][102897] Updated weights for policy 0, policy_version 89360 (0.0009) +[2023-10-08 15:20:08,443][102897] Updated weights for policy 0, policy_version 89370 (0.0009) +[2023-10-08 15:20:09,374][102898] Updated weights for policy 1, policy_version 89480 (0.0009) +[2023-10-08 15:20:09,743][102898] Updated weights for policy 1, policy_version 89490 (0.0009) +[2023-10-08 15:20:10,103][102898] Updated weights for policy 1, policy_version 89500 (0.0009) +[2023-10-08 15:20:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 183173120. Throughput: 0: 1801.0, 1: 1788.0. Samples: 45801336. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:11,875][101941] Avg episode reward: [(0, '9.420'), (1, '18.930')] +[2023-10-08 15:20:12,067][102897] Updated weights for policy 0, policy_version 89380 (0.0008) +[2023-10-08 15:20:12,433][102897] Updated weights for policy 0, policy_version 89390 (0.0008) +[2023-10-08 15:20:12,800][102897] Updated weights for policy 0, policy_version 89400 (0.0008) +[2023-10-08 15:20:13,884][102898] Updated weights for policy 1, policy_version 89510 (0.0009) +[2023-10-08 15:20:14,246][102898] Updated weights for policy 1, policy_version 89520 (0.0008) +[2023-10-08 15:20:14,622][102898] Updated weights for policy 1, policy_version 89530 (0.0008) +[2023-10-08 15:20:16,611][102897] Updated weights for policy 0, policy_version 89410 (0.0007) +[2023-10-08 15:20:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 183238656. Throughput: 0: 1809.4, 1: 1789.6. Samples: 45823824. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:16,876][101941] Avg episode reward: [(0, '9.270'), (1, '17.350')] +[2023-10-08 15:20:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000089536_91684864.pth... +[2023-10-08 15:20:16,925][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000087872_89980928.pth +[2023-10-08 15:20:16,978][102897] Updated weights for policy 0, policy_version 89420 (0.0008) +[2023-10-08 15:20:17,342][102897] Updated weights for policy 0, policy_version 89430 (0.0007) +[2023-10-08 15:20:17,709][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000089440_91586560.pth... +[2023-10-08 15:20:17,709][102897] Updated weights for policy 0, policy_version 89440 (0.0009) +[2023-10-08 15:20:17,738][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000087744_89849856.pth +[2023-10-08 15:20:18,336][102898] Updated weights for policy 1, policy_version 89540 (0.0007) +[2023-10-08 15:20:18,705][102898] Updated weights for policy 1, policy_version 89550 (0.0007) +[2023-10-08 15:20:19,079][102898] Updated weights for policy 1, policy_version 89560 (0.0009) +[2023-10-08 15:20:21,451][102897] Updated weights for policy 0, policy_version 89450 (0.0010) +[2023-10-08 15:20:21,819][102897] Updated weights for policy 0, policy_version 89460 (0.0008) +[2023-10-08 15:20:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 183304192. Throughput: 0: 1799.2, 1: 1788.0. Samples: 45833470. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:21,876][101941] Avg episode reward: [(0, '9.240'), (1, '15.830')] +[2023-10-08 15:20:22,182][102897] Updated weights for policy 0, policy_version 89470 (0.0011) +[2023-10-08 15:20:22,879][102898] Updated weights for policy 1, policy_version 89570 (0.0008) +[2023-10-08 15:20:23,247][102898] Updated weights for policy 1, policy_version 89580 (0.0010) +[2023-10-08 15:20:23,615][102898] Updated weights for policy 1, policy_version 89590 (0.0007) +[2023-10-08 15:20:23,979][102898] Updated weights for policy 1, policy_version 89600 (0.0009) +[2023-10-08 15:20:25,926][102897] Updated weights for policy 0, policy_version 89480 (0.0008) +[2023-10-08 15:20:26,293][102897] Updated weights for policy 0, policy_version 89490 (0.0007) +[2023-10-08 15:20:26,671][102897] Updated weights for policy 0, policy_version 89500 (0.0007) +[2023-10-08 15:20:26,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.5, 300 sec: 14440.1). Total num frames: 183402496. Throughput: 0: 1803.5, 1: 1783.7. Samples: 45855780. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:26,876][101941] Avg episode reward: [(0, '9.480'), (1, '15.820')] +[2023-10-08 15:20:27,781][102898] Updated weights for policy 1, policy_version 89610 (0.0008) +[2023-10-08 15:20:28,149][102898] Updated weights for policy 1, policy_version 89620 (0.0008) +[2023-10-08 15:20:28,514][102898] Updated weights for policy 1, policy_version 89630 (0.0008) +[2023-10-08 15:20:30,246][102897] Updated weights for policy 0, policy_version 89510 (0.0009) +[2023-10-08 15:20:30,614][102897] Updated weights for policy 0, policy_version 89520 (0.0007) +[2023-10-08 15:20:30,975][102897] Updated weights for policy 0, policy_version 89530 (0.0008) +[2023-10-08 15:20:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 183468032. Throughput: 0: 1805.9, 1: 1792.6. Samples: 45877174. Policy #0 lag: (min: 31.0, avg: 34.7, max: 63.0) +[2023-10-08 15:20:31,876][101941] Avg episode reward: [(0, '9.200'), (1, '16.070')] +[2023-10-08 15:20:32,358][102898] Updated weights for policy 1, policy_version 89640 (0.0009) +[2023-10-08 15:20:32,724][102898] Updated weights for policy 1, policy_version 89650 (0.0008) +[2023-10-08 15:20:33,098][102898] Updated weights for policy 1, policy_version 89660 (0.0007) +[2023-10-08 15:20:34,878][102897] Updated weights for policy 0, policy_version 89540 (0.0007) +[2023-10-08 15:20:35,246][102897] Updated weights for policy 0, policy_version 89550 (0.0008) +[2023-10-08 15:20:35,625][102897] Updated weights for policy 0, policy_version 89560 (0.0009) +[2023-10-08 15:20:36,829][102898] Updated weights for policy 1, policy_version 89670 (0.0007) +[2023-10-08 15:20:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 183533568. Throughput: 0: 1804.4, 1: 1784.4. Samples: 45888276. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:20:36,875][101941] Avg episode reward: [(0, '9.170'), (1, '17.430')] +[2023-10-08 15:20:37,201][102898] Updated weights for policy 1, policy_version 89680 (0.0007) +[2023-10-08 15:20:37,574][102898] Updated weights for policy 1, policy_version 89690 (0.0007) +[2023-10-08 15:20:39,358][102897] Updated weights for policy 0, policy_version 89570 (0.0007) +[2023-10-08 15:20:39,730][102897] Updated weights for policy 0, policy_version 89580 (0.0008) +[2023-10-08 15:20:40,103][102897] Updated weights for policy 0, policy_version 89590 (0.0007) +[2023-10-08 15:20:40,469][102897] Updated weights for policy 0, policy_version 89600 (0.0010) +[2023-10-08 15:20:41,389][102898] Updated weights for policy 1, policy_version 89700 (0.0008) +[2023-10-08 15:20:41,758][102898] Updated weights for policy 1, policy_version 89710 (0.0010) +[2023-10-08 15:20:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 183599104. Throughput: 0: 1806.0, 1: 1788.1. Samples: 45909494. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:20:41,876][101941] Avg episode reward: [(0, '9.300'), (1, '17.690')] +[2023-10-08 15:20:42,125][102898] Updated weights for policy 1, policy_version 89720 (0.0010) +[2023-10-08 15:20:44,360][102897] Updated weights for policy 0, policy_version 89610 (0.0010) +[2023-10-08 15:20:44,730][102897] Updated weights for policy 0, policy_version 89620 (0.0011) +[2023-10-08 15:20:45,096][102897] Updated weights for policy 0, policy_version 89630 (0.0011) +[2023-10-08 15:20:45,777][102898] Updated weights for policy 1, policy_version 89730 (0.0009) +[2023-10-08 15:20:46,143][102898] Updated weights for policy 1, policy_version 89740 (0.0011) +[2023-10-08 15:20:46,513][102898] Updated weights for policy 1, policy_version 89750 (0.0011) +[2023-10-08 15:20:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 183664640. Throughput: 0: 1792.0, 1: 1799.0. Samples: 45930610. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:20:46,875][101941] Avg episode reward: [(0, '9.290'), (1, '16.890')] +[2023-10-08 15:20:46,885][102898] Updated weights for policy 1, policy_version 89760 (0.0009) +[2023-10-08 15:20:49,052][102897] Updated weights for policy 0, policy_version 89640 (0.0008) +[2023-10-08 15:20:49,424][102897] Updated weights for policy 0, policy_version 89650 (0.0007) +[2023-10-08 15:20:49,794][102897] Updated weights for policy 0, policy_version 89660 (0.0008) +[2023-10-08 15:20:50,604][102898] Updated weights for policy 1, policy_version 89770 (0.0008) +[2023-10-08 15:20:50,961][102898] Updated weights for policy 1, policy_version 89780 (0.0007) +[2023-10-08 15:20:51,339][102898] Updated weights for policy 1, policy_version 89790 (0.0007) +[2023-10-08 15:20:51,875][101941] Fps is (10 sec: 16384.5, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 183762944. Throughput: 0: 1800.4, 1: 1788.5. Samples: 45941736. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:20:51,875][101941] Avg episode reward: [(0, '9.520'), (1, '15.390')] +[2023-10-08 15:20:53,553][102897] Updated weights for policy 0, policy_version 89670 (0.0007) +[2023-10-08 15:20:53,918][102897] Updated weights for policy 0, policy_version 89680 (0.0009) +[2023-10-08 15:20:54,286][102897] Updated weights for policy 0, policy_version 89690 (0.0010) +[2023-10-08 15:20:55,184][102898] Updated weights for policy 1, policy_version 89800 (0.0009) +[2023-10-08 15:20:55,552][102898] Updated weights for policy 1, policy_version 89810 (0.0009) +[2023-10-08 15:20:55,921][102898] Updated weights for policy 1, policy_version 89820 (0.0011) +[2023-10-08 15:20:56,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 183828480. Throughput: 0: 1778.5, 1: 1805.1. Samples: 45962600. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:20:56,876][101941] Avg episode reward: [(0, '9.680'), (1, '15.530')] +[2023-10-08 15:20:57,966][102897] Updated weights for policy 0, policy_version 89700 (0.0009) +[2023-10-08 15:20:58,336][102897] Updated weights for policy 0, policy_version 89710 (0.0010) +[2023-10-08 15:20:58,706][102897] Updated weights for policy 0, policy_version 89720 (0.0008) +[2023-10-08 15:20:59,506][102898] Updated weights for policy 1, policy_version 89830 (0.0009) +[2023-10-08 15:20:59,875][102898] Updated weights for policy 1, policy_version 89840 (0.0009) +[2023-10-08 15:21:00,248][102898] Updated weights for policy 1, policy_version 89850 (0.0008) +[2023-10-08 15:21:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 183894016. Throughput: 0: 1778.8, 1: 1788.2. Samples: 45984336. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:21:01,876][101941] Avg episode reward: [(0, '9.830'), (1, '15.400')] +[2023-10-08 15:21:02,559][102897] Updated weights for policy 0, policy_version 89730 (0.0010) +[2023-10-08 15:21:02,932][102897] Updated weights for policy 0, policy_version 89740 (0.0010) +[2023-10-08 15:21:03,292][102897] Updated weights for policy 0, policy_version 89750 (0.0010) +[2023-10-08 15:21:03,657][102897] Updated weights for policy 0, policy_version 89760 (0.0008) +[2023-10-08 15:21:03,984][102898] Updated weights for policy 1, policy_version 89860 (0.0008) +[2023-10-08 15:21:04,350][102898] Updated weights for policy 1, policy_version 89870 (0.0007) +[2023-10-08 15:21:04,724][102898] Updated weights for policy 1, policy_version 89880 (0.0009) +[2023-10-08 15:21:06,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 183959552. Throughput: 0: 1780.9, 1: 1811.6. Samples: 45995130. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:21:06,875][101941] Avg episode reward: [(0, '9.680'), (1, '16.650')] +[2023-10-08 15:21:07,498][102897] Updated weights for policy 0, policy_version 89770 (0.0007) +[2023-10-08 15:21:07,873][102897] Updated weights for policy 0, policy_version 89780 (0.0007) +[2023-10-08 15:21:08,237][102897] Updated weights for policy 0, policy_version 89790 (0.0010) +[2023-10-08 15:21:08,400][102898] Updated weights for policy 1, policy_version 89890 (0.0009) +[2023-10-08 15:21:08,763][102898] Updated weights for policy 1, policy_version 89900 (0.0011) +[2023-10-08 15:21:09,134][102898] Updated weights for policy 1, policy_version 89910 (0.0011) +[2023-10-08 15:21:09,508][102898] Updated weights for policy 1, policy_version 89920 (0.0007) +[2023-10-08 15:21:11,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 184025088. Throughput: 0: 1776.3, 1: 1798.8. Samples: 46016660. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:21:11,876][101941] Avg episode reward: [(0, '9.820'), (1, '19.320')] +[2023-10-08 15:21:12,091][102897] Updated weights for policy 0, policy_version 89800 (0.0009) +[2023-10-08 15:21:12,453][102897] Updated weights for policy 0, policy_version 89810 (0.0009) +[2023-10-08 15:21:12,828][102897] Updated weights for policy 0, policy_version 89820 (0.0007) +[2023-10-08 15:21:13,390][102898] Updated weights for policy 1, policy_version 89930 (0.0008) +[2023-10-08 15:21:13,752][102898] Updated weights for policy 1, policy_version 89940 (0.0008) +[2023-10-08 15:21:14,124][102898] Updated weights for policy 1, policy_version 89950 (0.0007) +[2023-10-08 15:21:16,592][102897] Updated weights for policy 0, policy_version 89830 (0.0007) +[2023-10-08 15:21:16,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 184090624. Throughput: 0: 1796.9, 1: 1797.5. Samples: 46038924. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:21:16,876][101941] Avg episode reward: [(0, '9.740'), (1, '18.580')] +[2023-10-08 15:21:16,961][102897] Updated weights for policy 0, policy_version 89840 (0.0007) +[2023-10-08 15:21:17,336][102897] Updated weights for policy 0, policy_version 89850 (0.0009) +[2023-10-08 15:21:17,976][102898] Updated weights for policy 1, policy_version 89960 (0.0007) +[2023-10-08 15:21:18,336][102898] Updated weights for policy 1, policy_version 89970 (0.0008) +[2023-10-08 15:21:18,703][102898] Updated weights for policy 1, policy_version 89980 (0.0007) +[2023-10-08 15:21:21,040][102897] Updated weights for policy 0, policy_version 89860 (0.0009) +[2023-10-08 15:21:21,411][102897] Updated weights for policy 0, policy_version 89870 (0.0011) +[2023-10-08 15:21:21,784][102897] Updated weights for policy 0, policy_version 89880 (0.0008) +[2023-10-08 15:21:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184156160. Throughput: 0: 1768.6, 1: 1798.2. Samples: 46048780. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:21:21,875][101941] Avg episode reward: [(0, '9.710'), (1, '19.000')] +[2023-10-08 15:21:22,523][102898] Updated weights for policy 1, policy_version 89990 (0.0009) +[2023-10-08 15:21:22,882][102898] Updated weights for policy 1, policy_version 90000 (0.0008) +[2023-10-08 15:21:23,249][102898] Updated weights for policy 1, policy_version 90010 (0.0008) +[2023-10-08 15:21:25,371][102897] Updated weights for policy 0, policy_version 89890 (0.0007) +[2023-10-08 15:21:25,742][102897] Updated weights for policy 0, policy_version 89900 (0.0007) +[2023-10-08 15:21:26,096][102897] Updated weights for policy 0, policy_version 89910 (0.0007) +[2023-10-08 15:21:26,472][102897] Updated weights for policy 0, policy_version 89920 (0.0007) +[2023-10-08 15:21:26,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184254464. Throughput: 0: 1796.3, 1: 1793.8. Samples: 46071050. Policy #0 lag: (min: 25.0, avg: 41.5, max: 57.0) +[2023-10-08 15:21:26,876][101941] Avg episode reward: [(0, '9.310'), (1, '19.510')] +[2023-10-08 15:21:27,030][102898] Updated weights for policy 1, policy_version 90020 (0.0009) +[2023-10-08 15:21:27,400][102898] Updated weights for policy 1, policy_version 90030 (0.0010) +[2023-10-08 15:21:27,764][102898] Updated weights for policy 1, policy_version 90040 (0.0009) +[2023-10-08 15:21:30,422][102897] Updated weights for policy 0, policy_version 89930 (0.0008) +[2023-10-08 15:21:30,793][102897] Updated weights for policy 0, policy_version 89940 (0.0008) +[2023-10-08 15:21:31,169][102897] Updated weights for policy 0, policy_version 89950 (0.0008) +[2023-10-08 15:21:31,491][102898] Updated weights for policy 1, policy_version 90050 (0.0009) +[2023-10-08 15:21:31,855][102898] Updated weights for policy 1, policy_version 90060 (0.0007) +[2023-10-08 15:21:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184320000. Throughput: 0: 1771.1, 1: 1814.1. Samples: 46091944. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:21:31,875][101941] Avg episode reward: [(0, '8.680'), (1, '18.350')] +[2023-10-08 15:21:32,220][102898] Updated weights for policy 1, policy_version 90070 (0.0007) +[2023-10-08 15:21:32,584][102898] Updated weights for policy 1, policy_version 90080 (0.0008) +[2023-10-08 15:21:34,898][102897] Updated weights for policy 0, policy_version 89960 (0.0009) +[2023-10-08 15:21:35,279][102897] Updated weights for policy 0, policy_version 89970 (0.0010) +[2023-10-08 15:21:35,645][102897] Updated weights for policy 0, policy_version 89980 (0.0009) +[2023-10-08 15:21:36,312][102898] Updated weights for policy 1, policy_version 90090 (0.0010) +[2023-10-08 15:21:36,680][102898] Updated weights for policy 1, policy_version 90100 (0.0009) +[2023-10-08 15:21:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184385536. Throughput: 0: 1797.5, 1: 1794.6. Samples: 46103382. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:21:36,875][101941] Avg episode reward: [(0, '7.860'), (1, '19.020')] +[2023-10-08 15:21:37,039][102898] Updated weights for policy 1, policy_version 90110 (0.0011) +[2023-10-08 15:21:39,319][102897] Updated weights for policy 0, policy_version 89990 (0.0009) +[2023-10-08 15:21:39,693][102897] Updated weights for policy 0, policy_version 90000 (0.0007) +[2023-10-08 15:21:40,061][102897] Updated weights for policy 0, policy_version 90010 (0.0008) +[2023-10-08 15:21:40,789][102898] Updated weights for policy 1, policy_version 90120 (0.0010) +[2023-10-08 15:21:41,151][102898] Updated weights for policy 1, policy_version 90130 (0.0010) +[2023-10-08 15:21:41,515][102898] Updated weights for policy 1, policy_version 90140 (0.0007) +[2023-10-08 15:21:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 184483840. Throughput: 0: 1780.7, 1: 1810.8. Samples: 46124216. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:21:41,876][101941] Avg episode reward: [(0, '8.470'), (1, '17.400')] +[2023-10-08 15:21:43,721][102897] Updated weights for policy 0, policy_version 90020 (0.0009) +[2023-10-08 15:21:44,099][102897] Updated weights for policy 0, policy_version 90030 (0.0010) +[2023-10-08 15:21:44,469][102897] Updated weights for policy 0, policy_version 90040 (0.0010) +[2023-10-08 15:21:45,271][102898] Updated weights for policy 1, policy_version 90150 (0.0008) +[2023-10-08 15:21:45,635][102898] Updated weights for policy 1, policy_version 90160 (0.0009) +[2023-10-08 15:21:46,002][102898] Updated weights for policy 1, policy_version 90170 (0.0007) +[2023-10-08 15:21:46,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 184549376. Throughput: 0: 1783.6, 1: 1797.9. Samples: 46145506. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:21:46,876][101941] Avg episode reward: [(0, '8.230'), (1, '18.680')] +[2023-10-08 15:21:48,305][102897] Updated weights for policy 0, policy_version 90050 (0.0008) +[2023-10-08 15:21:48,678][102897] Updated weights for policy 0, policy_version 90060 (0.0007) +[2023-10-08 15:21:49,048][102897] Updated weights for policy 0, policy_version 90070 (0.0009) +[2023-10-08 15:21:49,409][102897] Updated weights for policy 0, policy_version 90080 (0.0009) +[2023-10-08 15:21:49,654][102898] Updated weights for policy 1, policy_version 90180 (0.0008) +[2023-10-08 15:21:50,017][102898] Updated weights for policy 1, policy_version 90190 (0.0008) +[2023-10-08 15:21:50,385][102898] Updated weights for policy 1, policy_version 90200 (0.0008) +[2023-10-08 15:21:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184614912. Throughput: 0: 1783.8, 1: 1809.2. Samples: 46156814. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:21:51,875][101941] Avg episode reward: [(0, '9.480'), (1, '18.710')] +[2023-10-08 15:21:53,205][102897] Updated weights for policy 0, policy_version 90090 (0.0008) +[2023-10-08 15:21:53,575][102897] Updated weights for policy 0, policy_version 90100 (0.0008) +[2023-10-08 15:21:53,957][102897] Updated weights for policy 0, policy_version 90110 (0.0010) +[2023-10-08 15:21:54,231][102898] Updated weights for policy 1, policy_version 90210 (0.0008) +[2023-10-08 15:21:54,600][102898] Updated weights for policy 1, policy_version 90220 (0.0009) +[2023-10-08 15:21:54,975][102898] Updated weights for policy 1, policy_version 90230 (0.0007) +[2023-10-08 15:21:55,346][102898] Updated weights for policy 1, policy_version 90240 (0.0008) +[2023-10-08 15:21:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184680448. Throughput: 0: 1791.0, 1: 1788.8. Samples: 46177752. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:21:56,875][101941] Avg episode reward: [(0, '9.550'), (1, '18.650')] +[2023-10-08 15:21:57,520][102897] Updated weights for policy 0, policy_version 90120 (0.0008) +[2023-10-08 15:21:57,893][102897] Updated weights for policy 0, policy_version 90130 (0.0008) +[2023-10-08 15:21:58,262][102897] Updated weights for policy 0, policy_version 90140 (0.0008) +[2023-10-08 15:21:59,058][102898] Updated weights for policy 1, policy_version 90250 (0.0007) +[2023-10-08 15:21:59,427][102898] Updated weights for policy 1, policy_version 90260 (0.0007) +[2023-10-08 15:21:59,804][102898] Updated weights for policy 1, policy_version 90270 (0.0007) +[2023-10-08 15:22:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184745984. Throughput: 0: 1798.1, 1: 1790.8. Samples: 46200420. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:22:01,875][101941] Avg episode reward: [(0, '8.750'), (1, '19.280')] +[2023-10-08 15:22:02,087][102897] Updated weights for policy 0, policy_version 90150 (0.0007) +[2023-10-08 15:22:02,462][102897] Updated weights for policy 0, policy_version 90160 (0.0008) +[2023-10-08 15:22:02,838][102897] Updated weights for policy 0, policy_version 90170 (0.0007) +[2023-10-08 15:22:03,621][102898] Updated weights for policy 1, policy_version 90280 (0.0008) +[2023-10-08 15:22:03,999][102898] Updated weights for policy 1, policy_version 90290 (0.0010) +[2023-10-08 15:22:04,360][102898] Updated weights for policy 1, policy_version 90300 (0.0010) +[2023-10-08 15:22:06,716][102897] Updated weights for policy 0, policy_version 90180 (0.0007) +[2023-10-08 15:22:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 184811520. Throughput: 0: 1794.2, 1: 1794.4. Samples: 46210264. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:22:06,875][101941] Avg episode reward: [(0, '8.640'), (1, '19.060')] +[2023-10-08 15:22:07,082][102897] Updated weights for policy 0, policy_version 90190 (0.0007) +[2023-10-08 15:22:07,458][102897] Updated weights for policy 0, policy_version 90200 (0.0008) +[2023-10-08 15:22:07,972][102898] Updated weights for policy 1, policy_version 90310 (0.0008) +[2023-10-08 15:22:08,338][102898] Updated weights for policy 1, policy_version 90320 (0.0010) +[2023-10-08 15:22:08,705][102898] Updated weights for policy 1, policy_version 90330 (0.0009) +[2023-10-08 15:22:11,309][102897] Updated weights for policy 0, policy_version 90210 (0.0008) +[2023-10-08 15:22:11,674][102897] Updated weights for policy 0, policy_version 90220 (0.0007) +[2023-10-08 15:22:11,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 184877056. Throughput: 0: 1791.5, 1: 1792.9. Samples: 46232348. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:22:11,876][101941] Avg episode reward: [(0, '8.940'), (1, '18.630')] +[2023-10-08 15:22:12,040][102897] Updated weights for policy 0, policy_version 90230 (0.0008) +[2023-10-08 15:22:12,412][102897] Updated weights for policy 0, policy_version 90240 (0.0008) +[2023-10-08 15:22:12,485][102898] Updated weights for policy 1, policy_version 90340 (0.0009) +[2023-10-08 15:22:12,847][102898] Updated weights for policy 1, policy_version 90350 (0.0007) +[2023-10-08 15:22:13,218][102898] Updated weights for policy 1, policy_version 90360 (0.0007) +[2023-10-08 15:22:16,238][102897] Updated weights for policy 0, policy_version 90250 (0.0010) +[2023-10-08 15:22:16,607][102897] Updated weights for policy 0, policy_version 90260 (0.0008) +[2023-10-08 15:22:16,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 184942592. Throughput: 0: 1807.1, 1: 1800.3. Samples: 46254276. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:22:16,876][101941] Avg episode reward: [(0, '8.810'), (1, '20.160')] +[2023-10-08 15:22:16,907][102898] Updated weights for policy 1, policy_version 90370 (0.0007) +[2023-10-08 15:22:16,975][102897] Updated weights for policy 0, policy_version 90270 (0.0009) +[2023-10-08 15:22:17,047][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000090272_92438528.pth... +[2023-10-08 15:22:17,075][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000088576_90701824.pth +[2023-10-08 15:22:17,276][102898] Updated weights for policy 1, policy_version 90380 (0.0009) +[2023-10-08 15:22:17,645][102898] Updated weights for policy 1, policy_version 90390 (0.0009) +[2023-10-08 15:22:18,005][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000090400_92569600.pth... +[2023-10-08 15:22:18,006][102898] Updated weights for policy 1, policy_version 90400 (0.0010) +[2023-10-08 15:22:18,048][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000088704_90832896.pth +[2023-10-08 15:22:20,577][102897] Updated weights for policy 0, policy_version 90280 (0.0009) +[2023-10-08 15:22:20,945][102897] Updated weights for policy 0, policy_version 90290 (0.0007) +[2023-10-08 15:22:21,306][102897] Updated weights for policy 0, policy_version 90300 (0.0008) +[2023-10-08 15:22:21,695][102898] Updated weights for policy 1, policy_version 90410 (0.0009) +[2023-10-08 15:22:21,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 185040896. Throughput: 0: 1784.8, 1: 1799.1. Samples: 46264660. Policy #0 lag: (min: 4.0, avg: 4.0, max: 4.0) +[2023-10-08 15:22:21,876][101941] Avg episode reward: [(0, '8.950'), (1, '21.120')] +[2023-10-08 15:22:22,058][102898] Updated weights for policy 1, policy_version 90420 (0.0009) +[2023-10-08 15:22:22,441][102898] Updated weights for policy 1, policy_version 90430 (0.0009) +[2023-10-08 15:22:22,511][102760] Saving new best policy, reward=21.120! +[2023-10-08 15:22:25,065][102897] Updated weights for policy 0, policy_version 90310 (0.0007) +[2023-10-08 15:22:25,435][102897] Updated weights for policy 0, policy_version 90320 (0.0008) +[2023-10-08 15:22:25,797][102897] Updated weights for policy 0, policy_version 90330 (0.0009) +[2023-10-08 15:22:26,136][102898] Updated weights for policy 1, policy_version 90440 (0.0009) +[2023-10-08 15:22:26,508][102898] Updated weights for policy 1, policy_version 90450 (0.0007) +[2023-10-08 15:22:26,874][102898] Updated weights for policy 1, policy_version 90460 (0.0007) +[2023-10-08 15:22:26,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 185106432. Throughput: 0: 1803.4, 1: 1800.4. Samples: 46286388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:26,876][101941] Avg episode reward: [(0, '8.400'), (1, '21.440')] +[2023-10-08 15:22:27,016][102760] Saving new best policy, reward=21.440! +[2023-10-08 15:22:29,579][102897] Updated weights for policy 0, policy_version 90340 (0.0007) +[2023-10-08 15:22:29,948][102897] Updated weights for policy 0, policy_version 90350 (0.0007) +[2023-10-08 15:22:30,326][102897] Updated weights for policy 0, policy_version 90360 (0.0010) +[2023-10-08 15:22:30,507][102898] Updated weights for policy 1, policy_version 90470 (0.0007) +[2023-10-08 15:22:30,881][102898] Updated weights for policy 1, policy_version 90480 (0.0007) +[2023-10-08 15:22:31,247][102898] Updated weights for policy 1, policy_version 90490 (0.0007) +[2023-10-08 15:22:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 185204736. Throughput: 0: 1780.9, 1: 1801.4. Samples: 46306710. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:31,875][101941] Avg episode reward: [(0, '9.240'), (1, '22.930')] +[2023-10-08 15:22:31,884][102760] Saving new best policy, reward=22.930! +[2023-10-08 15:22:34,206][102897] Updated weights for policy 0, policy_version 90370 (0.0007) +[2023-10-08 15:22:34,579][102897] Updated weights for policy 0, policy_version 90380 (0.0007) +[2023-10-08 15:22:34,951][102897] Updated weights for policy 0, policy_version 90390 (0.0007) +[2023-10-08 15:22:35,050][102898] Updated weights for policy 1, policy_version 90500 (0.0008) +[2023-10-08 15:22:35,320][102897] Updated weights for policy 0, policy_version 90400 (0.0009) +[2023-10-08 15:22:35,422][102898] Updated weights for policy 1, policy_version 90510 (0.0007) +[2023-10-08 15:22:35,788][102898] Updated weights for policy 1, policy_version 90520 (0.0007) +[2023-10-08 15:22:36,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 185270272. Throughput: 0: 1805.0, 1: 1793.6. Samples: 46318754. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:36,876][101941] Avg episode reward: [(0, '9.090'), (1, '21.190')] +[2023-10-08 15:22:38,914][102897] Updated weights for policy 0, policy_version 90410 (0.0009) +[2023-10-08 15:22:39,283][102897] Updated weights for policy 0, policy_version 90420 (0.0011) +[2023-10-08 15:22:39,620][102898] Updated weights for policy 1, policy_version 90530 (0.0007) +[2023-10-08 15:22:39,652][102897] Updated weights for policy 0, policy_version 90430 (0.0008) +[2023-10-08 15:22:39,990][102898] Updated weights for policy 1, policy_version 90540 (0.0010) +[2023-10-08 15:22:40,348][102898] Updated weights for policy 1, policy_version 90550 (0.0008) +[2023-10-08 15:22:40,723][102898] Updated weights for policy 1, policy_version 90560 (0.0008) +[2023-10-08 15:22:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 185335808. Throughput: 0: 1784.7, 1: 1801.3. Samples: 46339126. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:41,876][101941] Avg episode reward: [(0, '9.140'), (1, '21.360')] +[2023-10-08 15:22:43,327][102897] Updated weights for policy 0, policy_version 90440 (0.0007) +[2023-10-08 15:22:43,702][102897] Updated weights for policy 0, policy_version 90450 (0.0008) +[2023-10-08 15:22:44,059][102897] Updated weights for policy 0, policy_version 90460 (0.0008) +[2023-10-08 15:22:44,482][102898] Updated weights for policy 1, policy_version 90570 (0.0008) +[2023-10-08 15:22:44,847][102898] Updated weights for policy 1, policy_version 90580 (0.0009) +[2023-10-08 15:22:45,215][102898] Updated weights for policy 1, policy_version 90590 (0.0009) +[2023-10-08 15:22:46,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 185401344. Throughput: 0: 1783.0, 1: 1794.4. Samples: 46361408. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:46,876][101941] Avg episode reward: [(0, '9.270'), (1, '20.720')] +[2023-10-08 15:22:47,971][102897] Updated weights for policy 0, policy_version 90470 (0.0007) +[2023-10-08 15:22:48,344][102897] Updated weights for policy 0, policy_version 90480 (0.0007) +[2023-10-08 15:22:48,704][102897] Updated weights for policy 0, policy_version 90490 (0.0007) +[2023-10-08 15:22:48,965][102898] Updated weights for policy 1, policy_version 90600 (0.0007) +[2023-10-08 15:22:49,343][102898] Updated weights for policy 1, policy_version 90610 (0.0007) +[2023-10-08 15:22:49,709][102898] Updated weights for policy 1, policy_version 90620 (0.0009) +[2023-10-08 15:22:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 185466880. Throughput: 0: 1784.4, 1: 1802.5. Samples: 46371676. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:51,876][101941] Avg episode reward: [(0, '9.310'), (1, '20.970')] +[2023-10-08 15:22:52,336][102897] Updated weights for policy 0, policy_version 90500 (0.0008) +[2023-10-08 15:22:52,707][102897] Updated weights for policy 0, policy_version 90510 (0.0007) +[2023-10-08 15:22:53,075][102897] Updated weights for policy 0, policy_version 90520 (0.0007) +[2023-10-08 15:22:53,338][102898] Updated weights for policy 1, policy_version 90630 (0.0008) +[2023-10-08 15:22:53,713][102898] Updated weights for policy 1, policy_version 90640 (0.0008) +[2023-10-08 15:22:54,074][102898] Updated weights for policy 1, policy_version 90650 (0.0007) +[2023-10-08 15:22:56,762][102897] Updated weights for policy 0, policy_version 90530 (0.0007) +[2023-10-08 15:22:56,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 185532416. Throughput: 0: 1791.2, 1: 1799.4. Samples: 46393926. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:22:56,876][101941] Avg episode reward: [(0, '10.100'), (1, '19.320')] +[2023-10-08 15:22:57,133][102897] Updated weights for policy 0, policy_version 90540 (0.0010) +[2023-10-08 15:22:57,508][102897] Updated weights for policy 0, policy_version 90550 (0.0010) +[2023-10-08 15:22:57,723][102898] Updated weights for policy 1, policy_version 90660 (0.0007) +[2023-10-08 15:22:57,873][102897] Updated weights for policy 0, policy_version 90560 (0.0007) +[2023-10-08 15:22:58,081][102898] Updated weights for policy 1, policy_version 90670 (0.0009) +[2023-10-08 15:22:58,453][102898] Updated weights for policy 1, policy_version 90680 (0.0007) +[2023-10-08 15:23:01,684][102897] Updated weights for policy 0, policy_version 90570 (0.0009) +[2023-10-08 15:23:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 185597952. Throughput: 0: 1805.3, 1: 1792.4. Samples: 46416174. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:01,876][101941] Avg episode reward: [(0, '9.750'), (1, '17.410')] +[2023-10-08 15:23:02,060][102897] Updated weights for policy 0, policy_version 90580 (0.0008) +[2023-10-08 15:23:02,193][102898] Updated weights for policy 1, policy_version 90690 (0.0007) +[2023-10-08 15:23:02,431][102897] Updated weights for policy 0, policy_version 90590 (0.0008) +[2023-10-08 15:23:02,568][102898] Updated weights for policy 1, policy_version 90700 (0.0008) +[2023-10-08 15:23:02,927][102898] Updated weights for policy 1, policy_version 90710 (0.0007) +[2023-10-08 15:23:03,295][102898] Updated weights for policy 1, policy_version 90720 (0.0007) +[2023-10-08 15:23:06,334][102897] Updated weights for policy 0, policy_version 90600 (0.0008) +[2023-10-08 15:23:06,705][102897] Updated weights for policy 0, policy_version 90610 (0.0009) +[2023-10-08 15:23:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 185663488. Throughput: 0: 1793.2, 1: 1794.3. Samples: 46426096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:06,876][101941] Avg episode reward: [(0, '9.160'), (1, '17.780')] +[2023-10-08 15:23:06,995][102898] Updated weights for policy 1, policy_version 90730 (0.0007) +[2023-10-08 15:23:07,081][102897] Updated weights for policy 0, policy_version 90620 (0.0008) +[2023-10-08 15:23:07,360][102898] Updated weights for policy 1, policy_version 90740 (0.0009) +[2023-10-08 15:23:07,722][102898] Updated weights for policy 1, policy_version 90750 (0.0008) +[2023-10-08 15:23:10,863][102897] Updated weights for policy 0, policy_version 90630 (0.0008) +[2023-10-08 15:23:11,233][102897] Updated weights for policy 0, policy_version 90640 (0.0009) +[2023-10-08 15:23:11,509][102898] Updated weights for policy 1, policy_version 90760 (0.0009) +[2023-10-08 15:23:11,603][102897] Updated weights for policy 0, policy_version 90650 (0.0008) +[2023-10-08 15:23:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 185761792. Throughput: 0: 1807.4, 1: 1802.0. Samples: 46448812. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:11,875][101941] Avg episode reward: [(0, '9.080'), (1, '16.660')] +[2023-10-08 15:23:11,883][102898] Updated weights for policy 1, policy_version 90770 (0.0009) +[2023-10-08 15:23:12,242][102898] Updated weights for policy 1, policy_version 90780 (0.0008) +[2023-10-08 15:23:15,366][102897] Updated weights for policy 0, policy_version 90660 (0.0008) +[2023-10-08 15:23:15,732][102897] Updated weights for policy 0, policy_version 90670 (0.0007) +[2023-10-08 15:23:15,852][102898] Updated weights for policy 1, policy_version 90790 (0.0008) +[2023-10-08 15:23:16,100][102897] Updated weights for policy 0, policy_version 90680 (0.0007) +[2023-10-08 15:23:16,225][102898] Updated weights for policy 1, policy_version 90800 (0.0008) +[2023-10-08 15:23:16,591][102898] Updated weights for policy 1, policy_version 90810 (0.0010) +[2023-10-08 15:23:16,875][101941] Fps is (10 sec: 19660.8, 60 sec: 15291.7, 300 sec: 14440.1). Total num frames: 185860096. Throughput: 0: 1797.1, 1: 1814.4. Samples: 46469230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:16,876][101941] Avg episode reward: [(0, '9.490'), (1, '19.540')] +[2023-10-08 15:23:19,869][102897] Updated weights for policy 0, policy_version 90690 (0.0008) +[2023-10-08 15:23:20,241][102897] Updated weights for policy 0, policy_version 90700 (0.0009) +[2023-10-08 15:23:20,279][102898] Updated weights for policy 1, policy_version 90820 (0.0008) +[2023-10-08 15:23:20,600][102897] Updated weights for policy 0, policy_version 90710 (0.0009) +[2023-10-08 15:23:20,646][102898] Updated weights for policy 1, policy_version 90830 (0.0008) +[2023-10-08 15:23:20,969][102897] Updated weights for policy 0, policy_version 90720 (0.0009) +[2023-10-08 15:23:21,011][102898] Updated weights for policy 1, policy_version 90840 (0.0008) +[2023-10-08 15:23:21,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 185925632. Throughput: 0: 1805.9, 1: 1809.9. Samples: 46481468. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:21,876][101941] Avg episode reward: [(0, '9.630'), (1, '20.930')] +[2023-10-08 15:23:24,641][102898] Updated weights for policy 1, policy_version 90850 (0.0008) +[2023-10-08 15:23:24,695][102897] Updated weights for policy 0, policy_version 90730 (0.0007) +[2023-10-08 15:23:25,007][102898] Updated weights for policy 1, policy_version 90860 (0.0008) +[2023-10-08 15:23:25,062][102897] Updated weights for policy 0, policy_version 90740 (0.0008) +[2023-10-08 15:23:25,366][102898] Updated weights for policy 1, policy_version 90870 (0.0008) +[2023-10-08 15:23:25,439][102897] Updated weights for policy 0, policy_version 90750 (0.0007) +[2023-10-08 15:23:25,734][102898] Updated weights for policy 1, policy_version 90880 (0.0008) +[2023-10-08 15:23:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14745.7, 300 sec: 14440.1). Total num frames: 185991168. Throughput: 0: 1794.0, 1: 1820.5. Samples: 46501778. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:26,876][101941] Avg episode reward: [(0, '8.910'), (1, '20.140')] +[2023-10-08 15:23:29,115][102897] Updated weights for policy 0, policy_version 90760 (0.0008) +[2023-10-08 15:23:29,451][102898] Updated weights for policy 1, policy_version 90890 (0.0007) +[2023-10-08 15:23:29,472][102897] Updated weights for policy 0, policy_version 90770 (0.0007) +[2023-10-08 15:23:29,816][102898] Updated weights for policy 1, policy_version 90900 (0.0008) +[2023-10-08 15:23:29,844][102897] Updated weights for policy 0, policy_version 90780 (0.0007) +[2023-10-08 15:23:30,187][102898] Updated weights for policy 1, policy_version 90910 (0.0007) +[2023-10-08 15:23:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 186056704. Throughput: 0: 1785.6, 1: 1820.2. Samples: 46523666. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:31,876][101941] Avg episode reward: [(0, '9.230'), (1, '16.120')] +[2023-10-08 15:23:33,639][102897] Updated weights for policy 0, policy_version 90790 (0.0007) +[2023-10-08 15:23:33,999][102897] Updated weights for policy 0, policy_version 90800 (0.0007) +[2023-10-08 15:23:34,131][102898] Updated weights for policy 1, policy_version 90920 (0.0008) +[2023-10-08 15:23:34,364][102897] Updated weights for policy 0, policy_version 90810 (0.0007) +[2023-10-08 15:23:34,498][102898] Updated weights for policy 1, policy_version 90930 (0.0008) +[2023-10-08 15:23:34,867][102898] Updated weights for policy 1, policy_version 90940 (0.0009) +[2023-10-08 15:23:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 186122240. Throughput: 0: 1794.1, 1: 1820.5. Samples: 46534332. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:36,876][101941] Avg episode reward: [(0, '8.760'), (1, '17.930')] +[2023-10-08 15:23:38,206][102897] Updated weights for policy 0, policy_version 90820 (0.0008) +[2023-10-08 15:23:38,575][102897] Updated weights for policy 0, policy_version 90830 (0.0008) +[2023-10-08 15:23:38,718][102898] Updated weights for policy 1, policy_version 90950 (0.0007) +[2023-10-08 15:23:38,940][102897] Updated weights for policy 0, policy_version 90840 (0.0007) +[2023-10-08 15:23:39,083][102898] Updated weights for policy 1, policy_version 90960 (0.0008) +[2023-10-08 15:23:39,443][102898] Updated weights for policy 1, policy_version 90970 (0.0008) +[2023-10-08 15:23:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 186187776. Throughput: 0: 1781.8, 1: 1805.7. Samples: 46555366. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:41,875][101941] Avg episode reward: [(0, '8.430'), (1, '18.000')] +[2023-10-08 15:23:42,792][102897] Updated weights for policy 0, policy_version 90850 (0.0007) +[2023-10-08 15:23:43,162][102897] Updated weights for policy 0, policy_version 90860 (0.0007) +[2023-10-08 15:23:43,199][102898] Updated weights for policy 1, policy_version 90980 (0.0010) +[2023-10-08 15:23:43,536][102897] Updated weights for policy 0, policy_version 90870 (0.0007) +[2023-10-08 15:23:43,567][102898] Updated weights for policy 1, policy_version 90990 (0.0009) +[2023-10-08 15:23:43,905][102897] Updated weights for policy 0, policy_version 90880 (0.0007) +[2023-10-08 15:23:43,939][102898] Updated weights for policy 1, policy_version 91000 (0.0008) +[2023-10-08 15:23:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 186253312. Throughput: 0: 1780.4, 1: 1802.1. Samples: 46577388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:46,876][101941] Avg episode reward: [(0, '9.390'), (1, '17.630')] +[2023-10-08 15:23:47,727][102897] Updated weights for policy 0, policy_version 90890 (0.0008) +[2023-10-08 15:23:47,782][102898] Updated weights for policy 1, policy_version 91010 (0.0010) +[2023-10-08 15:23:48,094][102897] Updated weights for policy 0, policy_version 90900 (0.0008) +[2023-10-08 15:23:48,149][102898] Updated weights for policy 1, policy_version 91020 (0.0007) +[2023-10-08 15:23:48,466][102897] Updated weights for policy 0, policy_version 90910 (0.0008) +[2023-10-08 15:23:48,511][102898] Updated weights for policy 1, policy_version 91030 (0.0008) +[2023-10-08 15:23:48,877][102898] Updated weights for policy 1, policy_version 91040 (0.0010) +[2023-10-08 15:23:51,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 186318848. Throughput: 0: 1775.0, 1: 1801.4. Samples: 46587034. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:51,876][101941] Avg episode reward: [(0, '8.890'), (1, '20.170')] +[2023-10-08 15:23:52,217][102897] Updated weights for policy 0, policy_version 90920 (0.0009) +[2023-10-08 15:23:52,586][102897] Updated weights for policy 0, policy_version 90930 (0.0009) +[2023-10-08 15:23:52,686][102898] Updated weights for policy 1, policy_version 91050 (0.0007) +[2023-10-08 15:23:52,957][102897] Updated weights for policy 0, policy_version 90940 (0.0008) +[2023-10-08 15:23:53,047][102898] Updated weights for policy 1, policy_version 91060 (0.0008) +[2023-10-08 15:23:53,410][102898] Updated weights for policy 1, policy_version 91070 (0.0008) +[2023-10-08 15:23:56,818][102897] Updated weights for policy 0, policy_version 90950 (0.0008) +[2023-10-08 15:23:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 186384384. Throughput: 0: 1774.8, 1: 1788.7. Samples: 46609172. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:23:56,876][101941] Avg episode reward: [(0, '8.940'), (1, '19.040')] +[2023-10-08 15:23:57,192][102897] Updated weights for policy 0, policy_version 90960 (0.0008) +[2023-10-08 15:23:57,322][102898] Updated weights for policy 1, policy_version 91080 (0.0007) +[2023-10-08 15:23:57,564][102897] Updated weights for policy 0, policy_version 90970 (0.0008) +[2023-10-08 15:23:57,681][102898] Updated weights for policy 1, policy_version 91090 (0.0008) +[2023-10-08 15:23:58,046][102898] Updated weights for policy 1, policy_version 91100 (0.0008) +[2023-10-08 15:24:01,300][102897] Updated weights for policy 0, policy_version 90980 (0.0007) +[2023-10-08 15:24:01,664][102897] Updated weights for policy 0, policy_version 90990 (0.0008) +[2023-10-08 15:24:01,838][102898] Updated weights for policy 1, policy_version 91110 (0.0008) +[2023-10-08 15:24:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 186449920. Throughput: 0: 1794.4, 1: 1798.3. Samples: 46630902. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:24:01,876][101941] Avg episode reward: [(0, '9.000'), (1, '17.950')] +[2023-10-08 15:24:02,039][102897] Updated weights for policy 0, policy_version 91000 (0.0007) +[2023-10-08 15:24:02,197][102898] Updated weights for policy 1, policy_version 91120 (0.0007) +[2023-10-08 15:24:02,567][102898] Updated weights for policy 1, policy_version 91130 (0.0008) +[2023-10-08 15:24:05,748][102897] Updated weights for policy 0, policy_version 91010 (0.0008) +[2023-10-08 15:24:06,121][102897] Updated weights for policy 0, policy_version 91020 (0.0009) +[2023-10-08 15:24:06,289][102898] Updated weights for policy 1, policy_version 91140 (0.0007) +[2023-10-08 15:24:06,488][102897] Updated weights for policy 0, policy_version 91030 (0.0008) +[2023-10-08 15:24:06,665][102898] Updated weights for policy 1, policy_version 91150 (0.0007) +[2023-10-08 15:24:06,862][102897] Updated weights for policy 0, policy_version 91040 (0.0009) +[2023-10-08 15:24:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 186548224. Throughput: 0: 1770.1, 1: 1776.7. Samples: 46641074. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:24:06,876][101941] Avg episode reward: [(0, '9.040'), (1, '19.690')] +[2023-10-08 15:24:07,020][102898] Updated weights for policy 1, policy_version 91160 (0.0007) +[2023-10-08 15:24:10,518][102897] Updated weights for policy 0, policy_version 91050 (0.0008) +[2023-10-08 15:24:10,886][102897] Updated weights for policy 0, policy_version 91060 (0.0008) +[2023-10-08 15:24:10,936][102898] Updated weights for policy 1, policy_version 91170 (0.0009) +[2023-10-08 15:24:11,255][102897] Updated weights for policy 0, policy_version 91070 (0.0008) +[2023-10-08 15:24:11,305][102898] Updated weights for policy 1, policy_version 91180 (0.0007) +[2023-10-08 15:24:11,667][102898] Updated weights for policy 1, policy_version 91190 (0.0008) +[2023-10-08 15:24:11,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 186613760. Throughput: 0: 1797.3, 1: 1790.5. Samples: 46663230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:24:11,875][101941] Avg episode reward: [(0, '9.730'), (1, '19.880')] +[2023-10-08 15:24:12,038][102898] Updated weights for policy 1, policy_version 91200 (0.0009) +[2023-10-08 15:24:14,835][102897] Updated weights for policy 0, policy_version 91080 (0.0007) +[2023-10-08 15:24:15,197][102897] Updated weights for policy 0, policy_version 91090 (0.0007) +[2023-10-08 15:24:15,572][102897] Updated weights for policy 0, policy_version 91100 (0.0007) +[2023-10-08 15:24:15,633][102898] Updated weights for policy 1, policy_version 91210 (0.0007) +[2023-10-08 15:24:15,991][102898] Updated weights for policy 1, policy_version 91220 (0.0008) +[2023-10-08 15:24:16,359][102898] Updated weights for policy 1, policy_version 91230 (0.0008) +[2023-10-08 15:24:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 186712064. Throughput: 0: 1786.4, 1: 1767.3. Samples: 46683586. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:24:16,876][101941] Avg episode reward: [(0, '9.920'), (1, '20.870')] +[2023-10-08 15:24:16,888][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000091232_93421568.pth... +[2023-10-08 15:24:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000091104_93290496.pth... +[2023-10-08 15:24:16,924][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000089440_91586560.pth +[2023-10-08 15:24:16,929][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000089536_91684864.pth +[2023-10-08 15:24:19,235][102897] Updated weights for policy 0, policy_version 91110 (0.0009) +[2023-10-08 15:24:19,606][102897] Updated weights for policy 0, policy_version 91120 (0.0008) +[2023-10-08 15:24:19,986][102897] Updated weights for policy 0, policy_version 91130 (0.0009) +[2023-10-08 15:24:20,261][102898] Updated weights for policy 1, policy_version 91240 (0.0007) +[2023-10-08 15:24:20,634][102898] Updated weights for policy 1, policy_version 91250 (0.0008) +[2023-10-08 15:24:20,990][102898] Updated weights for policy 1, policy_version 91260 (0.0009) +[2023-10-08 15:24:21,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 186777600. Throughput: 0: 1802.9, 1: 1787.5. Samples: 46695902. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:24:21,876][101941] Avg episode reward: [(0, '9.790'), (1, '19.510')] +[2023-10-08 15:24:23,838][102897] Updated weights for policy 0, policy_version 91140 (0.0008) +[2023-10-08 15:24:24,209][102897] Updated weights for policy 0, policy_version 91150 (0.0009) +[2023-10-08 15:24:24,586][102897] Updated weights for policy 0, policy_version 91160 (0.0010) +[2023-10-08 15:24:24,694][102898] Updated weights for policy 1, policy_version 91270 (0.0008) +[2023-10-08 15:24:25,060][102898] Updated weights for policy 1, policy_version 91280 (0.0009) +[2023-10-08 15:24:25,432][102898] Updated weights for policy 1, policy_version 91290 (0.0009) +[2023-10-08 15:24:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 186843136. Throughput: 0: 1786.1, 1: 1783.2. Samples: 46715986. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:26,876][101941] Avg episode reward: [(0, '9.000'), (1, '18.090')] +[2023-10-08 15:24:28,690][102897] Updated weights for policy 0, policy_version 91170 (0.0009) +[2023-10-08 15:24:29,052][102897] Updated weights for policy 0, policy_version 91180 (0.0010) +[2023-10-08 15:24:29,423][102897] Updated weights for policy 0, policy_version 91190 (0.0009) +[2023-10-08 15:24:29,579][102898] Updated weights for policy 1, policy_version 91300 (0.0007) +[2023-10-08 15:24:29,789][102897] Updated weights for policy 0, policy_version 91200 (0.0009) +[2023-10-08 15:24:29,936][102898] Updated weights for policy 1, policy_version 91310 (0.0008) +[2023-10-08 15:24:30,306][102898] Updated weights for policy 1, policy_version 91320 (0.0010) +[2023-10-08 15:24:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 186908672. Throughput: 0: 1769.0, 1: 1759.6. Samples: 46736176. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:31,876][101941] Avg episode reward: [(0, '8.870'), (1, '18.070')] +[2023-10-08 15:24:33,956][102897] Updated weights for policy 0, policy_version 91210 (0.0007) +[2023-10-08 15:24:34,310][102898] Updated weights for policy 1, policy_version 91330 (0.0011) +[2023-10-08 15:24:34,327][102897] Updated weights for policy 0, policy_version 91220 (0.0011) +[2023-10-08 15:24:34,675][102898] Updated weights for policy 1, policy_version 91340 (0.0009) +[2023-10-08 15:24:34,690][102897] Updated weights for policy 0, policy_version 91230 (0.0009) +[2023-10-08 15:24:35,040][102898] Updated weights for policy 1, policy_version 91350 (0.0008) +[2023-10-08 15:24:35,403][102898] Updated weights for policy 1, policy_version 91360 (0.0010) +[2023-10-08 15:24:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 186974208. Throughput: 0: 1775.8, 1: 1780.1. Samples: 46747050. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:36,876][101941] Avg episode reward: [(0, '9.120'), (1, '17.840')] +[2023-10-08 15:24:38,762][102897] Updated weights for policy 0, policy_version 91240 (0.0009) +[2023-10-08 15:24:39,139][102897] Updated weights for policy 0, policy_version 91250 (0.0010) +[2023-10-08 15:24:39,450][102898] Updated weights for policy 1, policy_version 91370 (0.0009) +[2023-10-08 15:24:39,498][102897] Updated weights for policy 0, policy_version 91260 (0.0010) +[2023-10-08 15:24:39,807][102898] Updated weights for policy 1, policy_version 91380 (0.0010) +[2023-10-08 15:24:40,182][102898] Updated weights for policy 1, policy_version 91390 (0.0009) +[2023-10-08 15:24:41,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 187039744. Throughput: 0: 1745.1, 1: 1742.9. Samples: 46766130. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:41,876][101941] Avg episode reward: [(0, '8.150'), (1, '17.930')] +[2023-10-08 15:24:43,628][102897] Updated weights for policy 0, policy_version 91270 (0.0008) +[2023-10-08 15:24:43,988][102897] Updated weights for policy 0, policy_version 91280 (0.0010) +[2023-10-08 15:24:44,270][102898] Updated weights for policy 1, policy_version 91400 (0.0010) +[2023-10-08 15:24:44,350][102897] Updated weights for policy 0, policy_version 91290 (0.0008) +[2023-10-08 15:24:44,641][102898] Updated weights for policy 1, policy_version 91410 (0.0009) +[2023-10-08 15:24:44,995][102898] Updated weights for policy 1, policy_version 91420 (0.0011) +[2023-10-08 15:24:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 187105280. Throughput: 0: 1733.3, 1: 1726.4. Samples: 46786586. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:46,875][101941] Avg episode reward: [(0, '8.480'), (1, '17.670')] +[2023-10-08 15:24:48,491][102897] Updated weights for policy 0, policy_version 91300 (0.0009) +[2023-10-08 15:24:48,863][102897] Updated weights for policy 0, policy_version 91310 (0.0009) +[2023-10-08 15:24:49,098][102898] Updated weights for policy 1, policy_version 91430 (0.0010) +[2023-10-08 15:24:49,230][102897] Updated weights for policy 0, policy_version 91320 (0.0009) +[2023-10-08 15:24:49,455][102898] Updated weights for policy 1, policy_version 91440 (0.0009) +[2023-10-08 15:24:49,833][102898] Updated weights for policy 1, policy_version 91450 (0.0009) +[2023-10-08 15:24:51,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 187170816. Throughput: 0: 1719.0, 1: 1731.3. Samples: 46796338. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:51,876][101941] Avg episode reward: [(0, '9.550'), (1, '19.300')] +[2023-10-08 15:24:53,261][102897] Updated weights for policy 0, policy_version 91330 (0.0007) +[2023-10-08 15:24:53,631][102897] Updated weights for policy 0, policy_version 91340 (0.0010) +[2023-10-08 15:24:53,896][102898] Updated weights for policy 1, policy_version 91460 (0.0009) +[2023-10-08 15:24:54,002][102897] Updated weights for policy 0, policy_version 91350 (0.0009) +[2023-10-08 15:24:54,263][102898] Updated weights for policy 1, policy_version 91470 (0.0008) +[2023-10-08 15:24:54,365][102897] Updated weights for policy 0, policy_version 91360 (0.0009) +[2023-10-08 15:24:54,619][102898] Updated weights for policy 1, policy_version 91480 (0.0009) +[2023-10-08 15:24:56,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 187236352. Throughput: 0: 1698.0, 1: 1700.2. Samples: 46816146. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:24:56,876][101941] Avg episode reward: [(0, '9.260'), (1, '19.250')] +[2023-10-08 15:24:58,488][102897] Updated weights for policy 0, policy_version 91370 (0.0009) +[2023-10-08 15:24:58,681][102898] Updated weights for policy 1, policy_version 91490 (0.0009) +[2023-10-08 15:24:58,855][102897] Updated weights for policy 0, policy_version 91380 (0.0008) +[2023-10-08 15:24:59,050][102898] Updated weights for policy 1, policy_version 91500 (0.0009) +[2023-10-08 15:24:59,226][102897] Updated weights for policy 0, policy_version 91390 (0.0008) +[2023-10-08 15:24:59,416][102898] Updated weights for policy 1, policy_version 91510 (0.0009) +[2023-10-08 15:24:59,779][102898] Updated weights for policy 1, policy_version 91520 (0.0009) +[2023-10-08 15:25:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 187301888. Throughput: 0: 1695.0, 1: 1704.9. Samples: 46836580. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:25:01,875][101941] Avg episode reward: [(0, '8.980'), (1, '22.020')] +[2023-10-08 15:25:03,411][102897] Updated weights for policy 0, policy_version 91400 (0.0009) +[2023-10-08 15:25:03,782][102897] Updated weights for policy 0, policy_version 91410 (0.0008) +[2023-10-08 15:25:04,026][102898] Updated weights for policy 1, policy_version 91530 (0.0010) +[2023-10-08 15:25:04,155][102897] Updated weights for policy 0, policy_version 91420 (0.0008) +[2023-10-08 15:25:04,382][102898] Updated weights for policy 1, policy_version 91540 (0.0008) +[2023-10-08 15:25:04,747][102898] Updated weights for policy 1, policy_version 91550 (0.0008) +[2023-10-08 15:25:06,875][101941] Fps is (10 sec: 13107.1, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 187367424. Throughput: 0: 1659.4, 1: 1674.0. Samples: 46845906. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:25:06,876][101941] Avg episode reward: [(0, '8.970'), (1, '21.540')] +[2023-10-08 15:25:07,913][102897] Updated weights for policy 0, policy_version 91430 (0.0008) +[2023-10-08 15:25:08,276][102897] Updated weights for policy 0, policy_version 91440 (0.0007) +[2023-10-08 15:25:08,603][102898] Updated weights for policy 1, policy_version 91560 (0.0008) +[2023-10-08 15:25:08,638][102897] Updated weights for policy 0, policy_version 91450 (0.0007) +[2023-10-08 15:25:08,980][102898] Updated weights for policy 1, policy_version 91570 (0.0009) +[2023-10-08 15:25:09,346][102898] Updated weights for policy 1, policy_version 91580 (0.0008) +[2023-10-08 15:25:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 187432960. Throughput: 0: 1688.8, 1: 1686.7. Samples: 46867882. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:25:11,876][101941] Avg episode reward: [(0, '8.800'), (1, '21.270')] +[2023-10-08 15:25:12,346][102897] Updated weights for policy 0, policy_version 91460 (0.0008) +[2023-10-08 15:25:12,723][102897] Updated weights for policy 0, policy_version 91470 (0.0007) +[2023-10-08 15:25:12,970][102898] Updated weights for policy 1, policy_version 91590 (0.0010) +[2023-10-08 15:25:13,092][102897] Updated weights for policy 0, policy_version 91480 (0.0007) +[2023-10-08 15:25:13,334][102898] Updated weights for policy 1, policy_version 91600 (0.0008) +[2023-10-08 15:25:13,701][102898] Updated weights for policy 1, policy_version 91610 (0.0009) +[2023-10-08 15:25:16,737][102897] Updated weights for policy 0, policy_version 91490 (0.0008) +[2023-10-08 15:25:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 13107.2, 300 sec: 14218.0). Total num frames: 187498496. Throughput: 0: 1710.9, 1: 1716.3. Samples: 46890402. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:25:16,876][101941] Avg episode reward: [(0, '9.330'), (1, '20.990')] +[2023-10-08 15:25:17,099][102897] Updated weights for policy 0, policy_version 91500 (0.0008) +[2023-10-08 15:25:17,392][102898] Updated weights for policy 1, policy_version 91620 (0.0008) +[2023-10-08 15:25:17,478][102897] Updated weights for policy 0, policy_version 91510 (0.0009) +[2023-10-08 15:25:17,760][102898] Updated weights for policy 1, policy_version 91630 (0.0008) +[2023-10-08 15:25:17,844][102897] Updated weights for policy 0, policy_version 91520 (0.0007) +[2023-10-08 15:25:18,126][102898] Updated weights for policy 1, policy_version 91640 (0.0007) +[2023-10-08 15:25:21,764][102897] Updated weights for policy 0, policy_version 91530 (0.0008) +[2023-10-08 15:25:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 14106.9). Total num frames: 187564032. Throughput: 0: 1703.5, 1: 1697.4. Samples: 46900088. Policy #0 lag: (min: 31.0, avg: 34.1, max: 63.0) +[2023-10-08 15:25:21,875][101941] Avg episode reward: [(0, '10.000'), (1, '21.250')] +[2023-10-08 15:25:21,944][102898] Updated weights for policy 1, policy_version 91650 (0.0009) +[2023-10-08 15:25:22,131][102897] Updated weights for policy 0, policy_version 91540 (0.0008) +[2023-10-08 15:25:22,299][102898] Updated weights for policy 1, policy_version 91660 (0.0008) +[2023-10-08 15:25:22,506][102897] Updated weights for policy 0, policy_version 91550 (0.0008) +[2023-10-08 15:25:22,679][102898] Updated weights for policy 1, policy_version 91670 (0.0008) +[2023-10-08 15:25:23,034][102898] Updated weights for policy 1, policy_version 91680 (0.0008) +[2023-10-08 15:25:26,374][102897] Updated weights for policy 0, policy_version 91560 (0.0008) +[2023-10-08 15:25:26,749][102897] Updated weights for policy 0, policy_version 91570 (0.0007) +[2023-10-08 15:25:26,854][102898] Updated weights for policy 1, policy_version 91690 (0.0009) +[2023-10-08 15:25:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 13107.2, 300 sec: 14106.9). Total num frames: 187629568. Throughput: 0: 1733.5, 1: 1734.9. Samples: 46922208. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:26,876][101941] Avg episode reward: [(0, '10.320'), (1, '21.940')] +[2023-10-08 15:25:27,117][102897] Updated weights for policy 0, policy_version 91580 (0.0007) +[2023-10-08 15:25:27,215][102898] Updated weights for policy 1, policy_version 91700 (0.0008) +[2023-10-08 15:25:27,582][102898] Updated weights for policy 1, policy_version 91710 (0.0008) +[2023-10-08 15:25:30,724][102897] Updated weights for policy 0, policy_version 91590 (0.0008) +[2023-10-08 15:25:31,096][102897] Updated weights for policy 0, policy_version 91600 (0.0007) +[2023-10-08 15:25:31,412][102898] Updated weights for policy 1, policy_version 91720 (0.0007) +[2023-10-08 15:25:31,474][102897] Updated weights for policy 0, policy_version 91610 (0.0008) +[2023-10-08 15:25:31,775][102898] Updated weights for policy 1, policy_version 91730 (0.0008) +[2023-10-08 15:25:31,875][101941] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 14218.0). Total num frames: 187727872. Throughput: 0: 1731.8, 1: 1749.2. Samples: 46943230. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:31,875][101941] Avg episode reward: [(0, '9.780'), (1, '23.600')] +[2023-10-08 15:25:32,149][102898] Updated weights for policy 1, policy_version 91740 (0.0010) +[2023-10-08 15:25:32,288][102760] Saving new best policy, reward=23.600! +[2023-10-08 15:25:35,257][102897] Updated weights for policy 0, policy_version 91620 (0.0007) +[2023-10-08 15:25:35,623][102897] Updated weights for policy 0, policy_version 91630 (0.0009) +[2023-10-08 15:25:35,929][102898] Updated weights for policy 1, policy_version 91750 (0.0008) +[2023-10-08 15:25:35,996][102897] Updated weights for policy 0, policy_version 91640 (0.0007) +[2023-10-08 15:25:36,307][102898] Updated weights for policy 1, policy_version 91760 (0.0007) +[2023-10-08 15:25:36,678][102898] Updated weights for policy 1, policy_version 91770 (0.0008) +[2023-10-08 15:25:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 13653.4, 300 sec: 14218.0). Total num frames: 187793408. Throughput: 0: 1760.5, 1: 1751.9. Samples: 46954396. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:36,875][101941] Avg episode reward: [(0, '9.570'), (1, '23.750')] +[2023-10-08 15:25:36,888][102760] Saving new best policy, reward=23.750! +[2023-10-08 15:25:39,927][102897] Updated weights for policy 0, policy_version 91650 (0.0008) +[2023-10-08 15:25:40,292][102897] Updated weights for policy 0, policy_version 91660 (0.0010) +[2023-10-08 15:25:40,454][102898] Updated weights for policy 1, policy_version 91780 (0.0010) +[2023-10-08 15:25:40,668][102897] Updated weights for policy 0, policy_version 91670 (0.0007) +[2023-10-08 15:25:40,824][102898] Updated weights for policy 1, policy_version 91790 (0.0008) +[2023-10-08 15:25:41,027][102897] Updated weights for policy 0, policy_version 91680 (0.0009) +[2023-10-08 15:25:41,179][102898] Updated weights for policy 1, policy_version 91800 (0.0008) +[2023-10-08 15:25:41,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 187891712. Throughput: 0: 1770.4, 1: 1780.9. Samples: 46975952. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:41,876][101941] Avg episode reward: [(0, '9.200'), (1, '21.400')] +[2023-10-08 15:25:44,719][102897] Updated weights for policy 0, policy_version 91690 (0.0007) +[2023-10-08 15:25:45,082][102897] Updated weights for policy 0, policy_version 91700 (0.0007) +[2023-10-08 15:25:45,086][102898] Updated weights for policy 1, policy_version 91810 (0.0010) +[2023-10-08 15:25:45,459][102897] Updated weights for policy 0, policy_version 91710 (0.0009) +[2023-10-08 15:25:45,459][102898] Updated weights for policy 1, policy_version 91820 (0.0008) +[2023-10-08 15:25:45,817][102898] Updated weights for policy 1, policy_version 91830 (0.0010) +[2023-10-08 15:25:46,182][102898] Updated weights for policy 1, policy_version 91840 (0.0008) +[2023-10-08 15:25:46,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 187957248. Throughput: 0: 1772.5, 1: 1771.1. Samples: 46996044. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:46,876][101941] Avg episode reward: [(0, '9.610'), (1, '21.310')] +[2023-10-08 15:25:49,260][102897] Updated weights for policy 0, policy_version 91720 (0.0008) +[2023-10-08 15:25:49,629][102897] Updated weights for policy 0, policy_version 91730 (0.0007) +[2023-10-08 15:25:49,721][102898] Updated weights for policy 1, policy_version 91850 (0.0008) +[2023-10-08 15:25:50,004][102897] Updated weights for policy 0, policy_version 91740 (0.0008) +[2023-10-08 15:25:50,096][102898] Updated weights for policy 1, policy_version 91860 (0.0007) +[2023-10-08 15:25:50,453][102898] Updated weights for policy 1, policy_version 91870 (0.0009) +[2023-10-08 15:25:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 188022784. Throughput: 0: 1802.1, 1: 1802.1. Samples: 47008096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:51,875][101941] Avg episode reward: [(0, '9.710'), (1, '21.230')] +[2023-10-08 15:25:53,893][102897] Updated weights for policy 0, policy_version 91750 (0.0008) +[2023-10-08 15:25:54,257][102897] Updated weights for policy 0, policy_version 91760 (0.0008) +[2023-10-08 15:25:54,432][102898] Updated weights for policy 1, policy_version 91880 (0.0008) +[2023-10-08 15:25:54,627][102897] Updated weights for policy 0, policy_version 91770 (0.0008) +[2023-10-08 15:25:54,787][102898] Updated weights for policy 1, policy_version 91890 (0.0007) +[2023-10-08 15:25:55,153][102898] Updated weights for policy 1, policy_version 91900 (0.0008) +[2023-10-08 15:25:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 188088320. Throughput: 0: 1771.7, 1: 1783.1. Samples: 47027848. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:25:56,876][101941] Avg episode reward: [(0, '9.590'), (1, '21.010')] +[2023-10-08 15:25:58,355][102897] Updated weights for policy 0, policy_version 91780 (0.0008) +[2023-10-08 15:25:58,726][102897] Updated weights for policy 0, policy_version 91790 (0.0007) +[2023-10-08 15:25:59,069][102898] Updated weights for policy 1, policy_version 91910 (0.0009) +[2023-10-08 15:25:59,093][102897] Updated weights for policy 0, policy_version 91800 (0.0008) +[2023-10-08 15:25:59,450][102898] Updated weights for policy 1, policy_version 91920 (0.0007) +[2023-10-08 15:25:59,823][102898] Updated weights for policy 1, policy_version 91930 (0.0010) +[2023-10-08 15:26:01,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 188153856. Throughput: 0: 1775.1, 1: 1778.0. Samples: 47050292. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:01,876][101941] Avg episode reward: [(0, '8.670'), (1, '20.140')] +[2023-10-08 15:26:02,790][102897] Updated weights for policy 0, policy_version 91810 (0.0008) +[2023-10-08 15:26:03,166][102897] Updated weights for policy 0, policy_version 91820 (0.0008) +[2023-10-08 15:26:03,519][102898] Updated weights for policy 1, policy_version 91940 (0.0009) +[2023-10-08 15:26:03,541][102897] Updated weights for policy 0, policy_version 91830 (0.0007) +[2023-10-08 15:26:03,879][102898] Updated weights for policy 1, policy_version 91950 (0.0009) +[2023-10-08 15:26:03,909][102897] Updated weights for policy 0, policy_version 91840 (0.0008) +[2023-10-08 15:26:04,247][102898] Updated weights for policy 1, policy_version 91960 (0.0007) +[2023-10-08 15:26:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 188219392. Throughput: 0: 1777.4, 1: 1778.5. Samples: 47060102. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:06,876][101941] Avg episode reward: [(0, '9.150'), (1, '19.190')] +[2023-10-08 15:26:07,632][102897] Updated weights for policy 0, policy_version 91850 (0.0007) +[2023-10-08 15:26:07,989][102897] Updated weights for policy 0, policy_version 91860 (0.0009) +[2023-10-08 15:26:08,007][102898] Updated weights for policy 1, policy_version 91970 (0.0007) +[2023-10-08 15:26:08,357][102897] Updated weights for policy 0, policy_version 91870 (0.0008) +[2023-10-08 15:26:08,375][102898] Updated weights for policy 1, policy_version 91980 (0.0008) +[2023-10-08 15:26:08,732][102898] Updated weights for policy 1, policy_version 91990 (0.0008) +[2023-10-08 15:26:09,092][102898] Updated weights for policy 1, policy_version 92000 (0.0007) +[2023-10-08 15:26:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 188284928. Throughput: 0: 1781.7, 1: 1779.2. Samples: 47082450. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:11,876][101941] Avg episode reward: [(0, '9.360'), (1, '18.960')] +[2023-10-08 15:26:12,085][102897] Updated weights for policy 0, policy_version 91880 (0.0008) +[2023-10-08 15:26:12,460][102897] Updated weights for policy 0, policy_version 91890 (0.0008) +[2023-10-08 15:26:12,775][102898] Updated weights for policy 1, policy_version 92010 (0.0007) +[2023-10-08 15:26:12,827][102897] Updated weights for policy 0, policy_version 91900 (0.0007) +[2023-10-08 15:26:13,138][102898] Updated weights for policy 1, policy_version 92020 (0.0007) +[2023-10-08 15:26:13,513][102898] Updated weights for policy 1, policy_version 92030 (0.0007) +[2023-10-08 15:26:16,632][102897] Updated weights for policy 0, policy_version 91910 (0.0007) +[2023-10-08 15:26:16,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 188350464. Throughput: 0: 1801.6, 1: 1783.7. Samples: 47104566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:16,875][101941] Avg episode reward: [(0, '9.110'), (1, '19.650')] +[2023-10-08 15:26:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000092032_94240768.pth... +[2023-10-08 15:26:16,929][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000090400_92569600.pth +[2023-10-08 15:26:16,934][102760] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p1/milestones/checkpoint_000092032_94240768.pth +[2023-10-08 15:26:17,003][102897] Updated weights for policy 0, policy_version 91920 (0.0007) +[2023-10-08 15:26:17,371][102897] Updated weights for policy 0, policy_version 91930 (0.0008) +[2023-10-08 15:26:17,398][102898] Updated weights for policy 1, policy_version 92040 (0.0009) +[2023-10-08 15:26:17,588][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000091936_94142464.pth... +[2023-10-08 15:26:17,618][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000090272_92438528.pth +[2023-10-08 15:26:17,622][102634] Saving a milestone ./train_atari/atari_asteroid_APPO/checkpoint_p0/milestones/checkpoint_000091936_94142464.pth +[2023-10-08 15:26:17,758][102898] Updated weights for policy 1, policy_version 92050 (0.0008) +[2023-10-08 15:26:18,131][102898] Updated weights for policy 1, policy_version 92060 (0.0009) +[2023-10-08 15:26:21,203][102897] Updated weights for policy 0, policy_version 91940 (0.0009) +[2023-10-08 15:26:21,577][102897] Updated weights for policy 0, policy_version 91950 (0.0011) +[2023-10-08 15:26:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 188416000. Throughput: 0: 1780.1, 1: 1776.5. Samples: 47114442. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:21,876][101941] Avg episode reward: [(0, '8.940'), (1, '20.600')] +[2023-10-08 15:26:21,933][102898] Updated weights for policy 1, policy_version 92070 (0.0007) +[2023-10-08 15:26:21,943][102897] Updated weights for policy 0, policy_version 91960 (0.0009) +[2023-10-08 15:26:22,296][102898] Updated weights for policy 1, policy_version 92080 (0.0010) +[2023-10-08 15:26:22,661][102898] Updated weights for policy 1, policy_version 92090 (0.0008) +[2023-10-08 15:26:25,598][102897] Updated weights for policy 0, policy_version 91970 (0.0007) +[2023-10-08 15:26:25,969][102897] Updated weights for policy 0, policy_version 91980 (0.0010) +[2023-10-08 15:26:26,343][102897] Updated weights for policy 0, policy_version 91990 (0.0010) +[2023-10-08 15:26:26,605][102898] Updated weights for policy 1, policy_version 92100 (0.0009) +[2023-10-08 15:26:26,719][102897] Updated weights for policy 0, policy_version 92000 (0.0008) +[2023-10-08 15:26:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 188514304. Throughput: 0: 1796.2, 1: 1776.0. Samples: 47136700. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:26,876][101941] Avg episode reward: [(0, '9.600'), (1, '23.100')] +[2023-10-08 15:26:26,966][102898] Updated weights for policy 1, policy_version 92110 (0.0009) +[2023-10-08 15:26:27,339][102898] Updated weights for policy 1, policy_version 92120 (0.0008) +[2023-10-08 15:26:30,294][102897] Updated weights for policy 0, policy_version 92010 (0.0007) +[2023-10-08 15:26:30,662][102897] Updated weights for policy 0, policy_version 92020 (0.0008) +[2023-10-08 15:26:31,041][102897] Updated weights for policy 0, policy_version 92030 (0.0008) +[2023-10-08 15:26:31,095][102898] Updated weights for policy 1, policy_version 92130 (0.0011) +[2023-10-08 15:26:31,463][102898] Updated weights for policy 1, policy_version 92140 (0.0008) +[2023-10-08 15:26:31,820][102898] Updated weights for policy 1, policy_version 92150 (0.0010) +[2023-10-08 15:26:31,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 188579840. Throughput: 0: 1787.6, 1: 1795.5. Samples: 47157286. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:31,876][101941] Avg episode reward: [(0, '9.800'), (1, '23.080')] +[2023-10-08 15:26:32,185][102898] Updated weights for policy 1, policy_version 92160 (0.0010) +[2023-10-08 15:26:34,814][102897] Updated weights for policy 0, policy_version 92040 (0.0008) +[2023-10-08 15:26:35,183][102897] Updated weights for policy 0, policy_version 92050 (0.0009) +[2023-10-08 15:26:35,547][102897] Updated weights for policy 0, policy_version 92060 (0.0008) +[2023-10-08 15:26:35,996][102898] Updated weights for policy 1, policy_version 92170 (0.0007) +[2023-10-08 15:26:36,354][102898] Updated weights for policy 1, policy_version 92180 (0.0007) +[2023-10-08 15:26:36,730][102898] Updated weights for policy 1, policy_version 92190 (0.0009) +[2023-10-08 15:26:36,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 188678144. Throughput: 0: 1804.0, 1: 1775.4. Samples: 47169170. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:36,875][101941] Avg episode reward: [(0, '10.020'), (1, '23.160')] +[2023-10-08 15:26:39,185][102897] Updated weights for policy 0, policy_version 92070 (0.0009) +[2023-10-08 15:26:39,569][102897] Updated weights for policy 0, policy_version 92080 (0.0008) +[2023-10-08 15:26:39,941][102897] Updated weights for policy 0, policy_version 92090 (0.0008) +[2023-10-08 15:26:40,379][102898] Updated weights for policy 1, policy_version 92200 (0.0008) +[2023-10-08 15:26:40,740][102898] Updated weights for policy 1, policy_version 92210 (0.0009) +[2023-10-08 15:26:41,113][102898] Updated weights for policy 1, policy_version 92220 (0.0007) +[2023-10-08 15:26:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 188743680. Throughput: 0: 1794.9, 1: 1806.1. Samples: 47189894. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:41,876][101941] Avg episode reward: [(0, '9.890'), (1, '22.880')] +[2023-10-08 15:26:43,843][102897] Updated weights for policy 0, policy_version 92100 (0.0008) +[2023-10-08 15:26:44,219][102897] Updated weights for policy 0, policy_version 92110 (0.0009) +[2023-10-08 15:26:44,583][102897] Updated weights for policy 0, policy_version 92120 (0.0007) +[2023-10-08 15:26:44,999][102898] Updated weights for policy 1, policy_version 92230 (0.0007) +[2023-10-08 15:26:45,377][102898] Updated weights for policy 1, policy_version 92240 (0.0008) +[2023-10-08 15:26:45,754][102898] Updated weights for policy 1, policy_version 92250 (0.0007) +[2023-10-08 15:26:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 188809216. Throughput: 0: 1791.3, 1: 1782.3. Samples: 47211102. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:46,876][101941] Avg episode reward: [(0, '9.870'), (1, '23.020')] +[2023-10-08 15:26:48,285][102897] Updated weights for policy 0, policy_version 92130 (0.0007) +[2023-10-08 15:26:48,659][102897] Updated weights for policy 0, policy_version 92140 (0.0007) +[2023-10-08 15:26:49,030][102897] Updated weights for policy 0, policy_version 92150 (0.0009) +[2023-10-08 15:26:49,401][102897] Updated weights for policy 0, policy_version 92160 (0.0007) +[2023-10-08 15:26:49,402][102898] Updated weights for policy 1, policy_version 92260 (0.0007) +[2023-10-08 15:26:49,769][102898] Updated weights for policy 1, policy_version 92270 (0.0008) +[2023-10-08 15:26:50,140][102898] Updated weights for policy 1, policy_version 92280 (0.0007) +[2023-10-08 15:26:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 188874752. Throughput: 0: 1791.1, 1: 1808.8. Samples: 47222098. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:51,876][101941] Avg episode reward: [(0, '8.580'), (1, '24.320')] +[2023-10-08 15:26:51,877][102760] Saving new best policy, reward=24.320! +[2023-10-08 15:26:53,338][102897] Updated weights for policy 0, policy_version 92170 (0.0007) +[2023-10-08 15:26:53,645][102898] Updated weights for policy 1, policy_version 92290 (0.0009) +[2023-10-08 15:26:53,708][102897] Updated weights for policy 0, policy_version 92180 (0.0008) +[2023-10-08 15:26:54,007][102898] Updated weights for policy 1, policy_version 92300 (0.0009) +[2023-10-08 15:26:54,072][102897] Updated weights for policy 0, policy_version 92190 (0.0008) +[2023-10-08 15:26:54,372][102898] Updated weights for policy 1, policy_version 92310 (0.0010) +[2023-10-08 15:26:54,736][102898] Updated weights for policy 1, policy_version 92320 (0.0007) +[2023-10-08 15:26:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 188940288. Throughput: 0: 1786.5, 1: 1785.1. Samples: 47243168. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:26:56,875][101941] Avg episode reward: [(0, '9.010'), (1, '24.910')] +[2023-10-08 15:26:56,876][102760] Saving new best policy, reward=24.910! +[2023-10-08 15:26:57,941][102897] Updated weights for policy 0, policy_version 92200 (0.0008) +[2023-10-08 15:26:58,316][102897] Updated weights for policy 0, policy_version 92210 (0.0008) +[2023-10-08 15:26:58,378][102898] Updated weights for policy 1, policy_version 92330 (0.0008) +[2023-10-08 15:26:58,687][102897] Updated weights for policy 0, policy_version 92220 (0.0007) +[2023-10-08 15:26:58,746][102898] Updated weights for policy 1, policy_version 92340 (0.0008) +[2023-10-08 15:26:59,116][102898] Updated weights for policy 1, policy_version 92350 (0.0010) +[2023-10-08 15:27:01,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 189005824. Throughput: 0: 1784.1, 1: 1797.2. Samples: 47265726. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:27:01,875][101941] Avg episode reward: [(0, '9.020'), (1, '24.230')] +[2023-10-08 15:27:02,418][102897] Updated weights for policy 0, policy_version 92230 (0.0007) +[2023-10-08 15:27:02,786][102897] Updated weights for policy 0, policy_version 92240 (0.0008) +[2023-10-08 15:27:02,800][102898] Updated weights for policy 1, policy_version 92360 (0.0008) +[2023-10-08 15:27:03,154][102897] Updated weights for policy 0, policy_version 92250 (0.0007) +[2023-10-08 15:27:03,162][102898] Updated weights for policy 1, policy_version 92370 (0.0007) +[2023-10-08 15:27:03,535][102898] Updated weights for policy 1, policy_version 92380 (0.0008) +[2023-10-08 15:27:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 189071360. Throughput: 0: 1778.4, 1: 1798.7. Samples: 47275410. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:27:06,876][101941] Avg episode reward: [(0, '8.650'), (1, '22.840')] +[2023-10-08 15:27:06,997][102897] Updated weights for policy 0, policy_version 92260 (0.0009) +[2023-10-08 15:27:07,312][102898] Updated weights for policy 1, policy_version 92390 (0.0009) +[2023-10-08 15:27:07,361][102897] Updated weights for policy 0, policy_version 92270 (0.0008) +[2023-10-08 15:27:07,682][102898] Updated weights for policy 1, policy_version 92400 (0.0007) +[2023-10-08 15:27:07,722][102897] Updated weights for policy 0, policy_version 92280 (0.0007) +[2023-10-08 15:27:08,039][102898] Updated weights for policy 1, policy_version 92410 (0.0007) +[2023-10-08 15:27:11,603][102897] Updated weights for policy 0, policy_version 92290 (0.0007) +[2023-10-08 15:27:11,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 189136896. Throughput: 0: 1772.7, 1: 1802.1. Samples: 47297566. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:27:11,876][101941] Avg episode reward: [(0, '8.720'), (1, '19.480')] +[2023-10-08 15:27:11,934][102898] Updated weights for policy 1, policy_version 92420 (0.0008) +[2023-10-08 15:27:11,969][102897] Updated weights for policy 0, policy_version 92300 (0.0007) +[2023-10-08 15:27:12,299][102898] Updated weights for policy 1, policy_version 92430 (0.0008) +[2023-10-08 15:27:12,338][102897] Updated weights for policy 0, policy_version 92310 (0.0007) +[2023-10-08 15:27:12,672][102898] Updated weights for policy 1, policy_version 92440 (0.0009) +[2023-10-08 15:27:12,705][102897] Updated weights for policy 0, policy_version 92320 (0.0008) +[2023-10-08 15:27:16,419][102898] Updated weights for policy 1, policy_version 92450 (0.0008) +[2023-10-08 15:27:16,585][102897] Updated weights for policy 0, policy_version 92330 (0.0008) +[2023-10-08 15:27:16,774][102898] Updated weights for policy 1, policy_version 92460 (0.0009) +[2023-10-08 15:27:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 189202432. Throughput: 0: 1789.2, 1: 1812.4. Samples: 47319360. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:27:16,875][101941] Avg episode reward: [(0, '9.030'), (1, '19.030')] +[2023-10-08 15:27:16,955][102897] Updated weights for policy 0, policy_version 92340 (0.0009) +[2023-10-08 15:27:17,136][102898] Updated weights for policy 1, policy_version 92470 (0.0009) +[2023-10-08 15:27:17,315][102897] Updated weights for policy 0, policy_version 92350 (0.0007) +[2023-10-08 15:27:17,508][102898] Updated weights for policy 1, policy_version 92480 (0.0009) +[2023-10-08 15:27:21,341][102897] Updated weights for policy 0, policy_version 92360 (0.0008) +[2023-10-08 15:27:21,428][102898] Updated weights for policy 1, policy_version 92490 (0.0008) +[2023-10-08 15:27:21,711][102897] Updated weights for policy 0, policy_version 92370 (0.0007) +[2023-10-08 15:27:21,793][102898] Updated weights for policy 1, policy_version 92500 (0.0008) +[2023-10-08 15:27:21,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 189267968. Throughput: 0: 1754.5, 1: 1800.6. Samples: 47329152. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:27:21,875][101941] Avg episode reward: [(0, '8.390'), (1, '18.500')] +[2023-10-08 15:27:22,079][102897] Updated weights for policy 0, policy_version 92380 (0.0010) +[2023-10-08 15:27:22,156][102898] Updated weights for policy 1, policy_version 92510 (0.0008) +[2023-10-08 15:27:25,866][102898] Updated weights for policy 1, policy_version 92520 (0.0010) +[2023-10-08 15:27:25,982][102897] Updated weights for policy 0, policy_version 92390 (0.0009) +[2023-10-08 15:27:26,230][102898] Updated weights for policy 1, policy_version 92530 (0.0009) +[2023-10-08 15:27:26,348][102897] Updated weights for policy 0, policy_version 92400 (0.0007) +[2023-10-08 15:27:26,587][102898] Updated weights for policy 1, policy_version 92540 (0.0007) +[2023-10-08 15:27:26,724][102897] Updated weights for policy 0, policy_version 92410 (0.0008) +[2023-10-08 15:27:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 189366272. Throughput: 0: 1784.4, 1: 1802.3. Samples: 47351292. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:26,876][101941] Avg episode reward: [(0, '6.940'), (1, '20.820')] +[2023-10-08 15:27:30,255][102898] Updated weights for policy 1, policy_version 92550 (0.0007) +[2023-10-08 15:27:30,476][102897] Updated weights for policy 0, policy_version 92420 (0.0009) +[2023-10-08 15:27:30,613][102898] Updated weights for policy 1, policy_version 92560 (0.0008) +[2023-10-08 15:27:30,838][102897] Updated weights for policy 0, policy_version 92430 (0.0009) +[2023-10-08 15:27:30,984][102898] Updated weights for policy 1, policy_version 92570 (0.0008) +[2023-10-08 15:27:31,215][102897] Updated weights for policy 0, policy_version 92440 (0.0009) +[2023-10-08 15:27:31,875][101941] Fps is (10 sec: 19660.5, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 189464576. Throughput: 0: 1754.2, 1: 1795.9. Samples: 47370856. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:31,876][101941] Avg episode reward: [(0, '7.430'), (1, '22.520')] +[2023-10-08 15:27:34,909][102898] Updated weights for policy 1, policy_version 92580 (0.0007) +[2023-10-08 15:27:35,034][102897] Updated weights for policy 0, policy_version 92450 (0.0007) +[2023-10-08 15:27:35,273][102898] Updated weights for policy 1, policy_version 92590 (0.0007) +[2023-10-08 15:27:35,395][102897] Updated weights for policy 0, policy_version 92460 (0.0007) +[2023-10-08 15:27:35,634][102898] Updated weights for policy 1, policy_version 92600 (0.0007) +[2023-10-08 15:27:35,766][102897] Updated weights for policy 0, policy_version 92470 (0.0008) +[2023-10-08 15:27:36,135][102897] Updated weights for policy 0, policy_version 92480 (0.0008) +[2023-10-08 15:27:36,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 189530112. Throughput: 0: 1779.9, 1: 1794.2. Samples: 47382932. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:36,875][101941] Avg episode reward: [(0, '8.450'), (1, '22.780')] +[2023-10-08 15:27:39,331][102898] Updated weights for policy 1, policy_version 92610 (0.0008) +[2023-10-08 15:27:39,688][102898] Updated weights for policy 1, policy_version 92620 (0.0009) +[2023-10-08 15:27:39,824][102897] Updated weights for policy 0, policy_version 92490 (0.0007) +[2023-10-08 15:27:40,054][102898] Updated weights for policy 1, policy_version 92630 (0.0009) +[2023-10-08 15:27:40,183][102897] Updated weights for policy 0, policy_version 92500 (0.0007) +[2023-10-08 15:27:40,421][102898] Updated weights for policy 1, policy_version 92640 (0.0009) +[2023-10-08 15:27:40,554][102897] Updated weights for policy 0, policy_version 92510 (0.0008) +[2023-10-08 15:27:41,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 189595648. Throughput: 0: 1759.3, 1: 1793.3. Samples: 47403034. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:41,876][101941] Avg episode reward: [(0, '8.890'), (1, '21.810')] +[2023-10-08 15:27:44,240][102898] Updated weights for policy 1, policy_version 92650 (0.0009) +[2023-10-08 15:27:44,477][102897] Updated weights for policy 0, policy_version 92520 (0.0008) +[2023-10-08 15:27:44,614][102898] Updated weights for policy 1, policy_version 92660 (0.0007) +[2023-10-08 15:27:44,862][102897] Updated weights for policy 0, policy_version 92530 (0.0009) +[2023-10-08 15:27:44,969][102898] Updated weights for policy 1, policy_version 92670 (0.0008) +[2023-10-08 15:27:45,236][102897] Updated weights for policy 0, policy_version 92540 (0.0009) +[2023-10-08 15:27:46,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 189661184. Throughput: 0: 1752.6, 1: 1781.8. Samples: 47424774. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:46,876][101941] Avg episode reward: [(0, '9.080'), (1, '20.730')] +[2023-10-08 15:27:48,698][102898] Updated weights for policy 1, policy_version 92680 (0.0009) +[2023-10-08 15:27:48,945][102897] Updated weights for policy 0, policy_version 92550 (0.0009) +[2023-10-08 15:27:49,070][102898] Updated weights for policy 1, policy_version 92690 (0.0008) +[2023-10-08 15:27:49,321][102897] Updated weights for policy 0, policy_version 92560 (0.0007) +[2023-10-08 15:27:49,437][102898] Updated weights for policy 1, policy_version 92700 (0.0008) +[2023-10-08 15:27:49,695][102897] Updated weights for policy 0, policy_version 92570 (0.0007) +[2023-10-08 15:27:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 189726720. Throughput: 0: 1769.8, 1: 1784.4. Samples: 47435352. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:51,876][101941] Avg episode reward: [(0, '9.390'), (1, '20.120')] +[2023-10-08 15:27:53,254][102898] Updated weights for policy 1, policy_version 92710 (0.0008) +[2023-10-08 15:27:53,323][102897] Updated weights for policy 0, policy_version 92580 (0.0008) +[2023-10-08 15:27:53,611][102898] Updated weights for policy 1, policy_version 92720 (0.0007) +[2023-10-08 15:27:53,697][102897] Updated weights for policy 0, policy_version 92590 (0.0008) +[2023-10-08 15:27:53,973][102898] Updated weights for policy 1, policy_version 92730 (0.0008) +[2023-10-08 15:27:54,069][102897] Updated weights for policy 0, policy_version 92600 (0.0008) +[2023-10-08 15:27:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 189792256. Throughput: 0: 1760.7, 1: 1780.6. Samples: 47456924. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:27:56,876][101941] Avg episode reward: [(0, '9.310'), (1, '19.580')] +[2023-10-08 15:27:57,596][102898] Updated weights for policy 1, policy_version 92740 (0.0007) +[2023-10-08 15:27:57,740][102897] Updated weights for policy 0, policy_version 92610 (0.0008) +[2023-10-08 15:27:57,965][102898] Updated weights for policy 1, policy_version 92750 (0.0007) +[2023-10-08 15:27:58,110][102897] Updated weights for policy 0, policy_version 92620 (0.0008) +[2023-10-08 15:27:58,335][102898] Updated weights for policy 1, policy_version 92760 (0.0009) +[2023-10-08 15:27:58,487][102897] Updated weights for policy 0, policy_version 92630 (0.0008) +[2023-10-08 15:27:58,854][102897] Updated weights for policy 0, policy_version 92640 (0.0007) +[2023-10-08 15:28:01,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 189857792. Throughput: 0: 1778.4, 1: 1784.2. Samples: 47479674. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:28:01,876][101941] Avg episode reward: [(0, '9.070'), (1, '21.270')] +[2023-10-08 15:28:02,213][102898] Updated weights for policy 1, policy_version 92770 (0.0008) +[2023-10-08 15:28:02,588][102898] Updated weights for policy 1, policy_version 92780 (0.0008) +[2023-10-08 15:28:02,687][102897] Updated weights for policy 0, policy_version 92650 (0.0008) +[2023-10-08 15:28:02,968][102898] Updated weights for policy 1, policy_version 92790 (0.0007) +[2023-10-08 15:28:03,053][102897] Updated weights for policy 0, policy_version 92660 (0.0008) +[2023-10-08 15:28:03,325][102898] Updated weights for policy 1, policy_version 92800 (0.0009) +[2023-10-08 15:28:03,420][102897] Updated weights for policy 0, policy_version 92670 (0.0007) +[2023-10-08 15:28:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14106.9). Total num frames: 189923328. Throughput: 0: 1776.4, 1: 1782.4. Samples: 47489298. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:28:06,876][101941] Avg episode reward: [(0, '8.700'), (1, '19.130')] +[2023-10-08 15:28:07,078][102897] Updated weights for policy 0, policy_version 92680 (0.0008) +[2023-10-08 15:28:07,171][102898] Updated weights for policy 1, policy_version 92810 (0.0007) +[2023-10-08 15:28:07,451][102897] Updated weights for policy 0, policy_version 92690 (0.0009) +[2023-10-08 15:28:07,538][102898] Updated weights for policy 1, policy_version 92820 (0.0007) +[2023-10-08 15:28:07,818][102897] Updated weights for policy 0, policy_version 92700 (0.0008) +[2023-10-08 15:28:07,898][102898] Updated weights for policy 1, policy_version 92830 (0.0009) +[2023-10-08 15:28:11,556][102897] Updated weights for policy 0, policy_version 92710 (0.0008) +[2023-10-08 15:28:11,659][102898] Updated weights for policy 1, policy_version 92840 (0.0008) +[2023-10-08 15:28:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 189988864. Throughput: 0: 1782.6, 1: 1781.0. Samples: 47511656. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:28:11,875][101941] Avg episode reward: [(0, '9.400'), (1, '18.520')] +[2023-10-08 15:28:11,932][102897] Updated weights for policy 0, policy_version 92720 (0.0008) +[2023-10-08 15:28:12,018][102898] Updated weights for policy 1, policy_version 92850 (0.0008) +[2023-10-08 15:28:12,301][102897] Updated weights for policy 0, policy_version 92730 (0.0008) +[2023-10-08 15:28:12,387][102898] Updated weights for policy 1, policy_version 92860 (0.0007) +[2023-10-08 15:28:16,123][102897] Updated weights for policy 0, policy_version 92740 (0.0007) +[2023-10-08 15:28:16,238][102898] Updated weights for policy 1, policy_version 92870 (0.0009) +[2023-10-08 15:28:16,497][102897] Updated weights for policy 0, policy_version 92750 (0.0009) +[2023-10-08 15:28:16,613][102898] Updated weights for policy 1, policy_version 92880 (0.0009) +[2023-10-08 15:28:16,868][102897] Updated weights for policy 0, policy_version 92760 (0.0008) +[2023-10-08 15:28:16,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 190054400. Throughput: 0: 1799.4, 1: 1796.7. Samples: 47532680. Policy #0 lag: (min: 31.0, avg: 36.1, max: 63.0) +[2023-10-08 15:28:16,875][101941] Avg episode reward: [(0, '9.560'), (1, '19.630')] +[2023-10-08 15:28:16,983][102898] Updated weights for policy 1, policy_version 92890 (0.0008) +[2023-10-08 15:28:17,155][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000092768_94994432.pth... +[2023-10-08 15:28:17,188][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000091104_93290496.pth +[2023-10-08 15:28:17,197][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000092896_95125504.pth... +[2023-10-08 15:28:17,235][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000091232_93421568.pth +[2023-10-08 15:28:20,703][102897] Updated weights for policy 0, policy_version 92770 (0.0008) +[2023-10-08 15:28:20,728][102898] Updated weights for policy 1, policy_version 92900 (0.0007) +[2023-10-08 15:28:21,076][102897] Updated weights for policy 0, policy_version 92780 (0.0007) +[2023-10-08 15:28:21,098][102898] Updated weights for policy 1, policy_version 92910 (0.0007) +[2023-10-08 15:28:21,440][102897] Updated weights for policy 0, policy_version 92790 (0.0007) +[2023-10-08 15:28:21,472][102898] Updated weights for policy 1, policy_version 92920 (0.0008) +[2023-10-08 15:28:21,802][102897] Updated weights for policy 0, policy_version 92800 (0.0008) +[2023-10-08 15:28:21,875][101941] Fps is (10 sec: 19660.3, 60 sec: 15291.7, 300 sec: 14218.0). Total num frames: 190185472. Throughput: 0: 1786.0, 1: 1779.5. Samples: 47543382. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:21,876][101941] Avg episode reward: [(0, '9.650'), (1, '18.690')] +[2023-10-08 15:28:25,214][102898] Updated weights for policy 1, policy_version 92930 (0.0010) +[2023-10-08 15:28:25,588][102898] Updated weights for policy 1, policy_version 92940 (0.0008) +[2023-10-08 15:28:25,642][102897] Updated weights for policy 0, policy_version 92810 (0.0008) +[2023-10-08 15:28:25,955][102898] Updated weights for policy 1, policy_version 92950 (0.0009) +[2023-10-08 15:28:26,001][102897] Updated weights for policy 0, policy_version 92820 (0.0007) +[2023-10-08 15:28:26,322][102898] Updated weights for policy 1, policy_version 92960 (0.0007) +[2023-10-08 15:28:26,368][102897] Updated weights for policy 0, policy_version 92830 (0.0008) +[2023-10-08 15:28:26,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14745.6, 300 sec: 14218.0). Total num frames: 190251008. Throughput: 0: 1802.8, 1: 1796.8. Samples: 47565016. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:26,876][101941] Avg episode reward: [(0, '8.640'), (1, '19.270')] +[2023-10-08 15:28:30,080][102898] Updated weights for policy 1, policy_version 92970 (0.0010) +[2023-10-08 15:28:30,366][102897] Updated weights for policy 0, policy_version 92840 (0.0009) +[2023-10-08 15:28:30,434][102898] Updated weights for policy 1, policy_version 92980 (0.0010) +[2023-10-08 15:28:30,740][102897] Updated weights for policy 0, policy_version 92850 (0.0007) +[2023-10-08 15:28:30,799][102898] Updated weights for policy 1, policy_version 92990 (0.0007) +[2023-10-08 15:28:31,115][102897] Updated weights for policy 0, policy_version 92860 (0.0009) +[2023-10-08 15:28:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 190316544. Throughput: 0: 1777.0, 1: 1774.2. Samples: 47584576. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:31,876][101941] Avg episode reward: [(0, '8.660'), (1, '18.070')] +[2023-10-08 15:28:34,590][102898] Updated weights for policy 1, policy_version 93000 (0.0008) +[2023-10-08 15:28:34,868][102897] Updated weights for policy 0, policy_version 92870 (0.0009) +[2023-10-08 15:28:34,960][102898] Updated weights for policy 1, policy_version 93010 (0.0008) +[2023-10-08 15:28:35,228][102897] Updated weights for policy 0, policy_version 92880 (0.0009) +[2023-10-08 15:28:35,324][102898] Updated weights for policy 1, policy_version 93020 (0.0007) +[2023-10-08 15:28:35,596][102897] Updated weights for policy 0, policy_version 92890 (0.0009) +[2023-10-08 15:28:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 190382080. Throughput: 0: 1794.8, 1: 1795.6. Samples: 47596918. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:36,875][101941] Avg episode reward: [(0, '8.580'), (1, '18.140')] +[2023-10-08 15:28:39,183][102898] Updated weights for policy 1, policy_version 93030 (0.0008) +[2023-10-08 15:28:39,374][102897] Updated weights for policy 0, policy_version 92900 (0.0008) +[2023-10-08 15:28:39,546][102898] Updated weights for policy 1, policy_version 93040 (0.0007) +[2023-10-08 15:28:39,747][102897] Updated weights for policy 0, policy_version 92910 (0.0008) +[2023-10-08 15:28:39,910][102898] Updated weights for policy 1, policy_version 93050 (0.0010) +[2023-10-08 15:28:40,114][102897] Updated weights for policy 0, policy_version 92920 (0.0008) +[2023-10-08 15:28:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 190447616. Throughput: 0: 1775.0, 1: 1774.5. Samples: 47616652. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:41,876][101941] Avg episode reward: [(0, '8.430'), (1, '17.640')] +[2023-10-08 15:28:43,483][102898] Updated weights for policy 1, policy_version 93060 (0.0007) +[2023-10-08 15:28:43,854][102898] Updated weights for policy 1, policy_version 93070 (0.0008) +[2023-10-08 15:28:43,946][102897] Updated weights for policy 0, policy_version 92930 (0.0010) +[2023-10-08 15:28:44,219][102898] Updated weights for policy 1, policy_version 93080 (0.0009) +[2023-10-08 15:28:44,314][102897] Updated weights for policy 0, policy_version 92940 (0.0007) +[2023-10-08 15:28:44,673][102897] Updated weights for policy 0, policy_version 92950 (0.0010) +[2023-10-08 15:28:45,045][102897] Updated weights for policy 0, policy_version 92960 (0.0009) +[2023-10-08 15:28:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 190513152. Throughput: 0: 1764.6, 1: 1781.9. Samples: 47639264. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:46,875][101941] Avg episode reward: [(0, '8.260'), (1, '19.740')] +[2023-10-08 15:28:47,922][102898] Updated weights for policy 1, policy_version 93090 (0.0008) +[2023-10-08 15:28:48,282][102898] Updated weights for policy 1, policy_version 93100 (0.0007) +[2023-10-08 15:28:48,649][102898] Updated weights for policy 1, policy_version 93110 (0.0007) +[2023-10-08 15:28:48,870][102897] Updated weights for policy 0, policy_version 92970 (0.0010) +[2023-10-08 15:28:49,018][102898] Updated weights for policy 1, policy_version 93120 (0.0009) +[2023-10-08 15:28:49,247][102897] Updated weights for policy 0, policy_version 92980 (0.0009) +[2023-10-08 15:28:49,617][102897] Updated weights for policy 0, policy_version 92990 (0.0007) +[2023-10-08 15:28:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 190578688. Throughput: 0: 1773.1, 1: 1786.0. Samples: 47649458. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:51,875][101941] Avg episode reward: [(0, '8.580'), (1, '19.230')] +[2023-10-08 15:28:52,768][102898] Updated weights for policy 1, policy_version 93130 (0.0007) +[2023-10-08 15:28:53,130][102898] Updated weights for policy 1, policy_version 93140 (0.0009) +[2023-10-08 15:28:53,399][102897] Updated weights for policy 0, policy_version 93000 (0.0008) +[2023-10-08 15:28:53,497][102898] Updated weights for policy 1, policy_version 93150 (0.0008) +[2023-10-08 15:28:53,756][102897] Updated weights for policy 0, policy_version 93010 (0.0009) +[2023-10-08 15:28:54,129][102897] Updated weights for policy 0, policy_version 93020 (0.0010) +[2023-10-08 15:28:56,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 190644224. Throughput: 0: 1760.9, 1: 1790.3. Samples: 47671462. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:28:56,876][101941] Avg episode reward: [(0, '8.170'), (1, '19.370')] +[2023-10-08 15:28:57,171][102898] Updated weights for policy 1, policy_version 93160 (0.0008) +[2023-10-08 15:28:57,538][102898] Updated weights for policy 1, policy_version 93170 (0.0009) +[2023-10-08 15:28:57,895][102898] Updated weights for policy 1, policy_version 93180 (0.0009) +[2023-10-08 15:28:58,047][102897] Updated weights for policy 0, policy_version 93030 (0.0008) +[2023-10-08 15:28:58,416][102897] Updated weights for policy 0, policy_version 93040 (0.0007) +[2023-10-08 15:28:58,788][102897] Updated weights for policy 0, policy_version 93050 (0.0008) +[2023-10-08 15:29:01,864][102898] Updated weights for policy 1, policy_version 93190 (0.0008) +[2023-10-08 15:29:01,875][101941] Fps is (10 sec: 13106.7, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 190709760. Throughput: 0: 1770.3, 1: 1810.9. Samples: 47693836. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:29:01,876][101941] Avg episode reward: [(0, '8.290'), (1, '21.230')] +[2023-10-08 15:29:02,243][102898] Updated weights for policy 1, policy_version 93200 (0.0011) +[2023-10-08 15:29:02,598][102897] Updated weights for policy 0, policy_version 93060 (0.0007) +[2023-10-08 15:29:02,610][102898] Updated weights for policy 1, policy_version 93210 (0.0008) +[2023-10-08 15:29:02,965][102897] Updated weights for policy 0, policy_version 93070 (0.0007) +[2023-10-08 15:29:03,331][102897] Updated weights for policy 0, policy_version 93080 (0.0007) +[2023-10-08 15:29:06,203][102898] Updated weights for policy 1, policy_version 93220 (0.0008) +[2023-10-08 15:29:06,571][102898] Updated weights for policy 1, policy_version 93230 (0.0009) +[2023-10-08 15:29:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14106.9). Total num frames: 190775296. Throughput: 0: 1757.7, 1: 1799.4. Samples: 47703450. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:29:06,876][101941] Avg episode reward: [(0, '8.340'), (1, '21.970')] +[2023-10-08 15:29:06,939][102898] Updated weights for policy 1, policy_version 93240 (0.0008) +[2023-10-08 15:29:06,985][102897] Updated weights for policy 0, policy_version 93090 (0.0008) +[2023-10-08 15:29:07,352][102897] Updated weights for policy 0, policy_version 93100 (0.0008) +[2023-10-08 15:29:07,729][102897] Updated weights for policy 0, policy_version 93110 (0.0009) +[2023-10-08 15:29:08,102][102897] Updated weights for policy 0, policy_version 93120 (0.0007) +[2023-10-08 15:29:10,783][102898] Updated weights for policy 1, policy_version 93250 (0.0007) +[2023-10-08 15:29:11,152][102898] Updated weights for policy 1, policy_version 93260 (0.0009) +[2023-10-08 15:29:11,514][102898] Updated weights for policy 1, policy_version 93270 (0.0011) +[2023-10-08 15:29:11,873][102897] Updated weights for policy 0, policy_version 93130 (0.0007) +[2023-10-08 15:29:11,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 13995.8). Total num frames: 190840832. Throughput: 0: 1765.7, 1: 1811.7. Samples: 47725998. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:29:11,875][101941] Avg episode reward: [(0, '8.880'), (1, '21.360')] +[2023-10-08 15:29:11,884][102898] Updated weights for policy 1, policy_version 93280 (0.0009) +[2023-10-08 15:29:12,244][102897] Updated weights for policy 0, policy_version 93140 (0.0009) +[2023-10-08 15:29:12,610][102897] Updated weights for policy 0, policy_version 93150 (0.0007) +[2023-10-08 15:29:15,784][102898] Updated weights for policy 1, policy_version 93290 (0.0009) +[2023-10-08 15:29:16,144][102898] Updated weights for policy 1, policy_version 93300 (0.0008) +[2023-10-08 15:29:16,443][102897] Updated weights for policy 0, policy_version 93160 (0.0008) +[2023-10-08 15:29:16,509][102898] Updated weights for policy 1, policy_version 93310 (0.0008) +[2023-10-08 15:29:16,807][102897] Updated weights for policy 0, policy_version 93170 (0.0009) +[2023-10-08 15:29:16,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14106.9). Total num frames: 190939136. Throughput: 0: 1798.4, 1: 1806.0. Samples: 47746774. Policy #0 lag: (min: 9.0, avg: 18.9, max: 41.0) +[2023-10-08 15:29:16,875][101941] Avg episode reward: [(0, '9.900'), (1, '20.170')] +[2023-10-08 15:29:17,172][102897] Updated weights for policy 0, policy_version 93180 (0.0011) +[2023-10-08 15:29:20,048][102898] Updated weights for policy 1, policy_version 93320 (0.0010) +[2023-10-08 15:29:20,409][102898] Updated weights for policy 1, policy_version 93330 (0.0010) +[2023-10-08 15:29:20,769][102898] Updated weights for policy 1, policy_version 93340 (0.0009) +[2023-10-08 15:29:20,843][102897] Updated weights for policy 0, policy_version 93190 (0.0009) +[2023-10-08 15:29:21,217][102897] Updated weights for policy 0, policy_version 93200 (0.0007) +[2023-10-08 15:29:21,582][102897] Updated weights for policy 0, policy_version 93210 (0.0008) +[2023-10-08 15:29:21,875][101941] Fps is (10 sec: 19660.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191037440. Throughput: 0: 1770.3, 1: 1811.4. Samples: 47758094. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:21,876][101941] Avg episode reward: [(0, '9.380'), (1, '19.730')] +[2023-10-08 15:29:24,494][102898] Updated weights for policy 1, policy_version 93350 (0.0008) +[2023-10-08 15:29:24,858][102898] Updated weights for policy 1, policy_version 93360 (0.0008) +[2023-10-08 15:29:25,233][102898] Updated weights for policy 1, policy_version 93370 (0.0008) +[2023-10-08 15:29:25,301][102897] Updated weights for policy 0, policy_version 93220 (0.0008) +[2023-10-08 15:29:25,669][102897] Updated weights for policy 0, policy_version 93230 (0.0009) +[2023-10-08 15:29:26,027][102897] Updated weights for policy 0, policy_version 93240 (0.0007) +[2023-10-08 15:29:26,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191102976. Throughput: 0: 1798.4, 1: 1809.6. Samples: 47779008. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:26,876][101941] Avg episode reward: [(0, '8.740'), (1, '19.020')] +[2023-10-08 15:29:28,919][102898] Updated weights for policy 1, policy_version 93380 (0.0009) +[2023-10-08 15:29:29,301][102898] Updated weights for policy 1, policy_version 93390 (0.0009) +[2023-10-08 15:29:29,665][102898] Updated weights for policy 1, policy_version 93400 (0.0008) +[2023-10-08 15:29:29,675][102897] Updated weights for policy 0, policy_version 93250 (0.0007) +[2023-10-08 15:29:30,045][102897] Updated weights for policy 0, policy_version 93260 (0.0007) +[2023-10-08 15:29:30,412][102897] Updated weights for policy 0, policy_version 93270 (0.0008) +[2023-10-08 15:29:30,786][102897] Updated weights for policy 0, policy_version 93280 (0.0008) +[2023-10-08 15:29:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191168512. Throughput: 0: 1779.1, 1: 1804.0. Samples: 47800502. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:31,876][101941] Avg episode reward: [(0, '9.080'), (1, '18.820')] +[2023-10-08 15:29:33,346][102898] Updated weights for policy 1, policy_version 93410 (0.0008) +[2023-10-08 15:29:33,718][102898] Updated weights for policy 1, policy_version 93420 (0.0008) +[2023-10-08 15:29:34,076][102898] Updated weights for policy 1, policy_version 93430 (0.0008) +[2023-10-08 15:29:34,443][102898] Updated weights for policy 1, policy_version 93440 (0.0008) +[2023-10-08 15:29:34,493][102897] Updated weights for policy 0, policy_version 93290 (0.0009) +[2023-10-08 15:29:34,857][102897] Updated weights for policy 0, policy_version 93300 (0.0008) +[2023-10-08 15:29:35,226][102897] Updated weights for policy 0, policy_version 93310 (0.0008) +[2023-10-08 15:29:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191234048. Throughput: 0: 1797.8, 1: 1808.6. Samples: 47811744. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:36,875][101941] Avg episode reward: [(0, '9.030'), (1, '20.430')] +[2023-10-08 15:29:38,180][102898] Updated weights for policy 1, policy_version 93450 (0.0008) +[2023-10-08 15:29:38,550][102898] Updated weights for policy 1, policy_version 93460 (0.0007) +[2023-10-08 15:29:38,907][102898] Updated weights for policy 1, policy_version 93470 (0.0008) +[2023-10-08 15:29:39,014][102897] Updated weights for policy 0, policy_version 93320 (0.0009) +[2023-10-08 15:29:39,377][102897] Updated weights for policy 0, policy_version 93330 (0.0008) +[2023-10-08 15:29:39,739][102897] Updated weights for policy 0, policy_version 93340 (0.0007) +[2023-10-08 15:29:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191299584. Throughput: 0: 1785.2, 1: 1800.5. Samples: 47832818. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:41,876][101941] Avg episode reward: [(0, '8.680'), (1, '20.630')] +[2023-10-08 15:29:42,712][102898] Updated weights for policy 1, policy_version 93480 (0.0008) +[2023-10-08 15:29:43,076][102898] Updated weights for policy 1, policy_version 93490 (0.0007) +[2023-10-08 15:29:43,446][102898] Updated weights for policy 1, policy_version 93500 (0.0008) +[2023-10-08 15:29:43,642][102897] Updated weights for policy 0, policy_version 93350 (0.0008) +[2023-10-08 15:29:44,016][102897] Updated weights for policy 0, policy_version 93360 (0.0007) +[2023-10-08 15:29:44,382][102897] Updated weights for policy 0, policy_version 93370 (0.0007) +[2023-10-08 15:29:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 191365120. Throughput: 0: 1789.2, 1: 1792.4. Samples: 47855008. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:46,876][101941] Avg episode reward: [(0, '9.240'), (1, '21.310')] +[2023-10-08 15:29:47,330][102898] Updated weights for policy 1, policy_version 93510 (0.0008) +[2023-10-08 15:29:47,709][102898] Updated weights for policy 1, policy_version 93520 (0.0009) +[2023-10-08 15:29:48,073][102898] Updated weights for policy 1, policy_version 93530 (0.0010) +[2023-10-08 15:29:48,179][102897] Updated weights for policy 0, policy_version 93380 (0.0009) +[2023-10-08 15:29:48,547][102897] Updated weights for policy 0, policy_version 93390 (0.0007) +[2023-10-08 15:29:48,907][102897] Updated weights for policy 0, policy_version 93400 (0.0008) +[2023-10-08 15:29:51,751][102898] Updated weights for policy 1, policy_version 93540 (0.0009) +[2023-10-08 15:29:51,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 191430656. Throughput: 0: 1792.0, 1: 1792.1. Samples: 47864736. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:51,876][101941] Avg episode reward: [(0, '9.520'), (1, '20.280')] +[2023-10-08 15:29:52,115][102898] Updated weights for policy 1, policy_version 93550 (0.0008) +[2023-10-08 15:29:52,478][102898] Updated weights for policy 1, policy_version 93560 (0.0009) +[2023-10-08 15:29:52,726][102897] Updated weights for policy 0, policy_version 93410 (0.0008) +[2023-10-08 15:29:53,102][102897] Updated weights for policy 0, policy_version 93420 (0.0008) +[2023-10-08 15:29:53,469][102897] Updated weights for policy 0, policy_version 93430 (0.0007) +[2023-10-08 15:29:53,833][102897] Updated weights for policy 0, policy_version 93440 (0.0008) +[2023-10-08 15:29:56,253][102898] Updated weights for policy 1, policy_version 93570 (0.0009) +[2023-10-08 15:29:56,616][102898] Updated weights for policy 1, policy_version 93580 (0.0009) +[2023-10-08 15:29:56,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191496192. Throughput: 0: 1787.8, 1: 1796.8. Samples: 47887302. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:29:56,875][101941] Avg episode reward: [(0, '9.630'), (1, '18.560')] +[2023-10-08 15:29:56,985][102898] Updated weights for policy 1, policy_version 93590 (0.0009) +[2023-10-08 15:29:57,347][102898] Updated weights for policy 1, policy_version 93600 (0.0007) +[2023-10-08 15:29:57,661][102897] Updated weights for policy 0, policy_version 93450 (0.0007) +[2023-10-08 15:29:58,038][102897] Updated weights for policy 0, policy_version 93460 (0.0007) +[2023-10-08 15:29:58,410][102897] Updated weights for policy 0, policy_version 93470 (0.0008) +[2023-10-08 15:30:01,141][102898] Updated weights for policy 1, policy_version 93610 (0.0008) +[2023-10-08 15:30:01,512][102898] Updated weights for policy 1, policy_version 93620 (0.0008) +[2023-10-08 15:30:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 191561728. Throughput: 0: 1792.0, 1: 1806.6. Samples: 47908712. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:30:01,876][101941] Avg episode reward: [(0, '8.850'), (1, '20.400')] +[2023-10-08 15:30:01,877][102898] Updated weights for policy 1, policy_version 93630 (0.0009) +[2023-10-08 15:30:02,242][102897] Updated weights for policy 0, policy_version 93480 (0.0009) +[2023-10-08 15:30:02,614][102897] Updated weights for policy 0, policy_version 93490 (0.0010) +[2023-10-08 15:30:02,982][102897] Updated weights for policy 0, policy_version 93500 (0.0008) +[2023-10-08 15:30:05,588][102898] Updated weights for policy 1, policy_version 93640 (0.0008) +[2023-10-08 15:30:05,967][102898] Updated weights for policy 1, policy_version 93650 (0.0011) +[2023-10-08 15:30:06,333][102898] Updated weights for policy 1, policy_version 93660 (0.0010) +[2023-10-08 15:30:06,644][102897] Updated weights for policy 0, policy_version 93510 (0.0007) +[2023-10-08 15:30:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 191660032. Throughput: 0: 1787.2, 1: 1794.5. Samples: 47919268. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:30:06,875][101941] Avg episode reward: [(0, '8.300'), (1, '18.020')] +[2023-10-08 15:30:07,008][102897] Updated weights for policy 0, policy_version 93520 (0.0008) +[2023-10-08 15:30:07,373][102897] Updated weights for policy 0, policy_version 93530 (0.0008) +[2023-10-08 15:30:09,990][102898] Updated weights for policy 1, policy_version 93670 (0.0009) +[2023-10-08 15:30:10,346][102898] Updated weights for policy 1, policy_version 93680 (0.0010) +[2023-10-08 15:30:10,709][102898] Updated weights for policy 1, policy_version 93690 (0.0008) +[2023-10-08 15:30:11,180][102897] Updated weights for policy 0, policy_version 93540 (0.0008) +[2023-10-08 15:30:11,542][102897] Updated weights for policy 0, policy_version 93550 (0.0008) +[2023-10-08 15:30:11,875][101941] Fps is (10 sec: 16384.2, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 191725568. Throughput: 0: 1792.5, 1: 1809.7. Samples: 47941108. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:30:11,876][101941] Avg episode reward: [(0, '9.090'), (1, '18.920')] +[2023-10-08 15:30:11,911][102897] Updated weights for policy 0, policy_version 93560 (0.0010) +[2023-10-08 15:30:14,348][102898] Updated weights for policy 1, policy_version 93700 (0.0007) +[2023-10-08 15:30:14,713][102898] Updated weights for policy 1, policy_version 93710 (0.0009) +[2023-10-08 15:30:15,082][102898] Updated weights for policy 1, policy_version 93720 (0.0007) +[2023-10-08 15:30:15,622][102897] Updated weights for policy 0, policy_version 93570 (0.0009) +[2023-10-08 15:30:15,990][102897] Updated weights for policy 0, policy_version 93580 (0.0010) +[2023-10-08 15:30:16,358][102897] Updated weights for policy 0, policy_version 93590 (0.0007) +[2023-10-08 15:30:16,727][102897] Updated weights for policy 0, policy_version 93600 (0.0008) +[2023-10-08 15:30:16,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 191823872. Throughput: 0: 1794.4, 1: 1799.9. Samples: 47962248. Policy #0 lag: (min: 26.0, avg: 38.9, max: 58.0) +[2023-10-08 15:30:16,876][101941] Avg episode reward: [(0, '8.550'), (1, '21.070')] +[2023-10-08 15:30:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000093600_95846400.pth... +[2023-10-08 15:30:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000093728_95977472.pth... +[2023-10-08 15:30:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000091936_94142464.pth +[2023-10-08 15:30:16,923][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000092032_94240768.pth +[2023-10-08 15:30:18,730][102898] Updated weights for policy 1, policy_version 93730 (0.0008) +[2023-10-08 15:30:19,093][102898] Updated weights for policy 1, policy_version 93740 (0.0010) +[2023-10-08 15:30:19,469][102898] Updated weights for policy 1, policy_version 93750 (0.0011) +[2023-10-08 15:30:19,832][102898] Updated weights for policy 1, policy_version 93760 (0.0008) +[2023-10-08 15:30:20,494][102897] Updated weights for policy 0, policy_version 93610 (0.0008) +[2023-10-08 15:30:20,853][102897] Updated weights for policy 0, policy_version 93620 (0.0009) +[2023-10-08 15:30:21,222][102897] Updated weights for policy 0, policy_version 93630 (0.0011) +[2023-10-08 15:30:21,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 191889408. Throughput: 0: 1788.7, 1: 1807.3. Samples: 47973564. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:21,876][101941] Avg episode reward: [(0, '8.670'), (1, '20.000')] +[2023-10-08 15:30:23,562][102898] Updated weights for policy 1, policy_version 93770 (0.0007) +[2023-10-08 15:30:23,924][102898] Updated weights for policy 1, policy_version 93780 (0.0008) +[2023-10-08 15:30:24,293][102898] Updated weights for policy 1, policy_version 93790 (0.0010) +[2023-10-08 15:30:25,060][102897] Updated weights for policy 0, policy_version 93640 (0.0007) +[2023-10-08 15:30:25,427][102897] Updated weights for policy 0, policy_version 93650 (0.0009) +[2023-10-08 15:30:25,797][102897] Updated weights for policy 0, policy_version 93660 (0.0010) +[2023-10-08 15:30:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 191954944. Throughput: 0: 1791.6, 1: 1800.3. Samples: 47994452. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:26,875][101941] Avg episode reward: [(0, '8.960'), (1, '22.000')] +[2023-10-08 15:30:28,047][102898] Updated weights for policy 1, policy_version 93800 (0.0009) +[2023-10-08 15:30:28,411][102898] Updated weights for policy 1, policy_version 93810 (0.0008) +[2023-10-08 15:30:28,776][102898] Updated weights for policy 1, policy_version 93820 (0.0009) +[2023-10-08 15:30:29,653][102897] Updated weights for policy 0, policy_version 93670 (0.0010) +[2023-10-08 15:30:30,033][102897] Updated weights for policy 0, policy_version 93680 (0.0010) +[2023-10-08 15:30:30,396][102897] Updated weights for policy 0, policy_version 93690 (0.0011) +[2023-10-08 15:30:31,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 192020480. Throughput: 0: 1771.0, 1: 1803.4. Samples: 48015858. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:31,876][101941] Avg episode reward: [(0, '8.970'), (1, '23.810')] +[2023-10-08 15:30:32,702][102898] Updated weights for policy 1, policy_version 93830 (0.0008) +[2023-10-08 15:30:33,069][102898] Updated weights for policy 1, policy_version 93840 (0.0008) +[2023-10-08 15:30:33,444][102898] Updated weights for policy 1, policy_version 93850 (0.0010) +[2023-10-08 15:30:34,235][102897] Updated weights for policy 0, policy_version 93700 (0.0008) +[2023-10-08 15:30:34,593][102897] Updated weights for policy 0, policy_version 93710 (0.0008) +[2023-10-08 15:30:34,967][102897] Updated weights for policy 0, policy_version 93720 (0.0009) +[2023-10-08 15:30:36,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 192086016. Throughput: 0: 1796.8, 1: 1802.8. Samples: 48026716. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:36,876][101941] Avg episode reward: [(0, '8.630'), (1, '23.580')] +[2023-10-08 15:30:37,010][102898] Updated weights for policy 1, policy_version 93860 (0.0007) +[2023-10-08 15:30:37,381][102898] Updated weights for policy 1, policy_version 93870 (0.0011) +[2023-10-08 15:30:37,748][102898] Updated weights for policy 1, policy_version 93880 (0.0007) +[2023-10-08 15:30:38,810][102897] Updated weights for policy 0, policy_version 93730 (0.0008) +[2023-10-08 15:30:39,170][102897] Updated weights for policy 0, policy_version 93740 (0.0007) +[2023-10-08 15:30:39,538][102897] Updated weights for policy 0, policy_version 93750 (0.0008) +[2023-10-08 15:30:39,910][102897] Updated weights for policy 0, policy_version 93760 (0.0007) +[2023-10-08 15:30:41,557][102898] Updated weights for policy 1, policy_version 93890 (0.0009) +[2023-10-08 15:30:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 192151552. Throughput: 0: 1772.0, 1: 1798.7. Samples: 48047986. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:41,876][101941] Avg episode reward: [(0, '8.490'), (1, '24.210')] +[2023-10-08 15:30:41,917][102898] Updated weights for policy 1, policy_version 93900 (0.0008) +[2023-10-08 15:30:42,280][102898] Updated weights for policy 1, policy_version 93910 (0.0009) +[2023-10-08 15:30:42,651][102898] Updated weights for policy 1, policy_version 93920 (0.0008) +[2023-10-08 15:30:43,595][102897] Updated weights for policy 0, policy_version 93770 (0.0007) +[2023-10-08 15:30:43,959][102897] Updated weights for policy 0, policy_version 93780 (0.0007) +[2023-10-08 15:30:44,328][102897] Updated weights for policy 0, policy_version 93790 (0.0007) +[2023-10-08 15:30:46,311][102898] Updated weights for policy 1, policy_version 93930 (0.0009) +[2023-10-08 15:30:46,668][102898] Updated weights for policy 1, policy_version 93940 (0.0007) +[2023-10-08 15:30:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 192217088. Throughput: 0: 1770.0, 1: 1810.5. Samples: 48069838. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:46,876][101941] Avg episode reward: [(0, '9.230'), (1, '26.800')] +[2023-10-08 15:30:47,032][102898] Updated weights for policy 1, policy_version 93950 (0.0007) +[2023-10-08 15:30:47,103][102760] Saving new best policy, reward=26.800! +[2023-10-08 15:30:48,280][102897] Updated weights for policy 0, policy_version 93800 (0.0008) +[2023-10-08 15:30:48,667][102897] Updated weights for policy 0, policy_version 93810 (0.0008) +[2023-10-08 15:30:49,048][102897] Updated weights for policy 0, policy_version 93820 (0.0007) +[2023-10-08 15:30:50,680][102898] Updated weights for policy 1, policy_version 93960 (0.0007) +[2023-10-08 15:30:51,033][102898] Updated weights for policy 1, policy_version 93970 (0.0008) +[2023-10-08 15:30:51,402][102898] Updated weights for policy 1, policy_version 93980 (0.0008) +[2023-10-08 15:30:51,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 192315392. Throughput: 0: 1767.2, 1: 1806.7. Samples: 48080098. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:51,876][101941] Avg episode reward: [(0, '9.380'), (1, '27.710')] +[2023-10-08 15:30:51,878][102760] Saving new best policy, reward=27.710! +[2023-10-08 15:30:52,735][102897] Updated weights for policy 0, policy_version 93830 (0.0009) +[2023-10-08 15:30:53,108][102897] Updated weights for policy 0, policy_version 93840 (0.0010) +[2023-10-08 15:30:53,480][102897] Updated weights for policy 0, policy_version 93850 (0.0010) +[2023-10-08 15:30:55,226][102898] Updated weights for policy 1, policy_version 93990 (0.0008) +[2023-10-08 15:30:55,591][102898] Updated weights for policy 1, policy_version 94000 (0.0009) +[2023-10-08 15:30:55,952][102898] Updated weights for policy 1, policy_version 94010 (0.0008) +[2023-10-08 15:30:56,875][101941] Fps is (10 sec: 16384.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 192380928. Throughput: 0: 1763.8, 1: 1808.5. Samples: 48101860. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:30:56,875][101941] Avg episode reward: [(0, '8.850'), (1, '24.880')] +[2023-10-08 15:30:57,304][102897] Updated weights for policy 0, policy_version 93860 (0.0009) +[2023-10-08 15:30:57,681][102897] Updated weights for policy 0, policy_version 93870 (0.0008) +[2023-10-08 15:30:58,052][102897] Updated weights for policy 0, policy_version 93880 (0.0008) +[2023-10-08 15:30:59,763][102898] Updated weights for policy 1, policy_version 94020 (0.0008) +[2023-10-08 15:31:00,126][102898] Updated weights for policy 1, policy_version 94030 (0.0007) +[2023-10-08 15:31:00,491][102898] Updated weights for policy 1, policy_version 94040 (0.0007) +[2023-10-08 15:31:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 192446464. Throughput: 0: 1786.1, 1: 1795.4. Samples: 48123418. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:31:01,876][101941] Avg episode reward: [(0, '8.680'), (1, '25.910')] +[2023-10-08 15:31:01,956][102897] Updated weights for policy 0, policy_version 93890 (0.0007) +[2023-10-08 15:31:02,328][102897] Updated weights for policy 0, policy_version 93900 (0.0008) +[2023-10-08 15:31:02,698][102897] Updated weights for policy 0, policy_version 93910 (0.0007) +[2023-10-08 15:31:03,068][102897] Updated weights for policy 0, policy_version 93920 (0.0008) +[2023-10-08 15:31:04,142][102898] Updated weights for policy 1, policy_version 94050 (0.0007) +[2023-10-08 15:31:04,510][102898] Updated weights for policy 1, policy_version 94060 (0.0011) +[2023-10-08 15:31:04,882][102898] Updated weights for policy 1, policy_version 94070 (0.0010) +[2023-10-08 15:31:05,249][102898] Updated weights for policy 1, policy_version 94080 (0.0009) +[2023-10-08 15:31:06,737][102897] Updated weights for policy 0, policy_version 93930 (0.0009) +[2023-10-08 15:31:06,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 192512000. Throughput: 0: 1763.3, 1: 1805.6. Samples: 48134164. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:31:06,875][101941] Avg episode reward: [(0, '8.510'), (1, '25.670')] +[2023-10-08 15:31:07,115][102897] Updated weights for policy 0, policy_version 93940 (0.0008) +[2023-10-08 15:31:07,501][102897] Updated weights for policy 0, policy_version 93950 (0.0008) +[2023-10-08 15:31:09,135][102898] Updated weights for policy 1, policy_version 94090 (0.0009) +[2023-10-08 15:31:09,501][102898] Updated weights for policy 1, policy_version 94100 (0.0008) +[2023-10-08 15:31:09,877][102898] Updated weights for policy 1, policy_version 94110 (0.0007) +[2023-10-08 15:31:11,273][102897] Updated weights for policy 0, policy_version 93960 (0.0008) +[2023-10-08 15:31:11,642][102897] Updated weights for policy 0, policy_version 93970 (0.0009) +[2023-10-08 15:31:11,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 192577536. Throughput: 0: 1787.6, 1: 1797.0. Samples: 48155760. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:31:11,875][101941] Avg episode reward: [(0, '9.120'), (1, '23.910')] +[2023-10-08 15:31:12,016][102897] Updated weights for policy 0, policy_version 93980 (0.0007) +[2023-10-08 15:31:13,586][102898] Updated weights for policy 1, policy_version 94120 (0.0008) +[2023-10-08 15:31:13,950][102898] Updated weights for policy 1, policy_version 94130 (0.0008) +[2023-10-08 15:31:14,315][102898] Updated weights for policy 1, policy_version 94140 (0.0008) +[2023-10-08 15:31:15,896][102897] Updated weights for policy 0, policy_version 93990 (0.0011) +[2023-10-08 15:31:16,257][102897] Updated weights for policy 0, policy_version 94000 (0.0010) +[2023-10-08 15:31:16,637][102897] Updated weights for policy 0, policy_version 94010 (0.0009) +[2023-10-08 15:31:16,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 192675840. Throughput: 0: 1783.6, 1: 1802.1. Samples: 48177216. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:31:16,875][101941] Avg episode reward: [(0, '8.950'), (1, '24.700')] +[2023-10-08 15:31:17,996][102898] Updated weights for policy 1, policy_version 94150 (0.0007) +[2023-10-08 15:31:18,367][102898] Updated weights for policy 1, policy_version 94160 (0.0008) +[2023-10-08 15:31:18,725][102898] Updated weights for policy 1, policy_version 94170 (0.0008) +[2023-10-08 15:31:20,456][102897] Updated weights for policy 0, policy_version 94020 (0.0009) +[2023-10-08 15:31:20,819][102897] Updated weights for policy 0, policy_version 94030 (0.0011) +[2023-10-08 15:31:21,195][102897] Updated weights for policy 0, policy_version 94040 (0.0007) +[2023-10-08 15:31:21,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 192741376. Throughput: 0: 1775.3, 1: 1800.8. Samples: 48187640. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:21,876][101941] Avg episode reward: [(0, '9.300'), (1, '24.850')] +[2023-10-08 15:31:22,575][102898] Updated weights for policy 1, policy_version 94180 (0.0007) +[2023-10-08 15:31:22,947][102898] Updated weights for policy 1, policy_version 94190 (0.0009) +[2023-10-08 15:31:23,311][102898] Updated weights for policy 1, policy_version 94200 (0.0007) +[2023-10-08 15:31:24,925][102897] Updated weights for policy 0, policy_version 94050 (0.0008) +[2023-10-08 15:31:25,298][102897] Updated weights for policy 0, policy_version 94060 (0.0009) +[2023-10-08 15:31:25,664][102897] Updated weights for policy 0, policy_version 94070 (0.0010) +[2023-10-08 15:31:26,031][102897] Updated weights for policy 0, policy_version 94080 (0.0011) +[2023-10-08 15:31:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 192806912. Throughput: 0: 1787.5, 1: 1793.5. Samples: 48209130. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:26,875][101941] Avg episode reward: [(0, '9.560'), (1, '25.260')] +[2023-10-08 15:31:27,258][102898] Updated weights for policy 1, policy_version 94210 (0.0007) +[2023-10-08 15:31:27,618][102898] Updated weights for policy 1, policy_version 94220 (0.0008) +[2023-10-08 15:31:27,985][102898] Updated weights for policy 1, policy_version 94230 (0.0008) +[2023-10-08 15:31:28,352][102898] Updated weights for policy 1, policy_version 94240 (0.0009) +[2023-10-08 15:31:29,775][102897] Updated weights for policy 0, policy_version 94090 (0.0010) +[2023-10-08 15:31:30,142][102897] Updated weights for policy 0, policy_version 94100 (0.0008) +[2023-10-08 15:31:30,516][102897] Updated weights for policy 0, policy_version 94110 (0.0008) +[2023-10-08 15:31:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 192872448. Throughput: 0: 1770.9, 1: 1803.7. Samples: 48230698. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:31,875][101941] Avg episode reward: [(0, '8.750'), (1, '22.230')] +[2023-10-08 15:31:31,956][102898] Updated weights for policy 1, policy_version 94250 (0.0007) +[2023-10-08 15:31:32,331][102898] Updated weights for policy 1, policy_version 94260 (0.0007) +[2023-10-08 15:31:32,691][102898] Updated weights for policy 1, policy_version 94270 (0.0007) +[2023-10-08 15:31:34,391][102897] Updated weights for policy 0, policy_version 94120 (0.0008) +[2023-10-08 15:31:34,769][102897] Updated weights for policy 0, policy_version 94130 (0.0008) +[2023-10-08 15:31:35,123][102897] Updated weights for policy 0, policy_version 94140 (0.0007) +[2023-10-08 15:31:36,389][102898] Updated weights for policy 1, policy_version 94280 (0.0007) +[2023-10-08 15:31:36,747][102898] Updated weights for policy 1, policy_version 94290 (0.0009) +[2023-10-08 15:31:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 192937984. Throughput: 0: 1797.0, 1: 1791.6. Samples: 48241584. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:36,876][101941] Avg episode reward: [(0, '9.060'), (1, '22.480')] +[2023-10-08 15:31:37,123][102898] Updated weights for policy 1, policy_version 94300 (0.0009) +[2023-10-08 15:31:38,821][102897] Updated weights for policy 0, policy_version 94150 (0.0008) +[2023-10-08 15:31:39,190][102897] Updated weights for policy 0, policy_version 94160 (0.0009) +[2023-10-08 15:31:39,568][102897] Updated weights for policy 0, policy_version 94170 (0.0009) +[2023-10-08 15:31:40,775][102898] Updated weights for policy 1, policy_version 94310 (0.0008) +[2023-10-08 15:31:41,141][102898] Updated weights for policy 1, policy_version 94320 (0.0008) +[2023-10-08 15:31:41,517][102898] Updated weights for policy 1, policy_version 94330 (0.0008) +[2023-10-08 15:31:41,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 193036288. Throughput: 0: 1772.5, 1: 1809.0. Samples: 48263030. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:41,876][101941] Avg episode reward: [(0, '9.150'), (1, '21.980')] +[2023-10-08 15:31:43,395][102897] Updated weights for policy 0, policy_version 94180 (0.0007) +[2023-10-08 15:31:43,768][102897] Updated weights for policy 0, policy_version 94190 (0.0008) +[2023-10-08 15:31:44,134][102897] Updated weights for policy 0, policy_version 94200 (0.0007) +[2023-10-08 15:31:45,200][102898] Updated weights for policy 1, policy_version 94340 (0.0008) +[2023-10-08 15:31:45,562][102898] Updated weights for policy 1, policy_version 94350 (0.0008) +[2023-10-08 15:31:45,934][102898] Updated weights for policy 1, policy_version 94360 (0.0007) +[2023-10-08 15:31:46,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 193101824. Throughput: 0: 1770.5, 1: 1798.6. Samples: 48284030. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:46,876][101941] Avg episode reward: [(0, '9.620'), (1, '24.680')] +[2023-10-08 15:31:47,904][102897] Updated weights for policy 0, policy_version 94210 (0.0008) +[2023-10-08 15:31:48,281][102897] Updated weights for policy 0, policy_version 94220 (0.0007) +[2023-10-08 15:31:48,650][102897] Updated weights for policy 0, policy_version 94230 (0.0008) +[2023-10-08 15:31:49,020][102897] Updated weights for policy 0, policy_version 94240 (0.0007) +[2023-10-08 15:31:49,734][102898] Updated weights for policy 1, policy_version 94370 (0.0007) +[2023-10-08 15:31:50,096][102898] Updated weights for policy 1, policy_version 94380 (0.0008) +[2023-10-08 15:31:50,459][102898] Updated weights for policy 1, policy_version 94390 (0.0009) +[2023-10-08 15:31:50,822][102898] Updated weights for policy 1, policy_version 94400 (0.0007) +[2023-10-08 15:31:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 193167360. Throughput: 0: 1772.2, 1: 1808.8. Samples: 48295312. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:51,876][101941] Avg episode reward: [(0, '9.100'), (1, '28.060')] +[2023-10-08 15:31:51,878][102760] Saving new best policy, reward=28.060! +[2023-10-08 15:31:52,809][102897] Updated weights for policy 0, policy_version 94250 (0.0008) +[2023-10-08 15:31:53,182][102897] Updated weights for policy 0, policy_version 94260 (0.0007) +[2023-10-08 15:31:53,555][102897] Updated weights for policy 0, policy_version 94270 (0.0008) +[2023-10-08 15:31:54,579][102898] Updated weights for policy 1, policy_version 94410 (0.0008) +[2023-10-08 15:31:54,941][102898] Updated weights for policy 1, policy_version 94420 (0.0008) +[2023-10-08 15:31:55,307][102898] Updated weights for policy 1, policy_version 94430 (0.0010) +[2023-10-08 15:31:56,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 193232896. Throughput: 0: 1773.2, 1: 1799.5. Samples: 48316532. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:31:56,875][101941] Avg episode reward: [(0, '9.320'), (1, '26.650')] +[2023-10-08 15:31:57,239][102897] Updated weights for policy 0, policy_version 94280 (0.0009) +[2023-10-08 15:31:57,611][102897] Updated weights for policy 0, policy_version 94290 (0.0009) +[2023-10-08 15:31:57,995][102897] Updated weights for policy 0, policy_version 94300 (0.0009) +[2023-10-08 15:31:59,000][102898] Updated weights for policy 1, policy_version 94440 (0.0009) +[2023-10-08 15:31:59,365][102898] Updated weights for policy 1, policy_version 94450 (0.0008) +[2023-10-08 15:31:59,725][102898] Updated weights for policy 1, policy_version 94460 (0.0008) +[2023-10-08 15:32:01,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 193298432. Throughput: 0: 1792.8, 1: 1798.7. Samples: 48338832. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:32:01,876][101941] Avg episode reward: [(0, '9.700'), (1, '25.950')] +[2023-10-08 15:32:01,935][102897] Updated weights for policy 0, policy_version 94310 (0.0008) +[2023-10-08 15:32:02,307][102897] Updated weights for policy 0, policy_version 94320 (0.0009) +[2023-10-08 15:32:02,680][102897] Updated weights for policy 0, policy_version 94330 (0.0008) +[2023-10-08 15:32:03,457][102898] Updated weights for policy 1, policy_version 94470 (0.0008) +[2023-10-08 15:32:03,822][102898] Updated weights for policy 1, policy_version 94480 (0.0008) +[2023-10-08 15:32:04,191][102898] Updated weights for policy 1, policy_version 94490 (0.0009) +[2023-10-08 15:32:06,247][102897] Updated weights for policy 0, policy_version 94340 (0.0009) +[2023-10-08 15:32:06,623][102897] Updated weights for policy 0, policy_version 94350 (0.0010) +[2023-10-08 15:32:06,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 193363968. Throughput: 0: 1775.8, 1: 1803.8. Samples: 48348722. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:32:06,876][101941] Avg episode reward: [(0, '9.650'), (1, '24.670')] +[2023-10-08 15:32:06,991][102897] Updated weights for policy 0, policy_version 94360 (0.0008) +[2023-10-08 15:32:07,866][102898] Updated weights for policy 1, policy_version 94500 (0.0008) +[2023-10-08 15:32:08,226][102898] Updated weights for policy 1, policy_version 94510 (0.0008) +[2023-10-08 15:32:08,594][102898] Updated weights for policy 1, policy_version 94520 (0.0008) +[2023-10-08 15:32:10,839][102897] Updated weights for policy 0, policy_version 94370 (0.0008) +[2023-10-08 15:32:11,196][102897] Updated weights for policy 0, policy_version 94380 (0.0009) +[2023-10-08 15:32:11,568][102897] Updated weights for policy 0, policy_version 94390 (0.0009) +[2023-10-08 15:32:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 193429504. Throughput: 0: 1787.7, 1: 1815.5. Samples: 48371274. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:32:11,876][101941] Avg episode reward: [(0, '9.220'), (1, '22.230')] +[2023-10-08 15:32:11,942][102897] Updated weights for policy 0, policy_version 94400 (0.0007) +[2023-10-08 15:32:12,345][102898] Updated weights for policy 1, policy_version 94530 (0.0009) +[2023-10-08 15:32:12,711][102898] Updated weights for policy 1, policy_version 94540 (0.0011) +[2023-10-08 15:32:13,088][102898] Updated weights for policy 1, policy_version 94550 (0.0011) +[2023-10-08 15:32:13,455][102898] Updated weights for policy 1, policy_version 94560 (0.0010) +[2023-10-08 15:32:15,599][102897] Updated weights for policy 0, policy_version 94410 (0.0011) +[2023-10-08 15:32:15,976][102897] Updated weights for policy 0, policy_version 94420 (0.0009) +[2023-10-08 15:32:16,336][102897] Updated weights for policy 0, policy_version 94430 (0.0009) +[2023-10-08 15:32:16,875][101941] Fps is (10 sec: 16383.7, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 193527808. Throughput: 0: 1779.1, 1: 1815.4. Samples: 48392448. Policy #0 lag: (min: 19.0, avg: 24.7, max: 51.0) +[2023-10-08 15:32:16,876][101941] Avg episode reward: [(0, '8.610'), (1, '21.370')] +[2023-10-08 15:32:16,889][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000094432_96698368.pth... +[2023-10-08 15:32:16,926][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000092768_94994432.pth +[2023-10-08 15:32:17,200][102898] Updated weights for policy 1, policy_version 94570 (0.0010) +[2023-10-08 15:32:17,566][102898] Updated weights for policy 1, policy_version 94580 (0.0011) +[2023-10-08 15:32:17,942][102898] Updated weights for policy 1, policy_version 94590 (0.0011) +[2023-10-08 15:32:18,008][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000094592_96862208.pth... +[2023-10-08 15:32:18,037][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000092896_95125504.pth +[2023-10-08 15:32:20,207][102897] Updated weights for policy 0, policy_version 94440 (0.0007) +[2023-10-08 15:32:20,587][102897] Updated weights for policy 0, policy_version 94450 (0.0007) +[2023-10-08 15:32:20,964][102897] Updated weights for policy 0, policy_version 94460 (0.0009) +[2023-10-08 15:32:21,613][102898] Updated weights for policy 1, policy_version 94600 (0.0008) +[2023-10-08 15:32:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 193593344. Throughput: 0: 1788.3, 1: 1807.8. Samples: 48403410. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:21,876][101941] Avg episode reward: [(0, '8.950'), (1, '22.610')] +[2023-10-08 15:32:21,977][102898] Updated weights for policy 1, policy_version 94610 (0.0008) +[2023-10-08 15:32:22,354][102898] Updated weights for policy 1, policy_version 94620 (0.0010) +[2023-10-08 15:32:24,710][102897] Updated weights for policy 0, policy_version 94470 (0.0007) +[2023-10-08 15:32:25,082][102897] Updated weights for policy 0, policy_version 94480 (0.0007) +[2023-10-08 15:32:25,448][102897] Updated weights for policy 0, policy_version 94490 (0.0007) +[2023-10-08 15:32:26,091][102898] Updated weights for policy 1, policy_version 94630 (0.0008) +[2023-10-08 15:32:26,456][102898] Updated weights for policy 1, policy_version 94640 (0.0010) +[2023-10-08 15:32:26,829][102898] Updated weights for policy 1, policy_version 94650 (0.0008) +[2023-10-08 15:32:26,875][101941] Fps is (10 sec: 13107.7, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 193658880. Throughput: 0: 1784.7, 1: 1808.4. Samples: 48424718. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:26,875][101941] Avg episode reward: [(0, '9.490'), (1, '21.150')] +[2023-10-08 15:32:29,228][102897] Updated weights for policy 0, policy_version 94500 (0.0007) +[2023-10-08 15:32:29,593][102897] Updated weights for policy 0, policy_version 94510 (0.0007) +[2023-10-08 15:32:29,969][102897] Updated weights for policy 0, policy_version 94520 (0.0009) +[2023-10-08 15:32:30,638][102898] Updated weights for policy 1, policy_version 94660 (0.0011) +[2023-10-08 15:32:30,995][102898] Updated weights for policy 1, policy_version 94670 (0.0008) +[2023-10-08 15:32:31,367][102898] Updated weights for policy 1, policy_version 94680 (0.0007) +[2023-10-08 15:32:31,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.5, 300 sec: 14329.0). Total num frames: 193757184. Throughput: 0: 1776.3, 1: 1811.9. Samples: 48445500. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:31,876][101941] Avg episode reward: [(0, '9.000'), (1, '20.260')] +[2023-10-08 15:32:33,714][102897] Updated weights for policy 0, policy_version 94530 (0.0009) +[2023-10-08 15:32:34,085][102897] Updated weights for policy 0, policy_version 94540 (0.0007) +[2023-10-08 15:32:34,448][102897] Updated weights for policy 0, policy_version 94550 (0.0010) +[2023-10-08 15:32:34,821][102897] Updated weights for policy 0, policy_version 94560 (0.0010) +[2023-10-08 15:32:35,057][102898] Updated weights for policy 1, policy_version 94690 (0.0008) +[2023-10-08 15:32:35,431][102898] Updated weights for policy 1, policy_version 94700 (0.0008) +[2023-10-08 15:32:35,792][102898] Updated weights for policy 1, policy_version 94710 (0.0009) +[2023-10-08 15:32:36,159][102898] Updated weights for policy 1, policy_version 94720 (0.0008) +[2023-10-08 15:32:36,875][101941] Fps is (10 sec: 16383.9, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 193822720. Throughput: 0: 1791.4, 1: 1805.5. Samples: 48457172. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:36,876][101941] Avg episode reward: [(0, '9.380'), (1, '20.610')] +[2023-10-08 15:32:38,530][102897] Updated weights for policy 0, policy_version 94570 (0.0009) +[2023-10-08 15:32:38,894][102897] Updated weights for policy 0, policy_version 94580 (0.0007) +[2023-10-08 15:32:39,271][102897] Updated weights for policy 0, policy_version 94590 (0.0007) +[2023-10-08 15:32:39,844][102898] Updated weights for policy 1, policy_version 94730 (0.0009) +[2023-10-08 15:32:40,219][102898] Updated weights for policy 1, policy_version 94740 (0.0007) +[2023-10-08 15:32:40,577][102898] Updated weights for policy 1, policy_version 94750 (0.0009) +[2023-10-08 15:32:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 193888256. Throughput: 0: 1779.1, 1: 1814.0. Samples: 48478220. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:41,876][101941] Avg episode reward: [(0, '9.700'), (1, '22.730')] +[2023-10-08 15:32:43,056][102897] Updated weights for policy 0, policy_version 94600 (0.0008) +[2023-10-08 15:32:43,418][102897] Updated weights for policy 0, policy_version 94610 (0.0008) +[2023-10-08 15:32:43,801][102897] Updated weights for policy 0, policy_version 94620 (0.0008) +[2023-10-08 15:32:44,310][102898] Updated weights for policy 1, policy_version 94760 (0.0008) +[2023-10-08 15:32:44,676][102898] Updated weights for policy 1, policy_version 94770 (0.0008) +[2023-10-08 15:32:45,039][102898] Updated weights for policy 1, policy_version 94780 (0.0009) +[2023-10-08 15:32:46,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 193953792. Throughput: 0: 1787.5, 1: 1807.2. Samples: 48500594. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:46,876][101941] Avg episode reward: [(0, '9.010'), (1, '22.850')] +[2023-10-08 15:32:47,524][102897] Updated weights for policy 0, policy_version 94630 (0.0009) +[2023-10-08 15:32:47,890][102897] Updated weights for policy 0, policy_version 94640 (0.0007) +[2023-10-08 15:32:48,250][102897] Updated weights for policy 0, policy_version 94650 (0.0008) +[2023-10-08 15:32:48,900][102898] Updated weights for policy 1, policy_version 94790 (0.0010) +[2023-10-08 15:32:49,278][102898] Updated weights for policy 1, policy_version 94800 (0.0008) +[2023-10-08 15:32:49,641][102898] Updated weights for policy 1, policy_version 94810 (0.0008) +[2023-10-08 15:32:51,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194019328. Throughput: 0: 1788.4, 1: 1815.5. Samples: 48510894. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:51,876][101941] Avg episode reward: [(0, '8.410'), (1, '25.470')] +[2023-10-08 15:32:52,061][102897] Updated weights for policy 0, policy_version 94660 (0.0009) +[2023-10-08 15:32:52,427][102897] Updated weights for policy 0, policy_version 94670 (0.0008) +[2023-10-08 15:32:52,800][102897] Updated weights for policy 0, policy_version 94680 (0.0007) +[2023-10-08 15:32:53,384][102898] Updated weights for policy 1, policy_version 94820 (0.0010) +[2023-10-08 15:32:53,761][102898] Updated weights for policy 1, policy_version 94830 (0.0009) +[2023-10-08 15:32:54,115][102898] Updated weights for policy 1, policy_version 94840 (0.0007) +[2023-10-08 15:32:56,612][102897] Updated weights for policy 0, policy_version 94690 (0.0007) +[2023-10-08 15:32:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 194084864. Throughput: 0: 1794.8, 1: 1794.3. Samples: 48532782. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:32:56,876][101941] Avg episode reward: [(0, '8.960'), (1, '29.120')] +[2023-10-08 15:32:56,878][102760] Saving new best policy, reward=29.120! +[2023-10-08 15:32:56,986][102897] Updated weights for policy 0, policy_version 94700 (0.0008) +[2023-10-08 15:32:57,365][102897] Updated weights for policy 0, policy_version 94710 (0.0008) +[2023-10-08 15:32:57,739][102897] Updated weights for policy 0, policy_version 94720 (0.0008) +[2023-10-08 15:32:57,830][102898] Updated weights for policy 1, policy_version 94850 (0.0008) +[2023-10-08 15:32:58,198][102898] Updated weights for policy 1, policy_version 94860 (0.0009) +[2023-10-08 15:32:58,566][102898] Updated weights for policy 1, policy_version 94870 (0.0008) +[2023-10-08 15:32:58,933][102898] Updated weights for policy 1, policy_version 94880 (0.0008) +[2023-10-08 15:33:01,469][102897] Updated weights for policy 0, policy_version 94730 (0.0007) +[2023-10-08 15:33:01,838][102897] Updated weights for policy 0, policy_version 94740 (0.0008) +[2023-10-08 15:33:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194150400. Throughput: 0: 1817.3, 1: 1787.1. Samples: 48554644. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:33:01,875][101941] Avg episode reward: [(0, '9.240'), (1, '28.460')] +[2023-10-08 15:33:02,223][102897] Updated weights for policy 0, policy_version 94750 (0.0008) +[2023-10-08 15:33:02,628][102898] Updated weights for policy 1, policy_version 94890 (0.0007) +[2023-10-08 15:33:03,001][102898] Updated weights for policy 1, policy_version 94900 (0.0007) +[2023-10-08 15:33:03,366][102898] Updated weights for policy 1, policy_version 94910 (0.0008) +[2023-10-08 15:33:06,140][102897] Updated weights for policy 0, policy_version 94760 (0.0009) +[2023-10-08 15:33:06,520][102897] Updated weights for policy 0, policy_version 94770 (0.0009) +[2023-10-08 15:33:06,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 194215936. Throughput: 0: 1794.7, 1: 1793.4. Samples: 48564876. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:33:06,876][101941] Avg episode reward: [(0, '9.140'), (1, '28.550')] +[2023-10-08 15:33:06,885][102897] Updated weights for policy 0, policy_version 94780 (0.0008) +[2023-10-08 15:33:07,017][102898] Updated weights for policy 1, policy_version 94920 (0.0007) +[2023-10-08 15:33:07,388][102898] Updated weights for policy 1, policy_version 94930 (0.0007) +[2023-10-08 15:33:07,756][102898] Updated weights for policy 1, policy_version 94940 (0.0009) +[2023-10-08 15:33:10,496][102897] Updated weights for policy 0, policy_version 94790 (0.0007) +[2023-10-08 15:33:10,864][102897] Updated weights for policy 0, policy_version 94800 (0.0009) +[2023-10-08 15:33:11,245][102897] Updated weights for policy 0, policy_version 94810 (0.0008) +[2023-10-08 15:33:11,453][102898] Updated weights for policy 1, policy_version 94950 (0.0008) +[2023-10-08 15:33:11,819][102898] Updated weights for policy 1, policy_version 94960 (0.0007) +[2023-10-08 15:33:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 194314240. Throughput: 0: 1812.9, 1: 1797.5. Samples: 48587188. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:33:11,875][101941] Avg episode reward: [(0, '8.860'), (1, '26.900')] +[2023-10-08 15:33:12,188][102898] Updated weights for policy 1, policy_version 94970 (0.0007) +[2023-10-08 15:33:14,906][102897] Updated weights for policy 0, policy_version 94820 (0.0007) +[2023-10-08 15:33:15,272][102897] Updated weights for policy 0, policy_version 94830 (0.0007) +[2023-10-08 15:33:15,642][102897] Updated weights for policy 0, policy_version 94840 (0.0008) +[2023-10-08 15:33:16,124][102898] Updated weights for policy 1, policy_version 94980 (0.0007) +[2023-10-08 15:33:16,491][102898] Updated weights for policy 1, policy_version 94990 (0.0008) +[2023-10-08 15:33:16,854][102898] Updated weights for policy 1, policy_version 95000 (0.0009) +[2023-10-08 15:33:16,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 194379776. Throughput: 0: 1795.1, 1: 1813.8. Samples: 48607900. Policy #0 lag: (min: 18.0, avg: 18.0, max: 18.0) +[2023-10-08 15:33:16,876][101941] Avg episode reward: [(0, '9.110'), (1, '25.460')] +[2023-10-08 15:33:19,424][102897] Updated weights for policy 0, policy_version 94850 (0.0007) +[2023-10-08 15:33:19,788][102897] Updated weights for policy 0, policy_version 94860 (0.0008) +[2023-10-08 15:33:20,165][102897] Updated weights for policy 0, policy_version 94870 (0.0009) +[2023-10-08 15:33:20,536][102897] Updated weights for policy 0, policy_version 94880 (0.0008) +[2023-10-08 15:33:20,683][102898] Updated weights for policy 1, policy_version 95010 (0.0009) +[2023-10-08 15:33:21,043][102898] Updated weights for policy 1, policy_version 95020 (0.0010) +[2023-10-08 15:33:21,410][102898] Updated weights for policy 1, policy_version 95030 (0.0008) +[2023-10-08 15:33:21,784][102898] Updated weights for policy 1, policy_version 95040 (0.0008) +[2023-10-08 15:33:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 194478080. Throughput: 0: 1812.2, 1: 1797.2. Samples: 48619598. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:21,875][101941] Avg episode reward: [(0, '8.760'), (1, '23.990')] +[2023-10-08 15:33:24,252][102897] Updated weights for policy 0, policy_version 94890 (0.0007) +[2023-10-08 15:33:24,622][102897] Updated weights for policy 0, policy_version 94900 (0.0007) +[2023-10-08 15:33:24,987][102897] Updated weights for policy 0, policy_version 94910 (0.0008) +[2023-10-08 15:33:25,493][102898] Updated weights for policy 1, policy_version 95050 (0.0008) +[2023-10-08 15:33:25,855][102898] Updated weights for policy 1, policy_version 95060 (0.0010) +[2023-10-08 15:33:26,220][102898] Updated weights for policy 1, policy_version 95070 (0.0010) +[2023-10-08 15:33:26,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.5, 300 sec: 14329.1). Total num frames: 194543616. Throughput: 0: 1787.1, 1: 1808.4. Samples: 48640020. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:26,876][101941] Avg episode reward: [(0, '9.150'), (1, '28.870')] +[2023-10-08 15:33:28,909][102897] Updated weights for policy 0, policy_version 94920 (0.0009) +[2023-10-08 15:33:29,274][102897] Updated weights for policy 0, policy_version 94930 (0.0010) +[2023-10-08 15:33:29,643][102897] Updated weights for policy 0, policy_version 94940 (0.0009) +[2023-10-08 15:33:29,875][102898] Updated weights for policy 1, policy_version 95080 (0.0009) +[2023-10-08 15:33:30,243][102898] Updated weights for policy 1, policy_version 95090 (0.0008) +[2023-10-08 15:33:30,605][102898] Updated weights for policy 1, policy_version 95100 (0.0008) +[2023-10-08 15:33:31,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 194609152. Throughput: 0: 1782.8, 1: 1792.4. Samples: 48661478. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:31,876][101941] Avg episode reward: [(0, '10.100'), (1, '26.950')] +[2023-10-08 15:33:33,466][102897] Updated weights for policy 0, policy_version 94950 (0.0008) +[2023-10-08 15:33:33,838][102897] Updated weights for policy 0, policy_version 94960 (0.0010) +[2023-10-08 15:33:34,204][102897] Updated weights for policy 0, policy_version 94970 (0.0009) +[2023-10-08 15:33:34,366][102898] Updated weights for policy 1, policy_version 95110 (0.0009) +[2023-10-08 15:33:34,737][102898] Updated weights for policy 1, policy_version 95120 (0.0010) +[2023-10-08 15:33:35,103][102898] Updated weights for policy 1, policy_version 95130 (0.0009) +[2023-10-08 15:33:36,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194674688. Throughput: 0: 1778.1, 1: 1804.5. Samples: 48672112. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:36,875][101941] Avg episode reward: [(0, '9.290'), (1, '26.650')] +[2023-10-08 15:33:37,915][102897] Updated weights for policy 0, policy_version 94980 (0.0008) +[2023-10-08 15:33:38,289][102897] Updated weights for policy 0, policy_version 94990 (0.0008) +[2023-10-08 15:33:38,659][102897] Updated weights for policy 0, policy_version 95000 (0.0009) +[2023-10-08 15:33:38,712][102898] Updated weights for policy 1, policy_version 95140 (0.0009) +[2023-10-08 15:33:39,075][102898] Updated weights for policy 1, policy_version 95150 (0.0010) +[2023-10-08 15:33:39,437][102898] Updated weights for policy 1, policy_version 95160 (0.0007) +[2023-10-08 15:33:41,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194740224. Throughput: 0: 1773.3, 1: 1797.9. Samples: 48693484. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:41,875][101941] Avg episode reward: [(0, '8.540'), (1, '29.400')] +[2023-10-08 15:33:41,876][102760] Saving new best policy, reward=29.400! +[2023-10-08 15:33:42,538][102897] Updated weights for policy 0, policy_version 95010 (0.0008) +[2023-10-08 15:33:42,905][102897] Updated weights for policy 0, policy_version 95020 (0.0007) +[2023-10-08 15:33:43,102][102898] Updated weights for policy 1, policy_version 95170 (0.0008) +[2023-10-08 15:33:43,269][102897] Updated weights for policy 0, policy_version 95030 (0.0009) +[2023-10-08 15:33:43,460][102898] Updated weights for policy 1, policy_version 95180 (0.0007) +[2023-10-08 15:33:43,644][102897] Updated weights for policy 0, policy_version 95040 (0.0007) +[2023-10-08 15:33:43,823][102898] Updated weights for policy 1, policy_version 95190 (0.0008) +[2023-10-08 15:33:44,190][102898] Updated weights for policy 1, policy_version 95200 (0.0010) +[2023-10-08 15:33:46,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194805760. Throughput: 0: 1775.3, 1: 1802.3. Samples: 48715636. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:46,876][101941] Avg episode reward: [(0, '8.760'), (1, '25.480')] +[2023-10-08 15:33:47,594][102897] Updated weights for policy 0, policy_version 95050 (0.0009) +[2023-10-08 15:33:47,957][102897] Updated weights for policy 0, policy_version 95060 (0.0009) +[2023-10-08 15:33:48,120][102898] Updated weights for policy 1, policy_version 95210 (0.0007) +[2023-10-08 15:33:48,331][102897] Updated weights for policy 0, policy_version 95070 (0.0007) +[2023-10-08 15:33:48,488][102898] Updated weights for policy 1, policy_version 95220 (0.0010) +[2023-10-08 15:33:48,854][102898] Updated weights for policy 1, policy_version 95230 (0.0008) +[2023-10-08 15:33:51,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194871296. Throughput: 0: 1767.2, 1: 1799.7. Samples: 48725388. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:51,876][101941] Avg episode reward: [(0, '8.900'), (1, '25.050')] +[2023-10-08 15:33:52,157][102897] Updated weights for policy 0, policy_version 95080 (0.0008) +[2023-10-08 15:33:52,533][102897] Updated weights for policy 0, policy_version 95090 (0.0008) +[2023-10-08 15:33:52,629][102898] Updated weights for policy 1, policy_version 95240 (0.0007) +[2023-10-08 15:33:52,909][102897] Updated weights for policy 0, policy_version 95100 (0.0009) +[2023-10-08 15:33:52,996][102898] Updated weights for policy 1, policy_version 95250 (0.0007) +[2023-10-08 15:33:53,360][102898] Updated weights for policy 1, policy_version 95260 (0.0007) +[2023-10-08 15:33:56,572][102897] Updated weights for policy 0, policy_version 95110 (0.0009) +[2023-10-08 15:33:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 194936832. Throughput: 0: 1776.4, 1: 1783.7. Samples: 48747394. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:33:56,876][101941] Avg episode reward: [(0, '8.760'), (1, '24.980')] +[2023-10-08 15:33:56,931][102897] Updated weights for policy 0, policy_version 95120 (0.0008) +[2023-10-08 15:33:57,240][102898] Updated weights for policy 1, policy_version 95270 (0.0009) +[2023-10-08 15:33:57,303][102897] Updated weights for policy 0, policy_version 95130 (0.0008) +[2023-10-08 15:33:57,609][102898] Updated weights for policy 1, policy_version 95280 (0.0007) +[2023-10-08 15:33:57,981][102898] Updated weights for policy 1, policy_version 95290 (0.0011) +[2023-10-08 15:34:01,033][102897] Updated weights for policy 0, policy_version 95140 (0.0008) +[2023-10-08 15:34:01,411][102897] Updated weights for policy 0, policy_version 95150 (0.0008) +[2023-10-08 15:34:01,783][102897] Updated weights for policy 0, policy_version 95160 (0.0008) +[2023-10-08 15:34:01,798][102898] Updated weights for policy 1, policy_version 95300 (0.0010) +[2023-10-08 15:34:01,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195002368. Throughput: 0: 1789.7, 1: 1791.7. Samples: 48769062. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:34:01,875][101941] Avg episode reward: [(0, '8.860'), (1, '26.730')] +[2023-10-08 15:34:02,162][102898] Updated weights for policy 1, policy_version 95310 (0.0008) +[2023-10-08 15:34:02,526][102898] Updated weights for policy 1, policy_version 95320 (0.0010) +[2023-10-08 15:34:05,451][102897] Updated weights for policy 0, policy_version 95170 (0.0008) +[2023-10-08 15:34:05,818][102897] Updated weights for policy 0, policy_version 95180 (0.0009) +[2023-10-08 15:34:06,186][102897] Updated weights for policy 0, policy_version 95190 (0.0010) +[2023-10-08 15:34:06,291][102898] Updated weights for policy 1, policy_version 95330 (0.0007) +[2023-10-08 15:34:06,557][102897] Updated weights for policy 0, policy_version 95200 (0.0008) +[2023-10-08 15:34:06,656][102898] Updated weights for policy 1, policy_version 95340 (0.0009) +[2023-10-08 15:34:06,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 195100672. Throughput: 0: 1773.5, 1: 1780.8. Samples: 48779542. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:34:06,876][101941] Avg episode reward: [(0, '9.110'), (1, '27.070')] +[2023-10-08 15:34:07,022][102898] Updated weights for policy 1, policy_version 95350 (0.0010) +[2023-10-08 15:34:07,392][102898] Updated weights for policy 1, policy_version 95360 (0.0009) +[2023-10-08 15:34:10,235][102897] Updated weights for policy 0, policy_version 95210 (0.0007) +[2023-10-08 15:34:10,615][102897] Updated weights for policy 0, policy_version 95220 (0.0007) +[2023-10-08 15:34:10,980][102897] Updated weights for policy 0, policy_version 95230 (0.0008) +[2023-10-08 15:34:11,185][102898] Updated weights for policy 1, policy_version 95370 (0.0008) +[2023-10-08 15:34:11,549][102898] Updated weights for policy 1, policy_version 95380 (0.0010) +[2023-10-08 15:34:11,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195166208. Throughput: 0: 1793.4, 1: 1790.2. Samples: 48801282. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:34:11,876][101941] Avg episode reward: [(0, '8.720'), (1, '26.000')] +[2023-10-08 15:34:11,914][102898] Updated weights for policy 1, policy_version 95390 (0.0009) +[2023-10-08 15:34:14,878][102897] Updated weights for policy 0, policy_version 95240 (0.0007) +[2023-10-08 15:34:15,246][102897] Updated weights for policy 0, policy_version 95250 (0.0007) +[2023-10-08 15:34:15,611][102897] Updated weights for policy 0, policy_version 95260 (0.0007) +[2023-10-08 15:34:15,776][102898] Updated weights for policy 1, policy_version 95400 (0.0008) +[2023-10-08 15:34:16,136][102898] Updated weights for policy 1, policy_version 95410 (0.0008) +[2023-10-08 15:34:16,505][102898] Updated weights for policy 1, policy_version 95420 (0.0007) +[2023-10-08 15:34:16,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.7, 300 sec: 14329.1). Total num frames: 195264512. Throughput: 0: 1777.1, 1: 1780.9. Samples: 48821590. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:34:16,875][101941] Avg episode reward: [(0, '8.450'), (1, '26.300')] +[2023-10-08 15:34:16,883][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000095264_97550336.pth... +[2023-10-08 15:34:16,883][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000095424_97714176.pth... +[2023-10-08 15:34:16,912][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000093600_95846400.pth +[2023-10-08 15:34:16,924][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000093728_95977472.pth +[2023-10-08 15:34:19,293][102897] Updated weights for policy 0, policy_version 95270 (0.0009) +[2023-10-08 15:34:19,666][102897] Updated weights for policy 0, policy_version 95280 (0.0009) +[2023-10-08 15:34:20,025][102897] Updated weights for policy 0, policy_version 95290 (0.0010) +[2023-10-08 15:34:20,402][102898] Updated weights for policy 1, policy_version 95430 (0.0008) +[2023-10-08 15:34:20,786][102898] Updated weights for policy 1, policy_version 95440 (0.0010) +[2023-10-08 15:34:21,149][102898] Updated weights for policy 1, policy_version 95450 (0.0007) +[2023-10-08 15:34:21,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 195330048. Throughput: 0: 1803.7, 1: 1784.4. Samples: 48833578. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:21,876][101941] Avg episode reward: [(0, '8.710'), (1, '28.460')] +[2023-10-08 15:34:23,900][102897] Updated weights for policy 0, policy_version 95300 (0.0010) +[2023-10-08 15:34:24,273][102897] Updated weights for policy 0, policy_version 95310 (0.0008) +[2023-10-08 15:34:24,632][102897] Updated weights for policy 0, policy_version 95320 (0.0009) +[2023-10-08 15:34:24,931][102898] Updated weights for policy 1, policy_version 95460 (0.0008) +[2023-10-08 15:34:25,295][102898] Updated weights for policy 1, policy_version 95470 (0.0008) +[2023-10-08 15:34:25,662][102898] Updated weights for policy 1, policy_version 95480 (0.0008) +[2023-10-08 15:34:26,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195395584. Throughput: 0: 1775.5, 1: 1785.0. Samples: 48853708. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:26,876][101941] Avg episode reward: [(0, '9.550'), (1, '24.340')] +[2023-10-08 15:34:28,326][102897] Updated weights for policy 0, policy_version 95330 (0.0008) +[2023-10-08 15:34:28,696][102897] Updated weights for policy 0, policy_version 95340 (0.0009) +[2023-10-08 15:34:29,071][102897] Updated weights for policy 0, policy_version 95350 (0.0010) +[2023-10-08 15:34:29,438][102897] Updated weights for policy 0, policy_version 95360 (0.0007) +[2023-10-08 15:34:29,490][102898] Updated weights for policy 1, policy_version 95490 (0.0010) +[2023-10-08 15:34:29,848][102898] Updated weights for policy 1, policy_version 95500 (0.0007) +[2023-10-08 15:34:30,214][102898] Updated weights for policy 1, policy_version 95510 (0.0007) +[2023-10-08 15:34:30,577][102898] Updated weights for policy 1, policy_version 95520 (0.0009) +[2023-10-08 15:34:31,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195461120. Throughput: 0: 1781.1, 1: 1768.0. Samples: 48875344. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:31,875][101941] Avg episode reward: [(0, '9.530'), (1, '24.520')] +[2023-10-08 15:34:33,178][102897] Updated weights for policy 0, policy_version 95370 (0.0008) +[2023-10-08 15:34:33,544][102897] Updated weights for policy 0, policy_version 95380 (0.0008) +[2023-10-08 15:34:33,910][102897] Updated weights for policy 0, policy_version 95390 (0.0008) +[2023-10-08 15:34:34,315][102898] Updated weights for policy 1, policy_version 95530 (0.0010) +[2023-10-08 15:34:34,691][102898] Updated weights for policy 1, policy_version 95540 (0.0009) +[2023-10-08 15:34:35,060][102898] Updated weights for policy 1, policy_version 95550 (0.0008) +[2023-10-08 15:34:36,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 195526656. Throughput: 0: 1782.3, 1: 1788.8. Samples: 48886088. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:36,876][101941] Avg episode reward: [(0, '9.190'), (1, '24.450')] +[2023-10-08 15:34:37,844][102897] Updated weights for policy 0, policy_version 95400 (0.0009) +[2023-10-08 15:34:38,232][102897] Updated weights for policy 0, policy_version 95410 (0.0008) +[2023-10-08 15:34:38,596][102897] Updated weights for policy 0, policy_version 95420 (0.0007) +[2023-10-08 15:34:38,748][102898] Updated weights for policy 1, policy_version 95560 (0.0007) +[2023-10-08 15:34:39,120][102898] Updated weights for policy 1, policy_version 95570 (0.0007) +[2023-10-08 15:34:39,483][102898] Updated weights for policy 1, policy_version 95580 (0.0007) +[2023-10-08 15:34:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 195592192. Throughput: 0: 1783.7, 1: 1777.4. Samples: 48907642. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:41,876][101941] Avg episode reward: [(0, '9.260'), (1, '24.710')] +[2023-10-08 15:34:42,223][102897] Updated weights for policy 0, policy_version 95430 (0.0008) +[2023-10-08 15:34:42,602][102897] Updated weights for policy 0, policy_version 95440 (0.0008) +[2023-10-08 15:34:42,964][102897] Updated weights for policy 0, policy_version 95450 (0.0008) +[2023-10-08 15:34:43,089][102898] Updated weights for policy 1, policy_version 95590 (0.0009) +[2023-10-08 15:34:43,454][102898] Updated weights for policy 1, policy_version 95600 (0.0008) +[2023-10-08 15:34:43,827][102898] Updated weights for policy 1, policy_version 95610 (0.0008) +[2023-10-08 15:34:46,807][102897] Updated weights for policy 0, policy_version 95460 (0.0009) +[2023-10-08 15:34:46,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195657728. Throughput: 0: 1792.0, 1: 1782.4. Samples: 48929908. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:46,875][101941] Avg episode reward: [(0, '8.570'), (1, '25.300')] +[2023-10-08 15:34:47,185][102897] Updated weights for policy 0, policy_version 95470 (0.0009) +[2023-10-08 15:34:47,545][102897] Updated weights for policy 0, policy_version 95480 (0.0008) +[2023-10-08 15:34:47,611][102898] Updated weights for policy 1, policy_version 95620 (0.0007) +[2023-10-08 15:34:47,979][102898] Updated weights for policy 1, policy_version 95630 (0.0008) +[2023-10-08 15:34:48,351][102898] Updated weights for policy 1, policy_version 95640 (0.0008) +[2023-10-08 15:34:51,369][102897] Updated weights for policy 0, policy_version 95490 (0.0008) +[2023-10-08 15:34:51,732][102897] Updated weights for policy 0, policy_version 95500 (0.0008) +[2023-10-08 15:34:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195723264. Throughput: 0: 1777.5, 1: 1784.1. Samples: 48939814. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:51,876][101941] Avg episode reward: [(0, '8.690'), (1, '28.290')] +[2023-10-08 15:34:52,020][102898] Updated weights for policy 1, policy_version 95650 (0.0009) +[2023-10-08 15:34:52,109][102897] Updated weights for policy 0, policy_version 95510 (0.0009) +[2023-10-08 15:34:52,378][102898] Updated weights for policy 1, policy_version 95660 (0.0007) +[2023-10-08 15:34:52,469][102897] Updated weights for policy 0, policy_version 95520 (0.0007) +[2023-10-08 15:34:52,746][102898] Updated weights for policy 1, policy_version 95670 (0.0009) +[2023-10-08 15:34:53,104][102898] Updated weights for policy 1, policy_version 95680 (0.0011) +[2023-10-08 15:34:56,138][102897] Updated weights for policy 0, policy_version 95530 (0.0011) +[2023-10-08 15:34:56,513][102897] Updated weights for policy 0, policy_version 95540 (0.0009) +[2023-10-08 15:34:56,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195788800. Throughput: 0: 1795.8, 1: 1784.0. Samples: 48962372. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:34:56,875][101941] Avg episode reward: [(0, '8.750'), (1, '26.830')] +[2023-10-08 15:34:56,881][102897] Updated weights for policy 0, policy_version 95550 (0.0008) +[2023-10-08 15:34:56,943][102898] Updated weights for policy 1, policy_version 95690 (0.0008) +[2023-10-08 15:34:57,311][102898] Updated weights for policy 1, policy_version 95700 (0.0007) +[2023-10-08 15:34:57,661][102898] Updated weights for policy 1, policy_version 95710 (0.0007) +[2023-10-08 15:35:00,739][102897] Updated weights for policy 0, policy_version 95560 (0.0008) +[2023-10-08 15:35:01,112][102897] Updated weights for policy 0, policy_version 95570 (0.0007) +[2023-10-08 15:35:01,371][102898] Updated weights for policy 1, policy_version 95720 (0.0008) +[2023-10-08 15:35:01,475][102897] Updated weights for policy 0, policy_version 95580 (0.0007) +[2023-10-08 15:35:01,741][102898] Updated weights for policy 1, policy_version 95730 (0.0007) +[2023-10-08 15:35:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.0). Total num frames: 195887104. Throughput: 0: 1785.6, 1: 1805.0. Samples: 48983166. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:35:01,875][101941] Avg episode reward: [(0, '8.960'), (1, '25.170')] +[2023-10-08 15:35:02,116][102898] Updated weights for policy 1, policy_version 95740 (0.0010) +[2023-10-08 15:35:05,301][102897] Updated weights for policy 0, policy_version 95590 (0.0008) +[2023-10-08 15:35:05,672][102897] Updated weights for policy 0, policy_version 95600 (0.0007) +[2023-10-08 15:35:06,041][102897] Updated weights for policy 0, policy_version 95610 (0.0008) +[2023-10-08 15:35:06,181][102898] Updated weights for policy 1, policy_version 95750 (0.0009) +[2023-10-08 15:35:06,567][102898] Updated weights for policy 1, policy_version 95760 (0.0008) +[2023-10-08 15:35:06,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 195952640. Throughput: 0: 1785.4, 1: 1790.5. Samples: 48994496. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:35:06,875][101941] Avg episode reward: [(0, '9.890'), (1, '22.430')] +[2023-10-08 15:35:06,935][102898] Updated weights for policy 1, policy_version 95770 (0.0008) +[2023-10-08 15:35:09,784][102897] Updated weights for policy 0, policy_version 95620 (0.0009) +[2023-10-08 15:35:10,155][102897] Updated weights for policy 0, policy_version 95630 (0.0009) +[2023-10-08 15:35:10,531][102897] Updated weights for policy 0, policy_version 95640 (0.0008) +[2023-10-08 15:35:10,619][102898] Updated weights for policy 1, policy_version 95780 (0.0008) +[2023-10-08 15:35:10,991][102898] Updated weights for policy 1, policy_version 95790 (0.0011) +[2023-10-08 15:35:11,350][102898] Updated weights for policy 1, policy_version 95800 (0.0010) +[2023-10-08 15:35:11,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 196050944. Throughput: 0: 1790.0, 1: 1807.4. Samples: 49015592. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:35:11,876][101941] Avg episode reward: [(0, '8.830'), (1, '22.430')] +[2023-10-08 15:35:14,281][102897] Updated weights for policy 0, policy_version 95650 (0.0008) +[2023-10-08 15:35:14,653][102897] Updated weights for policy 0, policy_version 95660 (0.0009) +[2023-10-08 15:35:15,038][102897] Updated weights for policy 0, policy_version 95670 (0.0010) +[2023-10-08 15:35:15,334][102898] Updated weights for policy 1, policy_version 95810 (0.0010) +[2023-10-08 15:35:15,400][102897] Updated weights for policy 0, policy_version 95680 (0.0009) +[2023-10-08 15:35:15,696][102898] Updated weights for policy 1, policy_version 95820 (0.0008) +[2023-10-08 15:35:16,052][102898] Updated weights for policy 1, policy_version 95830 (0.0007) +[2023-10-08 15:35:16,418][102898] Updated weights for policy 1, policy_version 95840 (0.0008) +[2023-10-08 15:35:16,875][101941] Fps is (10 sec: 16383.4, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 196116480. Throughput: 0: 1777.6, 1: 1786.0. Samples: 49035710. Policy #0 lag: (min: 31.0, avg: 35.8, max: 63.0) +[2023-10-08 15:35:16,876][101941] Avg episode reward: [(0, '8.980'), (1, '26.790')] +[2023-10-08 15:35:19,095][102897] Updated weights for policy 0, policy_version 95690 (0.0008) +[2023-10-08 15:35:19,464][102897] Updated weights for policy 0, policy_version 95700 (0.0009) +[2023-10-08 15:35:19,838][102897] Updated weights for policy 0, policy_version 95710 (0.0011) +[2023-10-08 15:35:20,279][102898] Updated weights for policy 1, policy_version 95850 (0.0012) +[2023-10-08 15:35:20,644][102898] Updated weights for policy 1, policy_version 95860 (0.0009) +[2023-10-08 15:35:21,007][102898] Updated weights for policy 1, policy_version 95870 (0.0007) +[2023-10-08 15:35:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 196182016. Throughput: 0: 1795.4, 1: 1796.5. Samples: 49047720. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:21,876][101941] Avg episode reward: [(0, '9.370'), (1, '25.880')] +[2023-10-08 15:35:23,596][102897] Updated weights for policy 0, policy_version 95720 (0.0010) +[2023-10-08 15:35:23,958][102897] Updated weights for policy 0, policy_version 95730 (0.0010) +[2023-10-08 15:35:24,330][102897] Updated weights for policy 0, policy_version 95740 (0.0008) +[2023-10-08 15:35:24,787][102898] Updated weights for policy 1, policy_version 95880 (0.0009) +[2023-10-08 15:35:25,160][102898] Updated weights for policy 1, policy_version 95890 (0.0011) +[2023-10-08 15:35:25,522][102898] Updated weights for policy 1, policy_version 95900 (0.0010) +[2023-10-08 15:35:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 196247552. Throughput: 0: 1780.0, 1: 1788.3. Samples: 49068216. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:26,876][101941] Avg episode reward: [(0, '9.600'), (1, '29.500')] +[2023-10-08 15:35:26,877][102760] Saving new best policy, reward=29.500! +[2023-10-08 15:35:28,114][102897] Updated weights for policy 0, policy_version 95750 (0.0007) +[2023-10-08 15:35:28,494][102897] Updated weights for policy 0, policy_version 95760 (0.0008) +[2023-10-08 15:35:28,865][102897] Updated weights for policy 0, policy_version 95770 (0.0008) +[2023-10-08 15:35:29,249][102898] Updated weights for policy 1, policy_version 95910 (0.0008) +[2023-10-08 15:35:29,612][102898] Updated weights for policy 1, policy_version 95920 (0.0011) +[2023-10-08 15:35:29,983][102898] Updated weights for policy 1, policy_version 95930 (0.0010) +[2023-10-08 15:35:31,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 196313088. Throughput: 0: 1789.2, 1: 1782.0. Samples: 49090612. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:31,876][101941] Avg episode reward: [(0, '10.350'), (1, '30.360')] +[2023-10-08 15:35:31,886][102760] Saving new best policy, reward=30.360! +[2023-10-08 15:35:32,550][102897] Updated weights for policy 0, policy_version 95780 (0.0008) +[2023-10-08 15:35:32,917][102897] Updated weights for policy 0, policy_version 95790 (0.0010) +[2023-10-08 15:35:33,285][102897] Updated weights for policy 0, policy_version 95800 (0.0007) +[2023-10-08 15:35:33,663][102898] Updated weights for policy 1, policy_version 95940 (0.0009) +[2023-10-08 15:35:34,030][102898] Updated weights for policy 1, policy_version 95950 (0.0008) +[2023-10-08 15:35:34,393][102898] Updated weights for policy 1, policy_version 95960 (0.0008) +[2023-10-08 15:35:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 196378624. Throughput: 0: 1785.5, 1: 1790.3. Samples: 49100728. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:36,876][101941] Avg episode reward: [(0, '10.340'), (1, '31.890')] +[2023-10-08 15:35:36,878][102760] Saving new best policy, reward=31.890! +[2023-10-08 15:35:37,185][102897] Updated weights for policy 0, policy_version 95810 (0.0007) +[2023-10-08 15:35:37,561][102897] Updated weights for policy 0, policy_version 95820 (0.0008) +[2023-10-08 15:35:37,933][102897] Updated weights for policy 0, policy_version 95830 (0.0010) +[2023-10-08 15:35:38,060][102898] Updated weights for policy 1, policy_version 95970 (0.0008) +[2023-10-08 15:35:38,300][102897] Updated weights for policy 0, policy_version 95840 (0.0007) +[2023-10-08 15:35:38,415][102898] Updated weights for policy 1, policy_version 95980 (0.0007) +[2023-10-08 15:35:38,776][102898] Updated weights for policy 1, policy_version 95990 (0.0008) +[2023-10-08 15:35:39,144][102898] Updated weights for policy 1, policy_version 96000 (0.0007) +[2023-10-08 15:35:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 196444160. Throughput: 0: 1777.9, 1: 1786.5. Samples: 49122772. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:41,876][101941] Avg episode reward: [(0, '9.500'), (1, '30.420')] +[2023-10-08 15:35:42,051][102897] Updated weights for policy 0, policy_version 95850 (0.0009) +[2023-10-08 15:35:42,428][102897] Updated weights for policy 0, policy_version 95860 (0.0009) +[2023-10-08 15:35:42,796][102897] Updated weights for policy 0, policy_version 95870 (0.0007) +[2023-10-08 15:35:42,837][102898] Updated weights for policy 1, policy_version 96010 (0.0007) +[2023-10-08 15:35:43,203][102898] Updated weights for policy 1, policy_version 96020 (0.0008) +[2023-10-08 15:35:43,568][102898] Updated weights for policy 1, policy_version 96030 (0.0007) +[2023-10-08 15:35:46,659][102897] Updated weights for policy 0, policy_version 95880 (0.0009) +[2023-10-08 15:35:46,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 196509696. Throughput: 0: 1797.7, 1: 1798.9. Samples: 49145012. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:46,875][101941] Avg episode reward: [(0, '9.370'), (1, '30.860')] +[2023-10-08 15:35:47,023][102897] Updated weights for policy 0, policy_version 95890 (0.0007) +[2023-10-08 15:35:47,104][102898] Updated weights for policy 1, policy_version 96040 (0.0007) +[2023-10-08 15:35:47,377][102897] Updated weights for policy 0, policy_version 95900 (0.0007) +[2023-10-08 15:35:47,464][102898] Updated weights for policy 1, policy_version 96050 (0.0007) +[2023-10-08 15:35:47,832][102898] Updated weights for policy 1, policy_version 96060 (0.0009) +[2023-10-08 15:35:51,162][102897] Updated weights for policy 0, policy_version 95910 (0.0007) +[2023-10-08 15:35:51,528][102897] Updated weights for policy 0, policy_version 95920 (0.0007) +[2023-10-08 15:35:51,549][102898] Updated weights for policy 1, policy_version 96070 (0.0010) +[2023-10-08 15:35:51,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 196575232. Throughput: 0: 1776.3, 1: 1789.5. Samples: 49154954. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:51,876][101941] Avg episode reward: [(0, '9.190'), (1, '29.730')] +[2023-10-08 15:35:51,892][102897] Updated weights for policy 0, policy_version 95930 (0.0008) +[2023-10-08 15:35:51,927][102898] Updated weights for policy 1, policy_version 96080 (0.0009) +[2023-10-08 15:35:52,287][102898] Updated weights for policy 1, policy_version 96090 (0.0009) +[2023-10-08 15:35:55,680][102897] Updated weights for policy 0, policy_version 95940 (0.0010) +[2023-10-08 15:35:56,049][102897] Updated weights for policy 0, policy_version 95950 (0.0011) +[2023-10-08 15:35:56,249][102898] Updated weights for policy 1, policy_version 96100 (0.0010) +[2023-10-08 15:35:56,421][102897] Updated weights for policy 0, policy_version 95960 (0.0009) +[2023-10-08 15:35:56,617][102898] Updated weights for policy 1, policy_version 96110 (0.0009) +[2023-10-08 15:35:56,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 196673536. Throughput: 0: 1800.5, 1: 1790.6. Samples: 49177192. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:35:56,876][101941] Avg episode reward: [(0, '9.240'), (1, '29.050')] +[2023-10-08 15:35:56,982][102898] Updated weights for policy 1, policy_version 96120 (0.0008) +[2023-10-08 15:36:00,216][102897] Updated weights for policy 0, policy_version 95970 (0.0008) +[2023-10-08 15:36:00,579][102897] Updated weights for policy 0, policy_version 95980 (0.0007) +[2023-10-08 15:36:00,844][102898] Updated weights for policy 1, policy_version 96130 (0.0007) +[2023-10-08 15:36:00,943][102897] Updated weights for policy 0, policy_version 95990 (0.0007) +[2023-10-08 15:36:01,209][102898] Updated weights for policy 1, policy_version 96140 (0.0008) +[2023-10-08 15:36:01,309][102897] Updated weights for policy 0, policy_version 96000 (0.0007) +[2023-10-08 15:36:01,578][102898] Updated weights for policy 1, policy_version 96150 (0.0008) +[2023-10-08 15:36:01,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 196739072. Throughput: 0: 1776.9, 1: 1806.1. Samples: 49196946. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:36:01,875][101941] Avg episode reward: [(0, '9.730'), (1, '30.920')] +[2023-10-08 15:36:01,938][102898] Updated weights for policy 1, policy_version 96160 (0.0010) +[2023-10-08 15:36:05,136][102897] Updated weights for policy 0, policy_version 96010 (0.0009) +[2023-10-08 15:36:05,495][102897] Updated weights for policy 0, policy_version 96020 (0.0009) +[2023-10-08 15:36:05,579][102898] Updated weights for policy 1, policy_version 96170 (0.0008) +[2023-10-08 15:36:05,869][102897] Updated weights for policy 0, policy_version 96030 (0.0009) +[2023-10-08 15:36:05,934][102898] Updated weights for policy 1, policy_version 96180 (0.0009) +[2023-10-08 15:36:06,307][102898] Updated weights for policy 1, policy_version 96190 (0.0008) +[2023-10-08 15:36:06,875][101941] Fps is (10 sec: 16384.0, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 196837376. Throughput: 0: 1793.7, 1: 1792.7. Samples: 49209108. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:36:06,876][101941] Avg episode reward: [(0, '9.030'), (1, '28.530')] +[2023-10-08 15:36:09,739][102897] Updated weights for policy 0, policy_version 96040 (0.0008) +[2023-10-08 15:36:09,978][102898] Updated weights for policy 1, policy_version 96200 (0.0007) +[2023-10-08 15:36:10,112][102897] Updated weights for policy 0, policy_version 96050 (0.0008) +[2023-10-08 15:36:10,349][102898] Updated weights for policy 1, policy_version 96210 (0.0008) +[2023-10-08 15:36:10,486][102897] Updated weights for policy 0, policy_version 96060 (0.0008) +[2023-10-08 15:36:10,712][102898] Updated weights for policy 1, policy_version 96220 (0.0007) +[2023-10-08 15:36:11,875][101941] Fps is (10 sec: 16383.5, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 196902912. Throughput: 0: 1776.8, 1: 1798.3. Samples: 49229096. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:36:11,876][101941] Avg episode reward: [(0, '8.250'), (1, '29.580')] +[2023-10-08 15:36:14,268][102897] Updated weights for policy 0, policy_version 96070 (0.0007) +[2023-10-08 15:36:14,494][102898] Updated weights for policy 1, policy_version 96230 (0.0007) +[2023-10-08 15:36:14,639][102897] Updated weights for policy 0, policy_version 96080 (0.0007) +[2023-10-08 15:36:14,866][102898] Updated weights for policy 1, policy_version 96240 (0.0007) +[2023-10-08 15:36:14,998][102897] Updated weights for policy 0, policy_version 96090 (0.0007) +[2023-10-08 15:36:15,236][102898] Updated weights for policy 1, policy_version 96250 (0.0007) +[2023-10-08 15:36:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 196968448. Throughput: 0: 1759.9, 1: 1787.9. Samples: 49250264. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:36:16,876][101941] Avg episode reward: [(0, '8.840'), (1, '31.440')] +[2023-10-08 15:36:16,885][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000096256_98566144.pth... +[2023-10-08 15:36:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000096096_98402304.pth... +[2023-10-08 15:36:16,922][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000094432_96698368.pth +[2023-10-08 15:36:16,924][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000094592_96862208.pth +[2023-10-08 15:36:18,643][102897] Updated weights for policy 0, policy_version 96100 (0.0007) +[2023-10-08 15:36:19,011][102897] Updated weights for policy 0, policy_version 96110 (0.0009) +[2023-10-08 15:36:19,071][102898] Updated weights for policy 1, policy_version 96260 (0.0008) +[2023-10-08 15:36:19,381][102897] Updated weights for policy 0, policy_version 96120 (0.0008) +[2023-10-08 15:36:19,427][102898] Updated weights for policy 1, policy_version 96270 (0.0007) +[2023-10-08 15:36:19,799][102898] Updated weights for policy 1, policy_version 96280 (0.0007) +[2023-10-08 15:36:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 197033984. Throughput: 0: 1771.2, 1: 1792.5. Samples: 49261096. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:21,876][101941] Avg episode reward: [(0, '9.360'), (1, '28.780')] +[2023-10-08 15:36:23,063][102897] Updated weights for policy 0, policy_version 96130 (0.0008) +[2023-10-08 15:36:23,438][102897] Updated weights for policy 0, policy_version 96140 (0.0007) +[2023-10-08 15:36:23,565][102898] Updated weights for policy 1, policy_version 96290 (0.0007) +[2023-10-08 15:36:23,814][102897] Updated weights for policy 0, policy_version 96150 (0.0007) +[2023-10-08 15:36:23,933][102898] Updated weights for policy 1, policy_version 96300 (0.0009) +[2023-10-08 15:36:24,173][102897] Updated weights for policy 0, policy_version 96160 (0.0007) +[2023-10-08 15:36:24,298][102898] Updated weights for policy 1, policy_version 96310 (0.0008) +[2023-10-08 15:36:24,659][102898] Updated weights for policy 1, policy_version 96320 (0.0007) +[2023-10-08 15:36:26,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 197099520. Throughput: 0: 1765.8, 1: 1778.6. Samples: 49282270. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:26,875][101941] Avg episode reward: [(0, '9.130'), (1, '29.020')] +[2023-10-08 15:36:28,171][102897] Updated weights for policy 0, policy_version 96170 (0.0008) +[2023-10-08 15:36:28,434][102898] Updated weights for policy 1, policy_version 96330 (0.0008) +[2023-10-08 15:36:28,546][102897] Updated weights for policy 0, policy_version 96180 (0.0008) +[2023-10-08 15:36:28,801][102898] Updated weights for policy 1, policy_version 96340 (0.0009) +[2023-10-08 15:36:28,926][102897] Updated weights for policy 0, policy_version 96190 (0.0008) +[2023-10-08 15:36:29,170][102898] Updated weights for policy 1, policy_version 96350 (0.0007) +[2023-10-08 15:36:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 197165056. Throughput: 0: 1768.8, 1: 1774.3. Samples: 49304454. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:31,875][101941] Avg episode reward: [(0, '8.730'), (1, '31.580')] +[2023-10-08 15:36:32,660][102897] Updated weights for policy 0, policy_version 96200 (0.0007) +[2023-10-08 15:36:32,820][102898] Updated weights for policy 1, policy_version 96360 (0.0007) +[2023-10-08 15:36:33,028][102897] Updated weights for policy 0, policy_version 96210 (0.0007) +[2023-10-08 15:36:33,186][102898] Updated weights for policy 1, policy_version 96370 (0.0008) +[2023-10-08 15:36:33,394][102897] Updated weights for policy 0, policy_version 96220 (0.0009) +[2023-10-08 15:36:33,545][102898] Updated weights for policy 1, policy_version 96380 (0.0007) +[2023-10-08 15:36:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 197230592. Throughput: 0: 1767.6, 1: 1774.8. Samples: 49314366. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:36,876][101941] Avg episode reward: [(0, '8.680'), (1, '29.300')] +[2023-10-08 15:36:37,342][102897] Updated weights for policy 0, policy_version 96230 (0.0008) +[2023-10-08 15:36:37,527][102898] Updated weights for policy 1, policy_version 96390 (0.0009) +[2023-10-08 15:36:37,705][102897] Updated weights for policy 0, policy_version 96240 (0.0008) +[2023-10-08 15:36:37,905][102898] Updated weights for policy 1, policy_version 96400 (0.0009) +[2023-10-08 15:36:38,079][102897] Updated weights for policy 0, policy_version 96250 (0.0008) +[2023-10-08 15:36:38,263][102898] Updated weights for policy 1, policy_version 96410 (0.0009) +[2023-10-08 15:36:41,761][102897] Updated weights for policy 0, policy_version 96260 (0.0009) +[2023-10-08 15:36:41,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 197296128. Throughput: 0: 1768.9, 1: 1768.4. Samples: 49336370. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:41,876][101941] Avg episode reward: [(0, '9.540'), (1, '33.700')] +[2023-10-08 15:36:41,878][102760] Saving new best policy, reward=33.700! +[2023-10-08 15:36:42,122][102897] Updated weights for policy 0, policy_version 96270 (0.0007) +[2023-10-08 15:36:42,238][102898] Updated weights for policy 1, policy_version 96420 (0.0008) +[2023-10-08 15:36:42,493][102897] Updated weights for policy 0, policy_version 96280 (0.0007) +[2023-10-08 15:36:42,600][102898] Updated weights for policy 1, policy_version 96430 (0.0008) +[2023-10-08 15:36:42,970][102898] Updated weights for policy 1, policy_version 96440 (0.0009) +[2023-10-08 15:36:46,502][102897] Updated weights for policy 0, policy_version 96290 (0.0008) +[2023-10-08 15:36:46,837][102898] Updated weights for policy 1, policy_version 96450 (0.0010) +[2023-10-08 15:36:46,874][102897] Updated weights for policy 0, policy_version 96300 (0.0009) +[2023-10-08 15:36:46,875][101941] Fps is (10 sec: 13106.8, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 197361664. Throughput: 0: 1798.9, 1: 1785.9. Samples: 49358262. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:46,876][101941] Avg episode reward: [(0, '9.480'), (1, '30.310')] +[2023-10-08 15:36:47,195][102898] Updated weights for policy 1, policy_version 96460 (0.0007) +[2023-10-08 15:36:47,246][102897] Updated weights for policy 0, policy_version 96310 (0.0008) +[2023-10-08 15:36:47,554][102898] Updated weights for policy 1, policy_version 96470 (0.0007) +[2023-10-08 15:36:47,619][102897] Updated weights for policy 0, policy_version 96320 (0.0007) +[2023-10-08 15:36:47,922][102898] Updated weights for policy 1, policy_version 96480 (0.0010) +[2023-10-08 15:36:51,464][102897] Updated weights for policy 0, policy_version 96330 (0.0007) +[2023-10-08 15:36:51,786][102898] Updated weights for policy 1, policy_version 96490 (0.0009) +[2023-10-08 15:36:51,839][102897] Updated weights for policy 0, policy_version 96340 (0.0010) +[2023-10-08 15:36:51,875][101941] Fps is (10 sec: 13107.4, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 197427200. Throughput: 0: 1761.1, 1: 1767.4. Samples: 49367890. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:51,876][101941] Avg episode reward: [(0, '9.640'), (1, '30.730')] +[2023-10-08 15:36:52,152][102898] Updated weights for policy 1, policy_version 96500 (0.0007) +[2023-10-08 15:36:52,197][102897] Updated weights for policy 0, policy_version 96350 (0.0008) +[2023-10-08 15:36:52,508][102898] Updated weights for policy 1, policy_version 96510 (0.0008) +[2023-10-08 15:36:56,001][102897] Updated weights for policy 0, policy_version 96360 (0.0008) +[2023-10-08 15:36:56,369][102897] Updated weights for policy 0, policy_version 96370 (0.0007) +[2023-10-08 15:36:56,441][102898] Updated weights for policy 1, policy_version 96520 (0.0008) +[2023-10-08 15:36:56,740][102897] Updated weights for policy 0, policy_version 96380 (0.0007) +[2023-10-08 15:36:56,807][102898] Updated weights for policy 1, policy_version 96530 (0.0007) +[2023-10-08 15:36:56,875][101941] Fps is (10 sec: 13107.3, 60 sec: 13653.3, 300 sec: 14218.0). Total num frames: 197492736. Throughput: 0: 1796.0, 1: 1786.2. Samples: 49390294. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:36:56,876][101941] Avg episode reward: [(0, '9.720'), (1, '30.430')] +[2023-10-08 15:36:57,170][102898] Updated weights for policy 1, policy_version 96540 (0.0009) +[2023-10-08 15:37:00,457][102897] Updated weights for policy 0, policy_version 96390 (0.0008) +[2023-10-08 15:37:00,824][102897] Updated weights for policy 0, policy_version 96400 (0.0008) +[2023-10-08 15:37:00,913][102898] Updated weights for policy 1, policy_version 96550 (0.0009) +[2023-10-08 15:37:01,188][102897] Updated weights for policy 0, policy_version 96410 (0.0008) +[2023-10-08 15:37:01,274][102898] Updated weights for policy 1, policy_version 96560 (0.0007) +[2023-10-08 15:37:01,647][102898] Updated weights for policy 1, policy_version 96570 (0.0008) +[2023-10-08 15:37:01,875][101941] Fps is (10 sec: 19660.7, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 197623808. Throughput: 0: 1771.5, 1: 1780.4. Samples: 49410100. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:37:01,876][101941] Avg episode reward: [(0, '9.180'), (1, '32.150')] +[2023-10-08 15:37:05,113][102897] Updated weights for policy 0, policy_version 96420 (0.0008) +[2023-10-08 15:37:05,415][102898] Updated weights for policy 1, policy_version 96580 (0.0009) +[2023-10-08 15:37:05,480][102897] Updated weights for policy 0, policy_version 96430 (0.0010) +[2023-10-08 15:37:05,777][102898] Updated weights for policy 1, policy_version 96590 (0.0008) +[2023-10-08 15:37:05,846][102897] Updated weights for policy 0, policy_version 96440 (0.0007) +[2023-10-08 15:37:06,133][102898] Updated weights for policy 1, policy_version 96600 (0.0007) +[2023-10-08 15:37:06,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 197689344. Throughput: 0: 1791.9, 1: 1785.1. Samples: 49422060. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:37:06,876][101941] Avg episode reward: [(0, '9.380'), (1, '35.570')] +[2023-10-08 15:37:06,878][102760] Saving new best policy, reward=35.570! +[2023-10-08 15:37:09,478][102897] Updated weights for policy 0, policy_version 96450 (0.0008) +[2023-10-08 15:37:09,856][102897] Updated weights for policy 0, policy_version 96460 (0.0009) +[2023-10-08 15:37:10,006][102898] Updated weights for policy 1, policy_version 96610 (0.0008) +[2023-10-08 15:37:10,228][102897] Updated weights for policy 0, policy_version 96470 (0.0008) +[2023-10-08 15:37:10,372][102898] Updated weights for policy 1, policy_version 96620 (0.0008) +[2023-10-08 15:37:10,591][102897] Updated weights for policy 0, policy_version 96480 (0.0009) +[2023-10-08 15:37:10,742][102898] Updated weights for policy 1, policy_version 96630 (0.0008) +[2023-10-08 15:37:11,113][102898] Updated weights for policy 1, policy_version 96640 (0.0008) +[2023-10-08 15:37:11,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 197754880. Throughput: 0: 1773.2, 1: 1788.5. Samples: 49442546. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:37:11,876][101941] Avg episode reward: [(0, '8.960'), (1, '30.840')] +[2023-10-08 15:37:14,379][102897] Updated weights for policy 0, policy_version 96490 (0.0009) +[2023-10-08 15:37:14,746][102897] Updated weights for policy 0, policy_version 96500 (0.0009) +[2023-10-08 15:37:14,802][102898] Updated weights for policy 1, policy_version 96650 (0.0011) +[2023-10-08 15:37:15,113][102897] Updated weights for policy 0, policy_version 96510 (0.0007) +[2023-10-08 15:37:15,169][102898] Updated weights for policy 1, policy_version 96660 (0.0008) +[2023-10-08 15:37:15,531][102898] Updated weights for policy 1, policy_version 96670 (0.0011) +[2023-10-08 15:37:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 197820416. Throughput: 0: 1773.5, 1: 1767.0. Samples: 49463778. Policy #0 lag: (min: 13.0, avg: 37.0, max: 40.0) +[2023-10-08 15:37:16,876][101941] Avg episode reward: [(0, '9.230'), (1, '34.280')] +[2023-10-08 15:37:18,796][102897] Updated weights for policy 0, policy_version 96520 (0.0007) +[2023-10-08 15:37:19,162][102897] Updated weights for policy 0, policy_version 96530 (0.0007) +[2023-10-08 15:37:19,439][102898] Updated weights for policy 1, policy_version 96680 (0.0008) +[2023-10-08 15:37:19,529][102897] Updated weights for policy 0, policy_version 96540 (0.0008) +[2023-10-08 15:37:19,817][102898] Updated weights for policy 1, policy_version 96690 (0.0010) +[2023-10-08 15:37:20,178][102898] Updated weights for policy 1, policy_version 96700 (0.0007) +[2023-10-08 15:37:21,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14329.0). Total num frames: 197885952. Throughput: 0: 1780.6, 1: 1785.9. Samples: 49474860. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:21,876][101941] Avg episode reward: [(0, '9.370'), (1, '31.400')] +[2023-10-08 15:37:23,329][102897] Updated weights for policy 0, policy_version 96550 (0.0007) +[2023-10-08 15:37:23,701][102897] Updated weights for policy 0, policy_version 96560 (0.0008) +[2023-10-08 15:37:23,846][102898] Updated weights for policy 1, policy_version 96710 (0.0008) +[2023-10-08 15:37:24,067][102897] Updated weights for policy 0, policy_version 96570 (0.0008) +[2023-10-08 15:37:24,219][102898] Updated weights for policy 1, policy_version 96720 (0.0008) +[2023-10-08 15:37:24,584][102898] Updated weights for policy 1, policy_version 96730 (0.0008) +[2023-10-08 15:37:26,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 197951488. Throughput: 0: 1768.6, 1: 1772.0. Samples: 49495696. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:26,876][101941] Avg episode reward: [(0, '10.170'), (1, '33.080')] +[2023-10-08 15:37:27,815][102897] Updated weights for policy 0, policy_version 96580 (0.0008) +[2023-10-08 15:37:28,188][102897] Updated weights for policy 0, policy_version 96590 (0.0009) +[2023-10-08 15:37:28,408][102898] Updated weights for policy 1, policy_version 96740 (0.0007) +[2023-10-08 15:37:28,548][102897] Updated weights for policy 0, policy_version 96600 (0.0007) +[2023-10-08 15:37:28,811][102898] Updated weights for policy 1, policy_version 96750 (0.0008) +[2023-10-08 15:37:29,179][102898] Updated weights for policy 1, policy_version 96760 (0.0011) +[2023-10-08 15:37:31,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198017024. Throughput: 0: 1775.4, 1: 1775.6. Samples: 49518058. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:31,875][101941] Avg episode reward: [(0, '9.460'), (1, '31.120')] +[2023-10-08 15:37:32,257][102897] Updated weights for policy 0, policy_version 96610 (0.0008) +[2023-10-08 15:37:32,636][102897] Updated weights for policy 0, policy_version 96620 (0.0007) +[2023-10-08 15:37:32,884][102898] Updated weights for policy 1, policy_version 96770 (0.0010) +[2023-10-08 15:37:33,013][102897] Updated weights for policy 0, policy_version 96630 (0.0008) +[2023-10-08 15:37:33,265][102898] Updated weights for policy 1, policy_version 96780 (0.0008) +[2023-10-08 15:37:33,375][102897] Updated weights for policy 0, policy_version 96640 (0.0009) +[2023-10-08 15:37:33,628][102898] Updated weights for policy 1, policy_version 96790 (0.0008) +[2023-10-08 15:37:33,994][102898] Updated weights for policy 1, policy_version 96800 (0.0010) +[2023-10-08 15:37:36,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198082560. Throughput: 0: 1776.8, 1: 1777.6. Samples: 49527836. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:36,876][101941] Avg episode reward: [(0, '9.520'), (1, '30.500')] +[2023-10-08 15:37:37,245][102897] Updated weights for policy 0, policy_version 96650 (0.0010) +[2023-10-08 15:37:37,613][102897] Updated weights for policy 0, policy_version 96660 (0.0007) +[2023-10-08 15:37:37,695][102898] Updated weights for policy 1, policy_version 96810 (0.0008) +[2023-10-08 15:37:37,982][102897] Updated weights for policy 0, policy_version 96670 (0.0007) +[2023-10-08 15:37:38,066][102898] Updated weights for policy 1, policy_version 96820 (0.0008) +[2023-10-08 15:37:38,434][102898] Updated weights for policy 1, policy_version 96830 (0.0009) +[2023-10-08 15:37:41,867][102897] Updated weights for policy 0, policy_version 96680 (0.0008) +[2023-10-08 15:37:41,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198148096. Throughput: 0: 1772.3, 1: 1780.8. Samples: 49550184. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:41,876][101941] Avg episode reward: [(0, '9.100'), (1, '33.140')] +[2023-10-08 15:37:42,167][102898] Updated weights for policy 1, policy_version 96840 (0.0007) +[2023-10-08 15:37:42,237][102897] Updated weights for policy 0, policy_version 96690 (0.0007) +[2023-10-08 15:37:42,539][102898] Updated weights for policy 1, policy_version 96850 (0.0008) +[2023-10-08 15:37:42,605][102897] Updated weights for policy 0, policy_version 96700 (0.0008) +[2023-10-08 15:37:42,914][102898] Updated weights for policy 1, policy_version 96860 (0.0007) +[2023-10-08 15:37:46,333][102897] Updated weights for policy 0, policy_version 96710 (0.0008) +[2023-10-08 15:37:46,611][102898] Updated weights for policy 1, policy_version 96870 (0.0007) +[2023-10-08 15:37:46,698][102897] Updated weights for policy 0, policy_version 96720 (0.0007) +[2023-10-08 15:37:46,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198213632. Throughput: 0: 1798.2, 1: 1803.8. Samples: 49572192. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:46,876][101941] Avg episode reward: [(0, '9.010'), (1, '31.090')] +[2023-10-08 15:37:46,974][102898] Updated weights for policy 1, policy_version 96880 (0.0007) +[2023-10-08 15:37:47,069][102897] Updated weights for policy 0, policy_version 96730 (0.0007) +[2023-10-08 15:37:47,348][102898] Updated weights for policy 1, policy_version 96890 (0.0007) +[2023-10-08 15:37:50,821][102897] Updated weights for policy 0, policy_version 96740 (0.0008) +[2023-10-08 15:37:51,118][102898] Updated weights for policy 1, policy_version 96900 (0.0007) +[2023-10-08 15:37:51,191][102897] Updated weights for policy 0, policy_version 96750 (0.0007) +[2023-10-08 15:37:51,480][102898] Updated weights for policy 1, policy_version 96910 (0.0008) +[2023-10-08 15:37:51,555][102897] Updated weights for policy 0, policy_version 96760 (0.0007) +[2023-10-08 15:37:51,852][102898] Updated weights for policy 1, policy_version 96920 (0.0009) +[2023-10-08 15:37:51,875][101941] Fps is (10 sec: 16384.3, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 198311936. Throughput: 0: 1775.8, 1: 1787.2. Samples: 49582394. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:51,876][101941] Avg episode reward: [(0, '9.970'), (1, '25.250')] +[2023-10-08 15:37:55,499][102897] Updated weights for policy 0, policy_version 96770 (0.0008) +[2023-10-08 15:37:55,572][102898] Updated weights for policy 1, policy_version 96930 (0.0009) +[2023-10-08 15:37:55,866][102897] Updated weights for policy 0, policy_version 96780 (0.0009) +[2023-10-08 15:37:55,935][102898] Updated weights for policy 1, policy_version 96940 (0.0008) +[2023-10-08 15:37:56,228][102897] Updated weights for policy 0, policy_version 96790 (0.0008) +[2023-10-08 15:37:56,299][102898] Updated weights for policy 1, policy_version 96950 (0.0009) +[2023-10-08 15:37:56,601][102897] Updated weights for policy 0, policy_version 96800 (0.0007) +[2023-10-08 15:37:56,668][102898] Updated weights for policy 1, policy_version 96960 (0.0007) +[2023-10-08 15:37:56,875][101941] Fps is (10 sec: 19660.5, 60 sec: 15291.7, 300 sec: 14440.1). Total num frames: 198410240. Throughput: 0: 1799.1, 1: 1803.1. Samples: 49604648. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:37:56,876][101941] Avg episode reward: [(0, '9.750'), (1, '24.160')] +[2023-10-08 15:38:00,388][102898] Updated weights for policy 1, policy_version 96970 (0.0008) +[2023-10-08 15:38:00,493][102897] Updated weights for policy 0, policy_version 96810 (0.0009) +[2023-10-08 15:38:00,754][102898] Updated weights for policy 1, policy_version 96980 (0.0009) +[2023-10-08 15:38:00,860][102897] Updated weights for policy 0, policy_version 96820 (0.0007) +[2023-10-08 15:38:01,121][102898] Updated weights for policy 1, policy_version 96990 (0.0007) +[2023-10-08 15:38:01,234][102897] Updated weights for policy 0, policy_version 96830 (0.0007) +[2023-10-08 15:38:01,875][101941] Fps is (10 sec: 16383.8, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 198475776. Throughput: 0: 1764.4, 1: 1791.2. Samples: 49623784. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:38:01,876][101941] Avg episode reward: [(0, '9.330'), (1, '29.190')] +[2023-10-08 15:38:04,910][102898] Updated weights for policy 1, policy_version 97000 (0.0008) +[2023-10-08 15:38:04,943][102897] Updated weights for policy 0, policy_version 96840 (0.0008) +[2023-10-08 15:38:05,276][102898] Updated weights for policy 1, policy_version 97010 (0.0009) +[2023-10-08 15:38:05,309][102897] Updated weights for policy 0, policy_version 96850 (0.0009) +[2023-10-08 15:38:05,632][102898] Updated weights for policy 1, policy_version 97020 (0.0009) +[2023-10-08 15:38:05,676][102897] Updated weights for policy 0, policy_version 96860 (0.0007) +[2023-10-08 15:38:06,875][101941] Fps is (10 sec: 13107.5, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 198541312. Throughput: 0: 1787.4, 1: 1800.9. Samples: 49636332. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:38:06,875][101941] Avg episode reward: [(0, '8.620'), (1, '27.360')] +[2023-10-08 15:38:09,285][102898] Updated weights for policy 1, policy_version 97030 (0.0007) +[2023-10-08 15:38:09,388][102897] Updated weights for policy 0, policy_version 96870 (0.0007) +[2023-10-08 15:38:09,649][102898] Updated weights for policy 1, policy_version 97040 (0.0008) +[2023-10-08 15:38:09,758][102897] Updated weights for policy 0, policy_version 96880 (0.0008) +[2023-10-08 15:38:10,021][102898] Updated weights for policy 1, policy_version 97050 (0.0007) +[2023-10-08 15:38:10,129][102897] Updated weights for policy 0, policy_version 96890 (0.0007) +[2023-10-08 15:38:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 198606848. Throughput: 0: 1763.0, 1: 1791.0. Samples: 49655624. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:38:11,876][101941] Avg episode reward: [(0, '8.330'), (1, '27.760')] +[2023-10-08 15:38:13,823][102898] Updated weights for policy 1, policy_version 97060 (0.0009) +[2023-10-08 15:38:13,935][102897] Updated weights for policy 0, policy_version 96900 (0.0009) +[2023-10-08 15:38:14,201][102898] Updated weights for policy 1, policy_version 97070 (0.0008) +[2023-10-08 15:38:14,312][102897] Updated weights for policy 0, policy_version 96910 (0.0008) +[2023-10-08 15:38:14,575][102898] Updated weights for policy 1, policy_version 97080 (0.0008) +[2023-10-08 15:38:14,670][102897] Updated weights for policy 0, policy_version 96920 (0.0007) +[2023-10-08 15:38:16,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198672384. Throughput: 0: 1763.7, 1: 1794.4. Samples: 49678170. Policy #0 lag: (min: 21.0, avg: 21.0, max: 21.0) +[2023-10-08 15:38:16,876][101941] Avg episode reward: [(0, '9.100'), (1, '30.660')] +[2023-10-08 15:38:16,884][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000097088_99418112.pth... +[2023-10-08 15:38:16,885][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000096928_99254272.pth... +[2023-10-08 15:38:16,916][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000095424_97714176.pth +[2023-10-08 15:38:16,919][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000095264_97550336.pth +[2023-10-08 15:38:18,279][102898] Updated weights for policy 1, policy_version 97090 (0.0008) +[2023-10-08 15:38:18,512][102897] Updated weights for policy 0, policy_version 96930 (0.0008) +[2023-10-08 15:38:18,636][102898] Updated weights for policy 1, policy_version 97100 (0.0009) +[2023-10-08 15:38:18,890][102897] Updated weights for policy 0, policy_version 96940 (0.0008) +[2023-10-08 15:38:19,000][102898] Updated weights for policy 1, policy_version 97110 (0.0009) +[2023-10-08 15:38:19,260][102897] Updated weights for policy 0, policy_version 96950 (0.0008) +[2023-10-08 15:38:19,361][102898] Updated weights for policy 1, policy_version 97120 (0.0008) +[2023-10-08 15:38:19,628][102897] Updated weights for policy 0, policy_version 96960 (0.0008) +[2023-10-08 15:38:21,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198737920. Throughput: 0: 1774.8, 1: 1795.1. Samples: 49688480. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:21,875][101941] Avg episode reward: [(0, '9.910'), (1, '33.670')] +[2023-10-08 15:38:23,139][102898] Updated weights for policy 1, policy_version 97130 (0.0008) +[2023-10-08 15:38:23,347][102897] Updated weights for policy 0, policy_version 96970 (0.0008) +[2023-10-08 15:38:23,507][102898] Updated weights for policy 1, policy_version 97140 (0.0009) +[2023-10-08 15:38:23,721][102897] Updated weights for policy 0, policy_version 96980 (0.0008) +[2023-10-08 15:38:23,877][102898] Updated weights for policy 1, policy_version 97150 (0.0007) +[2023-10-08 15:38:24,094][102897] Updated weights for policy 0, policy_version 96990 (0.0007) +[2023-10-08 15:38:26,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 198803456. Throughput: 0: 1773.3, 1: 1792.3. Samples: 49710634. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:26,876][101941] Avg episode reward: [(0, '9.330'), (1, '27.890')] +[2023-10-08 15:38:27,793][102898] Updated weights for policy 1, policy_version 97160 (0.0010) +[2023-10-08 15:38:27,805][102897] Updated weights for policy 0, policy_version 97000 (0.0008) +[2023-10-08 15:38:28,157][102898] Updated weights for policy 1, policy_version 97170 (0.0009) +[2023-10-08 15:38:28,180][102897] Updated weights for policy 0, policy_version 97010 (0.0009) +[2023-10-08 15:38:28,529][102898] Updated weights for policy 1, policy_version 97180 (0.0007) +[2023-10-08 15:38:28,551][102897] Updated weights for policy 0, policy_version 97020 (0.0008) +[2023-10-08 15:38:31,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 198868992. Throughput: 0: 1782.8, 1: 1784.6. Samples: 49732724. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:31,876][101941] Avg episode reward: [(0, '9.330'), (1, '27.720')] +[2023-10-08 15:38:32,266][102898] Updated weights for policy 1, policy_version 97190 (0.0008) +[2023-10-08 15:38:32,436][102897] Updated weights for policy 0, policy_version 97030 (0.0007) +[2023-10-08 15:38:32,630][102898] Updated weights for policy 1, policy_version 97200 (0.0009) +[2023-10-08 15:38:32,806][102897] Updated weights for policy 0, policy_version 97040 (0.0008) +[2023-10-08 15:38:32,999][102898] Updated weights for policy 1, policy_version 97210 (0.0010) +[2023-10-08 15:38:33,185][102897] Updated weights for policy 0, policy_version 97050 (0.0008) +[2023-10-08 15:38:36,807][102898] Updated weights for policy 1, policy_version 97220 (0.0008) +[2023-10-08 15:38:36,838][102897] Updated weights for policy 0, policy_version 97060 (0.0007) +[2023-10-08 15:38:36,875][101941] Fps is (10 sec: 13107.1, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 198934528. Throughput: 0: 1773.4, 1: 1780.3. Samples: 49742310. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:36,876][101941] Avg episode reward: [(0, '9.560'), (1, '26.730')] +[2023-10-08 15:38:37,176][102898] Updated weights for policy 1, policy_version 97230 (0.0009) +[2023-10-08 15:38:37,209][102897] Updated weights for policy 0, policy_version 97070 (0.0007) +[2023-10-08 15:38:37,542][102898] Updated weights for policy 1, policy_version 97240 (0.0009) +[2023-10-08 15:38:37,589][102897] Updated weights for policy 0, policy_version 97080 (0.0007) +[2023-10-08 15:38:41,411][102897] Updated weights for policy 0, policy_version 97090 (0.0008) +[2023-10-08 15:38:41,451][102898] Updated weights for policy 1, policy_version 97250 (0.0008) +[2023-10-08 15:38:41,780][102897] Updated weights for policy 0, policy_version 97100 (0.0009) +[2023-10-08 15:38:41,814][102898] Updated weights for policy 1, policy_version 97260 (0.0008) +[2023-10-08 15:38:41,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199000064. Throughput: 0: 1779.2, 1: 1775.4. Samples: 49764604. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:41,875][101941] Avg episode reward: [(0, '9.890'), (1, '22.790')] +[2023-10-08 15:38:42,157][102897] Updated weights for policy 0, policy_version 97110 (0.0008) +[2023-10-08 15:38:42,182][102898] Updated weights for policy 1, policy_version 97270 (0.0007) +[2023-10-08 15:38:42,518][102897] Updated weights for policy 0, policy_version 97120 (0.0008) +[2023-10-08 15:38:42,547][102898] Updated weights for policy 1, policy_version 97280 (0.0007) +[2023-10-08 15:38:46,253][102897] Updated weights for policy 0, policy_version 97130 (0.0008) +[2023-10-08 15:38:46,404][102898] Updated weights for policy 1, policy_version 97290 (0.0007) +[2023-10-08 15:38:46,629][102897] Updated weights for policy 0, policy_version 97140 (0.0007) +[2023-10-08 15:38:46,766][102898] Updated weights for policy 1, policy_version 97300 (0.0008) +[2023-10-08 15:38:46,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199065600. Throughput: 0: 1802.8, 1: 1798.6. Samples: 49785848. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:46,875][101941] Avg episode reward: [(0, '9.270'), (1, '22.270')] +[2023-10-08 15:38:47,001][102897] Updated weights for policy 0, policy_version 97150 (0.0007) +[2023-10-08 15:38:47,141][102898] Updated weights for policy 1, policy_version 97310 (0.0008) +[2023-10-08 15:38:50,917][102898] Updated weights for policy 1, policy_version 97320 (0.0011) +[2023-10-08 15:38:50,925][102897] Updated weights for policy 0, policy_version 97160 (0.0007) +[2023-10-08 15:38:51,286][102898] Updated weights for policy 1, policy_version 97330 (0.0009) +[2023-10-08 15:38:51,295][102897] Updated weights for policy 0, policy_version 97170 (0.0008) +[2023-10-08 15:38:51,646][102898] Updated weights for policy 1, policy_version 97340 (0.0007) +[2023-10-08 15:38:51,660][102897] Updated weights for policy 0, policy_version 97180 (0.0008) +[2023-10-08 15:38:51,875][101941] Fps is (10 sec: 19660.6, 60 sec: 14745.6, 300 sec: 14440.1). Total num frames: 199196672. Throughput: 0: 1783.4, 1: 1779.2. Samples: 49796650. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:51,876][101941] Avg episode reward: [(0, '8.820'), (1, '23.560')] +[2023-10-08 15:38:55,347][102897] Updated weights for policy 0, policy_version 97190 (0.0008) +[2023-10-08 15:38:55,451][102898] Updated weights for policy 1, policy_version 97350 (0.0008) +[2023-10-08 15:38:55,717][102897] Updated weights for policy 0, policy_version 97200 (0.0009) +[2023-10-08 15:38:55,813][102898] Updated weights for policy 1, policy_version 97360 (0.0009) +[2023-10-08 15:38:56,089][102897] Updated weights for policy 0, policy_version 97210 (0.0007) +[2023-10-08 15:38:56,183][102898] Updated weights for policy 1, policy_version 97370 (0.0007) +[2023-10-08 15:38:56,875][101941] Fps is (10 sec: 19660.8, 60 sec: 14199.5, 300 sec: 14440.1). Total num frames: 199262208. Throughput: 0: 1806.6, 1: 1805.1. Samples: 49818150. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:38:56,875][101941] Avg episode reward: [(0, '9.040'), (1, '25.310')] +[2023-10-08 15:38:59,862][102897] Updated weights for policy 0, policy_version 97220 (0.0007) +[2023-10-08 15:39:00,031][102898] Updated weights for policy 1, policy_version 97380 (0.0007) +[2023-10-08 15:39:00,227][102897] Updated weights for policy 0, policy_version 97230 (0.0008) +[2023-10-08 15:39:00,419][102898] Updated weights for policy 1, policy_version 97390 (0.0008) +[2023-10-08 15:39:00,591][102897] Updated weights for policy 0, policy_version 97240 (0.0008) +[2023-10-08 15:39:00,781][102898] Updated weights for policy 1, policy_version 97400 (0.0008) +[2023-10-08 15:39:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14329.1). Total num frames: 199327744. Throughput: 0: 1775.7, 1: 1772.5. Samples: 49837842. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:39:01,876][101941] Avg episode reward: [(0, '9.060'), (1, '28.430')] +[2023-10-08 15:39:04,398][102898] Updated weights for policy 1, policy_version 97410 (0.0007) +[2023-10-08 15:39:04,462][102897] Updated weights for policy 0, policy_version 97250 (0.0007) +[2023-10-08 15:39:04,764][102898] Updated weights for policy 1, policy_version 97420 (0.0008) +[2023-10-08 15:39:04,829][102897] Updated weights for policy 0, policy_version 97260 (0.0007) +[2023-10-08 15:39:05,135][102898] Updated weights for policy 1, policy_version 97430 (0.0007) +[2023-10-08 15:39:05,199][102897] Updated weights for policy 0, policy_version 97270 (0.0008) +[2023-10-08 15:39:05,498][102898] Updated weights for policy 1, policy_version 97440 (0.0008) +[2023-10-08 15:39:05,572][102897] Updated weights for policy 0, policy_version 97280 (0.0008) +[2023-10-08 15:39:06,875][101941] Fps is (10 sec: 13107.0, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 199393280. Throughput: 0: 1796.9, 1: 1801.0. Samples: 49850388. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:39:06,876][101941] Avg episode reward: [(0, '9.650'), (1, '27.650')] +[2023-10-08 15:39:09,295][102898] Updated weights for policy 1, policy_version 97450 (0.0008) +[2023-10-08 15:39:09,412][102897] Updated weights for policy 0, policy_version 97290 (0.0008) +[2023-10-08 15:39:09,664][102898] Updated weights for policy 1, policy_version 97460 (0.0007) +[2023-10-08 15:39:09,780][102897] Updated weights for policy 0, policy_version 97300 (0.0008) +[2023-10-08 15:39:10,035][102898] Updated weights for policy 1, policy_version 97470 (0.0008) +[2023-10-08 15:39:10,148][102897] Updated weights for policy 0, policy_version 97310 (0.0008) +[2023-10-08 15:39:11,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199458816. Throughput: 0: 1762.3, 1: 1775.7. Samples: 49869844. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:39:11,876][101941] Avg episode reward: [(0, '9.850'), (1, '28.040')] +[2023-10-08 15:39:13,804][102898] Updated weights for policy 1, policy_version 97480 (0.0009) +[2023-10-08 15:39:14,173][102898] Updated weights for policy 1, policy_version 97490 (0.0010) +[2023-10-08 15:39:14,231][102897] Updated weights for policy 0, policy_version 97320 (0.0007) +[2023-10-08 15:39:14,540][102898] Updated weights for policy 1, policy_version 97500 (0.0007) +[2023-10-08 15:39:14,611][102897] Updated weights for policy 0, policy_version 97330 (0.0007) +[2023-10-08 15:39:14,971][102897] Updated weights for policy 0, policy_version 97340 (0.0010) +[2023-10-08 15:39:16,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199524352. Throughput: 0: 1761.1, 1: 1781.0. Samples: 49892118. Policy #0 lag: (min: 3.0, avg: 3.0, max: 3.0) +[2023-10-08 15:39:16,876][101941] Avg episode reward: [(0, '9.580'), (1, '29.820')] +[2023-10-08 15:39:18,321][102898] Updated weights for policy 1, policy_version 97510 (0.0007) +[2023-10-08 15:39:18,682][102898] Updated weights for policy 1, policy_version 97520 (0.0007) +[2023-10-08 15:39:18,728][102897] Updated weights for policy 0, policy_version 97350 (0.0007) +[2023-10-08 15:39:19,052][102898] Updated weights for policy 1, policy_version 97530 (0.0007) +[2023-10-08 15:39:19,095][102897] Updated weights for policy 0, policy_version 97360 (0.0008) +[2023-10-08 15:39:19,458][102897] Updated weights for policy 0, policy_version 97370 (0.0010) +[2023-10-08 15:39:21,875][101941] Fps is (10 sec: 13106.9, 60 sec: 14199.4, 300 sec: 14218.0). Total num frames: 199589888. Throughput: 0: 1774.8, 1: 1781.1. Samples: 49902326. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:21,876][101941] Avg episode reward: [(0, '9.600'), (1, '37.830')] +[2023-10-08 15:39:21,878][102760] Saving new best policy, reward=37.830! +[2023-10-08 15:39:22,866][102898] Updated weights for policy 1, policy_version 97540 (0.0008) +[2023-10-08 15:39:23,158][102897] Updated weights for policy 0, policy_version 97380 (0.0008) +[2023-10-08 15:39:23,230][102898] Updated weights for policy 1, policy_version 97550 (0.0008) +[2023-10-08 15:39:23,527][102897] Updated weights for policy 0, policy_version 97390 (0.0008) +[2023-10-08 15:39:23,589][102898] Updated weights for policy 1, policy_version 97560 (0.0007) +[2023-10-08 15:39:23,908][102897] Updated weights for policy 0, policy_version 97400 (0.0009) +[2023-10-08 15:39:26,875][101941] Fps is (10 sec: 13107.3, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199655424. Throughput: 0: 1760.4, 1: 1783.7. Samples: 49924088. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:26,876][101941] Avg episode reward: [(0, '9.770'), (1, '35.780')] +[2023-10-08 15:39:27,239][102898] Updated weights for policy 1, policy_version 97570 (0.0007) +[2023-10-08 15:39:27,557][102897] Updated weights for policy 0, policy_version 97410 (0.0008) +[2023-10-08 15:39:27,608][102898] Updated weights for policy 1, policy_version 97580 (0.0007) +[2023-10-08 15:39:27,921][102897] Updated weights for policy 0, policy_version 97420 (0.0008) +[2023-10-08 15:39:27,977][102898] Updated weights for policy 1, policy_version 97590 (0.0007) +[2023-10-08 15:39:28,287][102897] Updated weights for policy 0, policy_version 97430 (0.0008) +[2023-10-08 15:39:28,343][102898] Updated weights for policy 1, policy_version 97600 (0.0010) +[2023-10-08 15:39:28,658][102897] Updated weights for policy 0, policy_version 97440 (0.0007) +[2023-10-08 15:39:31,875][101941] Fps is (10 sec: 13107.6, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199720960. Throughput: 0: 1775.7, 1: 1797.0. Samples: 49946620. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:31,875][101941] Avg episode reward: [(0, '9.660'), (1, '33.580')] +[2023-10-08 15:39:31,997][102898] Updated weights for policy 1, policy_version 97610 (0.0009) +[2023-10-08 15:39:32,363][102898] Updated weights for policy 1, policy_version 97620 (0.0007) +[2023-10-08 15:39:32,438][102897] Updated weights for policy 0, policy_version 97450 (0.0007) +[2023-10-08 15:39:32,731][102898] Updated weights for policy 1, policy_version 97630 (0.0007) +[2023-10-08 15:39:32,808][102897] Updated weights for policy 0, policy_version 97460 (0.0007) +[2023-10-08 15:39:33,179][102897] Updated weights for policy 0, policy_version 97470 (0.0007) +[2023-10-08 15:39:36,545][102898] Updated weights for policy 1, policy_version 97640 (0.0008) +[2023-10-08 15:39:36,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199786496. Throughput: 0: 1761.2, 1: 1787.6. Samples: 49956346. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:36,875][101941] Avg episode reward: [(0, '9.330'), (1, '33.580')] +[2023-10-08 15:39:36,890][102897] Updated weights for policy 0, policy_version 97480 (0.0007) +[2023-10-08 15:39:36,911][102898] Updated weights for policy 1, policy_version 97650 (0.0008) +[2023-10-08 15:39:37,265][102897] Updated weights for policy 0, policy_version 97490 (0.0007) +[2023-10-08 15:39:37,279][102898] Updated weights for policy 1, policy_version 97660 (0.0008) +[2023-10-08 15:39:37,631][102897] Updated weights for policy 0, policy_version 97500 (0.0009) +[2023-10-08 15:39:40,949][102898] Updated weights for policy 1, policy_version 97670 (0.0008) +[2023-10-08 15:39:41,310][102898] Updated weights for policy 1, policy_version 97680 (0.0008) +[2023-10-08 15:39:41,436][102897] Updated weights for policy 0, policy_version 97510 (0.0007) +[2023-10-08 15:39:41,674][102898] Updated weights for policy 1, policy_version 97690 (0.0007) +[2023-10-08 15:39:41,794][102897] Updated weights for policy 0, policy_version 97520 (0.0007) +[2023-10-08 15:39:41,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.5, 300 sec: 14218.0). Total num frames: 199852032. Throughput: 0: 1776.7, 1: 1801.7. Samples: 49979178. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:41,875][101941] Avg episode reward: [(0, '9.550'), (1, '34.970')] +[2023-10-08 15:39:42,164][102897] Updated weights for policy 0, policy_version 97530 (0.0010) +[2023-10-08 15:39:45,394][102898] Updated weights for policy 1, policy_version 97700 (0.0009) +[2023-10-08 15:39:45,759][102898] Updated weights for policy 1, policy_version 97710 (0.0010) +[2023-10-08 15:39:46,101][102897] Updated weights for policy 0, policy_version 97540 (0.0008) +[2023-10-08 15:39:46,129][102898] Updated weights for policy 1, policy_version 97720 (0.0008) +[2023-10-08 15:39:46,472][102897] Updated weights for policy 0, policy_version 97550 (0.0008) +[2023-10-08 15:39:46,848][102897] Updated weights for policy 0, policy_version 97560 (0.0007) +[2023-10-08 15:39:46,875][101941] Fps is (10 sec: 16384.1, 60 sec: 14745.6, 300 sec: 14329.1). Total num frames: 199950336. Throughput: 0: 1792.9, 1: 1798.4. Samples: 49999452. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:46,875][101941] Avg episode reward: [(0, '9.430'), (1, '30.610')] +[2023-10-08 15:39:49,916][102898] Updated weights for policy 1, policy_version 97730 (0.0009) +[2023-10-08 15:39:50,286][102898] Updated weights for policy 1, policy_version 97740 (0.0010) +[2023-10-08 15:39:50,638][102897] Updated weights for policy 0, policy_version 97570 (0.0009) +[2023-10-08 15:39:50,661][102898] Updated weights for policy 1, policy_version 97750 (0.0010) +[2023-10-08 15:39:51,012][102897] Updated weights for policy 0, policy_version 97580 (0.0008) +[2023-10-08 15:39:51,027][102898] Updated weights for policy 1, policy_version 97760 (0.0010) +[2023-10-08 15:39:51,381][102897] Updated weights for policy 0, policy_version 97590 (0.0010) +[2023-10-08 15:39:51,755][102897] Updated weights for policy 0, policy_version 97600 (0.0010) +[2023-10-08 15:39:51,875][101941] Fps is (10 sec: 19660.3, 60 sec: 14199.4, 300 sec: 14440.1). Total num frames: 200048640. Throughput: 0: 1768.4, 1: 1798.4. Samples: 50010896. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:51,876][101941] Avg episode reward: [(0, '8.780'), (1, '29.540')] +[2023-10-08 15:39:54,690][102898] Updated weights for policy 1, policy_version 97770 (0.0008) +[2023-10-08 15:39:55,052][102898] Updated weights for policy 1, policy_version 97780 (0.0007) +[2023-10-08 15:39:55,416][102898] Updated weights for policy 1, policy_version 97790 (0.0009) +[2023-10-08 15:39:55,560][102897] Updated weights for policy 0, policy_version 97610 (0.0009) +[2023-10-08 15:39:55,929][102897] Updated weights for policy 0, policy_version 97620 (0.0009) +[2023-10-08 15:39:56,313][102897] Updated weights for policy 0, policy_version 97630 (0.0009) +[2023-10-08 15:39:56,875][101941] Fps is (10 sec: 16383.6, 60 sec: 14199.4, 300 sec: 14329.1). Total num frames: 200114176. Throughput: 0: 1801.7, 1: 1795.9. Samples: 50031736. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:39:56,876][101941] Avg episode reward: [(0, '8.670'), (1, '28.420')] +[2023-10-08 15:39:59,109][102898] Updated weights for policy 1, policy_version 97800 (0.0009) +[2023-10-08 15:39:59,484][102898] Updated weights for policy 1, policy_version 97810 (0.0008) +[2023-10-08 15:39:59,857][102898] Updated weights for policy 1, policy_version 97820 (0.0007) +[2023-10-08 15:40:00,121][102897] Updated weights for policy 0, policy_version 97640 (0.0008) +[2023-10-08 15:40:00,497][102897] Updated weights for policy 0, policy_version 97650 (0.0009) +[2023-10-08 15:40:00,854][102897] Updated weights for policy 0, policy_version 97660 (0.0008) +[2023-10-08 15:40:01,875][101941] Fps is (10 sec: 13107.2, 60 sec: 14199.4, 300 sec: 14329.0). Total num frames: 200179712. Throughput: 0: 1772.1, 1: 1795.8. Samples: 50052672. Policy #0 lag: (min: 31.0, avg: 31.0, max: 31.0) +[2023-10-08 15:40:01,876][101941] Avg episode reward: [(0, '9.130'), (1, '25.760')] +[2023-10-08 15:40:03,601][102898] Updated weights for policy 1, policy_version 97830 (0.0007) +[2023-10-08 15:40:03,967][102898] Updated weights for policy 1, policy_version 97840 (0.0007) +[2023-10-08 15:40:04,338][102898] Updated weights for policy 1, policy_version 97850 (0.0007) +[2023-10-08 15:40:04,556][102936] Stopping RolloutWorker_w5... +[2023-10-08 15:40:04,556][102941] Stopping RolloutWorker_w10... +[2023-10-08 15:40:04,556][102935] Stopping RolloutWorker_w2... +[2023-10-08 15:40:04,557][102941] Loop rollout_proc10_evt_loop terminating... +[2023-10-08 15:40:04,557][102936] Loop rollout_proc5_evt_loop terminating... +[2023-10-08 15:40:04,557][102935] Loop rollout_proc2_evt_loop terminating... +[2023-10-08 15:40:04,557][102944] Stopping RolloutWorker_w13... +[2023-10-08 15:40:04,556][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000097856_100204544.pth... +[2023-10-08 15:40:04,557][102942] Stopping RolloutWorker_w11... +[2023-10-08 15:40:04,557][102932] Stopping RolloutWorker_w3... +[2023-10-08 15:40:04,557][103679] Stopping RolloutWorker_w15... +[2023-10-08 15:40:04,557][102940] Stopping RolloutWorker_w9... +[2023-10-08 15:40:04,557][101941] Component RolloutWorker_w5 stopped! +[2023-10-08 15:40:04,557][102944] Loop rollout_proc13_evt_loop terminating... +[2023-10-08 15:40:04,557][102942] Loop rollout_proc11_evt_loop terminating... +[2023-10-08 15:40:04,557][102932] Loop rollout_proc3_evt_loop terminating... +[2023-10-08 15:40:04,557][103679] Loop rollout_proc15_evt_loop terminating... +[2023-10-08 15:40:04,557][102940] Loop rollout_proc9_evt_loop terminating... +[2023-10-08 15:40:04,557][101941] Component RolloutWorker_w10 stopped! +[2023-10-08 15:40:04,558][101941] Component RolloutWorker_w2 stopped! +[2023-10-08 15:40:04,558][102930] Stopping RolloutWorker_w0... +[2023-10-08 15:40:04,558][102930] Loop rollout_proc0_evt_loop terminating... +[2023-10-08 15:40:04,558][101941] Component RolloutWorker_w13 stopped! +[2023-10-08 15:40:04,559][102939] Stopping RolloutWorker_w8... +[2023-10-08 15:40:04,559][101941] Component RolloutWorker_w9 stopped! +[2023-10-08 15:40:04,559][102939] Loop rollout_proc8_evt_loop terminating... +[2023-10-08 15:40:04,559][101941] Component RolloutWorker_w11 stopped! +[2023-10-08 15:40:04,559][101941] Component RolloutWorker_w3 stopped! +[2023-10-08 15:40:04,560][102934] Stopping RolloutWorker_w4... +[2023-10-08 15:40:04,560][102943] Stopping RolloutWorker_w12... +[2023-10-08 15:40:04,560][101941] Component RolloutWorker_w15 stopped! +[2023-10-08 15:40:04,560][102934] Loop rollout_proc4_evt_loop terminating... +[2023-10-08 15:40:04,560][102943] Loop rollout_proc12_evt_loop terminating... +[2023-10-08 15:40:04,560][101941] Component Batcher_1 stopped! +[2023-10-08 15:40:04,560][102937] Stopping RolloutWorker_w6... +[2023-10-08 15:40:04,560][103647] Stopping RolloutWorker_w14... +[2023-10-08 15:40:04,561][101941] Component RolloutWorker_w0 stopped! +[2023-10-08 15:40:04,561][102937] Loop rollout_proc6_evt_loop terminating... +[2023-10-08 15:40:04,561][103647] Loop rollout_proc14_evt_loop terminating... +[2023-10-08 15:40:04,561][101941] Component RolloutWorker_w8 stopped! +[2023-10-08 15:40:04,561][101941] Component RolloutWorker_w4 stopped! +[2023-10-08 15:40:04,562][101941] Component RolloutWorker_w12 stopped! +[2023-10-08 15:40:04,562][101941] Component RolloutWorker_w6 stopped! +[2023-10-08 15:40:04,557][102760] Stopping Batcher_1... +[2023-10-08 15:40:04,562][101941] Component RolloutWorker_w14 stopped! +[2023-10-08 15:40:04,562][102933] Stopping RolloutWorker_w1... +[2023-10-08 15:40:04,562][101941] Component RolloutWorker_w1 stopped! +[2023-10-08 15:40:04,563][102938] Stopping RolloutWorker_w7... +[2023-10-08 15:40:04,563][102933] Loop rollout_proc1_evt_loop terminating... +[2023-10-08 15:40:04,563][101941] Component RolloutWorker_w7 stopped! +[2023-10-08 15:40:04,563][102938] Loop rollout_proc7_evt_loop terminating... +[2023-10-08 15:40:04,573][101941] Component Batcher_0 stopped! +[2023-10-08 15:40:04,573][102634] Stopping Batcher_0... +[2023-10-08 15:40:04,574][102634] Loop batcher_evt_loop terminating... +[2023-10-08 15:40:04,585][102898] Weights refcount: 2 0 +[2023-10-08 15:40:04,586][102898] Stopping InferenceWorker_p1-w0... +[2023-10-08 15:40:04,587][102898] Loop inference_proc1-0_evt_loop terminating... +[2023-10-08 15:40:04,586][101941] Component InferenceWorker_p1-w0 stopped! +[2023-10-08 15:40:04,576][102760] Loop batcher_evt_loop terminating... +[2023-10-08 15:40:04,594][102897] Weights refcount: 2 0 +[2023-10-08 15:40:04,596][102897] Stopping InferenceWorker_p0-w0... +[2023-10-08 15:40:04,596][102897] Loop inference_proc0-0_evt_loop terminating... +[2023-10-08 15:40:04,596][101941] Component InferenceWorker_p0-w0 stopped! +[2023-10-08 15:40:04,602][102760] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000096256_98566144.pth +[2023-10-08 15:40:04,609][102760] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p1/checkpoint_000097856_100204544.pth... +[2023-10-08 15:40:04,665][102760] Stopping LearnerWorker_p1... +[2023-10-08 15:40:04,665][102760] Loop learner_proc1_evt_loop terminating... +[2023-10-08 15:40:04,665][101941] Component LearnerWorker_p1 stopped! +[2023-10-08 15:40:05,596][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000097696_100040704.pth... +[2023-10-08 15:40:05,623][102634] Removing ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000096096_98402304.pth +[2023-10-08 15:40:05,627][102634] Saving ./train_atari/atari_asteroid_APPO/checkpoint_p0/checkpoint_000097696_100040704.pth... +[2023-10-08 15:40:05,659][102634] Stopping LearnerWorker_p0... +[2023-10-08 15:40:05,660][102634] Loop learner_proc0_evt_loop terminating... +[2023-10-08 15:40:05,660][101941] Component LearnerWorker_p0 stopped! +[2023-10-08 15:40:05,661][101941] Waiting for process learner_proc0 to stop... +[2023-10-08 15:40:06,191][101941] Waiting for process learner_proc1 to stop... +[2023-10-08 15:40:06,192][101941] Waiting for process inference_proc0-0 to join... +[2023-10-08 15:40:06,193][101941] Waiting for process inference_proc1-0 to join... +[2023-10-08 15:40:06,193][101941] Waiting for process rollout_proc0 to join... +[2023-10-08 15:40:06,194][101941] Waiting for process rollout_proc1 to join... +[2023-10-08 15:40:06,195][101941] Waiting for process rollout_proc2 to join... +[2023-10-08 15:40:06,196][101941] Waiting for process rollout_proc3 to join... +[2023-10-08 15:40:06,196][101941] Waiting for process rollout_proc4 to join... +[2023-10-08 15:40:06,197][101941] Waiting for process rollout_proc5 to join... +[2023-10-08 15:40:06,198][101941] Waiting for process rollout_proc6 to join... +[2023-10-08 15:40:06,199][101941] Waiting for process rollout_proc7 to join... +[2023-10-08 15:40:06,199][101941] Waiting for process rollout_proc8 to join... +[2023-10-08 15:40:06,200][101941] Waiting for process rollout_proc9 to join... +[2023-10-08 15:40:06,200][101941] Waiting for process rollout_proc10 to join... +[2023-10-08 15:40:06,200][101941] Waiting for process rollout_proc11 to join... +[2023-10-08 15:40:06,201][101941] Waiting for process rollout_proc12 to join... +[2023-10-08 15:40:06,201][101941] Waiting for process rollout_proc13 to join... +[2023-10-08 15:40:06,202][101941] Waiting for process rollout_proc14 to join... +[2023-10-08 15:40:06,202][101941] Waiting for process rollout_proc15 to join... +[2023-10-08 15:40:06,202][101941] Batcher 0 profile tree view: +batching: 171.0279, releasing_batches: 0.0929 +[2023-10-08 15:40:06,204][101941] Batcher 1 profile tree view: +batching: 169.7871, releasing_batches: 0.0925 +[2023-10-08 15:40:06,205][101941] InferenceWorker_p0-w0 profile tree view: +wait_policy: 0.0001 + wait_policy_total: 1970.7953 +update_model: 201.2267 + weight_update: 0.0008 +one_step: 0.0090 + handle_policy_step: 11171.5407 + deserialize: 63.0314, stack: 190.6981, obs_to_device_normalize: 2478.2967, forward: 5033.6175, prepare_outputs: 2464.9669, send_messages: 458.3914 +[2023-10-08 15:40:06,205][101941] InferenceWorker_p1-w0 profile tree view: +wait_policy: 0.0001 + wait_policy_total: 2021.7401 +update_model: 202.6953 + weight_update: 0.0007 +one_step: 0.0025 + handle_policy_step: 11116.2784 + deserialize: 62.4807, stack: 189.6100, obs_to_device_normalize: 2488.6581, forward: 5031.1309, prepare_outputs: 2411.8007, send_messages: 451.6470 +[2023-10-08 15:40:06,205][101941] Learner 0 profile tree view: +misc: 0.0179, prepare_batch: 261.5680 +train: 3640.3996 + epoch_init: 0.1921, minibatch_init: 12.8987, losses_postprocess: 896.2134, kl_divergence: 31.4947, update: 389.3411, after_optimizer: 2123.3663 + calculate_losses: 169.8546 + losses_init: 0.5065, forward_head: 59.4638, bptt_initial: 1.4370, bptt: 2.0005, tail: 37.7696, advantages_returns: 11.0680, losses: 43.9035 +[2023-10-08 15:40:06,206][101941] Learner 1 profile tree view: +misc: 0.0193, prepare_batch: 262.5004 +train: 3608.3261 + epoch_init: 0.1902, minibatch_init: 13.3086, losses_postprocess: 888.9247, kl_divergence: 31.0962, update: 385.4054, after_optimizer: 2106.8407 + calculate_losses: 165.6187 + losses_init: 0.3784, forward_head: 55.6647, bptt_initial: 1.4469, bptt: 2.0263, tail: 37.8630, advantages_returns: 11.0136, losses: 43.5468 +[2023-10-08 15:40:06,206][101941] RolloutWorker_w0 profile tree view: +wait_for_trajectories: 1.2392, enqueue_policy_requests: 411.7840, process_policy_outputs: 192.8088, env_step: 6659.5815, finalize_trajectories: 3.9178, complete_rollouts: 2.9180 +post_env_step: 379.1797 + process_env_step: 86.1744 +[2023-10-08 15:40:06,206][101941] RolloutWorker_w15 profile tree view: +wait_for_trajectories: 1.2036, enqueue_policy_requests: 405.6322, process_policy_outputs: 190.1012, env_step: 6657.5732, finalize_trajectories: 3.3736, complete_rollouts: 2.8807 +post_env_step: 375.8591 + process_env_step: 85.2973 +[2023-10-08 15:40:06,207][101941] Loop Runner_EvtLoop terminating... +[2023-10-08 15:40:06,207][101941] Runner profile tree view: +main_loop: 14024.8015 +[2023-10-08 15:40:06,207][101941] Collected {0: 100040704, 1: 100204544}, FPS: 14277.9